MCHAD

Multi-Class Hypersphere Anomaly Detection (MCHAD) can be seen as a multi-class generalization of Deep One-Class Learning, where there are several centers \(\{\mu_1, \mu_2, ..., \mu_C\}\) in the output space of the model, one for each of the \(C\) classes. During training, the representation \(f_{\theta}(x)\) of an input \(x\) from class \(y\) is drawn towards the corresponding center \(\mu_y\).

In contrast to Class Anchor Clustering, the position of the class-centers can be learned, and the dimensionality of the output space can be chosen freely. Also, the method is able to incorporate outliers into the training. On the downside, MCHAD has more hyperparameters.

Here, we train the model for 10 epochs on the CIFAR10 dataset, using a backbone pre-trained on the \(32 \times 32\) resized version of ImageNet (excluding the CIFAR10 classes) as a foundation. We use TinyImages300k as training outlier data and the Textures dataset as OOD test data.

You can run this example with:

python examples/loss/supervised/mchad.py

 import torch
 from torch.optim.lr_scheduler import CosineAnnealingLR
 from torch.optim import Adam
 from torch.utils.data import DataLoader, random_split
 from torchmetrics import Accuracy
 from torchvision.datasets import CIFAR10
 from tqdm import tqdm
 import math

 from pytorch_ood.dataset.img import Textures, TinyImages300k
 from pytorch_ood.loss import MCHADLoss
 from pytorch_ood.model import WideResNet
 from pytorch_ood.utils import OODMetrics, ToUnknown, fix_random_seed, is_known

 # Fix the random seed first (presumably seeds the RNGs used below, e.g. by
 # random_split and weight initialisation -- confirm in pytorch_ood.utils).
 fix_random_seed(123)

 data_root = "data"  # passed as ``root`` to every dataset below
 n_epochs = 10
 device = "cuda:0"  # model, loss and input batches are moved to this device
 embedding_dim = 7  # dimensionality of output space
 margin = math.sqrt(embedding_dim)  # handed to MCHADLoss as ``margin``
 batch_size = 256

 # input transform for the "imagenet32-nocifar" setting; the same key is used
 # for the pre-trained weights when the model is created
 trans = WideResNet.transform_for("imagenet32-nocifar")

 # setup IN training data
 data_in_train = CIFAR10(root=data_root, train=True, download=True, transform=trans)

 # setup OOD training data, use ToUnknown() to mark labels as OOD.
 # This is the full outlier pool; a random subset with the same size as the
 # IN training data is drawn from it further below.
 tiny300k = TinyImages300k(
     root=data_root, download=True, transform=trans, target_transform=ToUnknown()
 )

 # setup IN test data (no download=True here: the files were already fetched
 # into data_root by the training set above)
 data_in_test = CIFAR10(root=data_root, train=False, transform=trans)

 # setup OOD test data, use ToUnknown() to mark labels as OOD
 data_out_test = Textures(
     root=data_root, download=True, transform=trans, target_transform=ToUnknown()
 )


 # create data loaders
 # the test loader iterates over IN and OOD test data combined, unshuffled
 test_loader = DataLoader(
     data_in_test + data_out_test, batch_size=batch_size, num_workers=16
 )

 # draw a random outlier subset with len(data_in_train) samples; the remainder
 # of the split is discarded
 data_out_train, _ = random_split(
     tiny300k, [len(data_in_train), len(tiny300k) - len(data_in_train)]
 )
 # the training loader mixes IN data and the outlier subset in shuffled batches
 train_loader = DataLoader(
     data_in_train + data_out_train, batch_size=batch_size, shuffle=True, num_workers=16
 )

Create the DNN, pre-trained on ImageNet excluding the CIFAR10 classes. We have to replace the final layer so that the model outputs embeddings with the chosen dimensionality of the output space instead of class logits.

 # build the network with a 1000-way head and load the "imagenet32-nocifar"
 # pre-trained weights
 model = WideResNet(num_classes=1000, pretrained="imagenet32-nocifar")
 # swap the head for a fresh linear layer that maps the backbone features to
 # embedding_dim outputs
 model.fc = torch.nn.Linear(model.fc.in_features, embedding_dim)
 model.to(device)

 # NOTE(review): only model.parameters() are handed to the optimizer. If
 # MCHADLoss keeps its class centers as learnable parameters, they are not
 # updated by this optimizer -- confirm whether that is intended.
 opti = Adam(model.parameters())
 criterion = MCHADLoss(
     n_classes=10, n_dim=embedding_dim, weight_oe=0.01, weight_center=2, margin=margin
 ).to(device)
 # T_max is the total number of batches over all epochs, because the training
 # loop calls scheduler.step() once per batch
 scheduler = CosineAnnealingLR(opti, T_max=n_epochs * len(train_loader))

Define a function that evaluates the model

 def test():
     """
     Evaluate the current model on ``test_loader``.

     Prints the result of ``OODMetrics.compute()`` and the classification
     accuracy over the samples selected by ``is_known``, then switches the
     model back to training mode.
     """
     ood_metrics = OODMetrics()
     accuracy = Accuracy(num_classes=10)

     model.eval()

     with torch.no_grad():
         with tqdm(test_loader, desc="Testing") as progress:
             for inputs, labels in progress:
                 # embed the batch and measure the distance to every center
                 embeddings = model(inputs.to(device))
                 dists = criterion.distance(embeddings).cpu()

                 # the smallest distance per sample is passed to the OOD
                 # metrics, the index of that center is the predicted class
                 nearest = dists.min(dim=1)
                 ood_metrics.update(nearest.values, labels)

                 # accuracy only sees the samples that is_known() selects
                 known_mask = is_known(labels)
                 if known_mask.any():
                     accuracy.update(nearest.indices[known_mask], labels[known_mask])

     print(ood_metrics.compute())
     print(f"Accuracy: {accuracy.compute().item():.2%}")
     model.train()

Start training

 for epoch in range(n_epochs):
     print(f"Epoch {epoch}")
     # exponential moving average of the loss, only used for the progress bar;
     # None marks "no batch seen yet in this epoch"
     loss_ema = None

     with tqdm(train_loader, desc=f"Epoch {epoch}") as bar:
         for x, y in bar:
             # calculate embeddings
             z = model(x.to(device))
             # calculate the distance of each embedding to each center
             distances = criterion.distance(z)
             # calculate MCHAD loss, based on distances to centers.
             # The labels are moved to the configured ``device`` (same as the
             # inputs and the model) instead of the implicit default CUDA
             # device, so changing ``device`` keeps everything in one place.
             loss = criterion(distances, y.to(device))
             opti.zero_grad()
             loss.backward()
             opti.step()
             # the learning-rate schedule advances once per batch
             scheduler.step()

             # compare against None explicitly: a smoothed loss of exactly 0.0
             # is a valid value and must not restart the average
             loss_value = loss.item()
             loss_ema = (
                 loss_value if loss_ema is None else 0.99 * loss_ema + 0.01 * loss_value
             )
             bar.set_postfix_str(
                 f"loss: {loss_ema:.3f} lr: {scheduler.get_last_lr()[0]:.6f}"
             )

     # evaluate after every epoch
     test()

     # create new random split, so that the next epoch sees a different subset
     # of the outlier data; the split sizes are the same as for the initial
     # loader, so the number of batches per epoch does not change
     data_out_train, _ = random_split(
         tiny300k, [len(data_in_train), len(tiny300k) - len(data_in_train)]
     )
     train_loader = DataLoader(
         data_in_train + data_out_train,
         batch_size=batch_size,
         shuffle=True,
         num_workers=16,
     )

Gallery generated by Sphinx-Gallery