Added cflow algorithm (#47)

* Added cflow algorithm * added cflow reqs * changing default image size * revert image size and delete resume from checkpoint * removed reference to github * reducing batch size for training and inference * decreasing fiber batch size * Added cflow algorithm * added cflow reqs * changing default image size * revert image size and delete resume from checkpoint * removed reference to github * reducing batch size for training and inference * decreasing fiber batch size * reducing patience for quicker convergence * updating config file * fixing checkpoint issue, added normalization param * rolling back to resnet18 * perform metric computation on cpu * normalization on cpu * round performance comparison
openvinotoolkit · Jan 9, 2022 · 80a3de2 · 80a3de2
1 parent 2bae059
commit 80a3de2
Show file tree

Hide file tree

Showing 12 changed files with 594 additions and 11 deletions.
diff --git a/anomalib/core/callbacks/min_max_normalization.py b/anomalib/core/callbacks/min_max_normalization.py
@@ -73,11 +73,11 @@ def on_predict_batch_end(
     @staticmethod
     def _normalize_batch(outputs, pl_module):
         """Normalize a batch of predictions."""
-        stats = pl_module.min_max
+        stats = pl_module.min_max.cpu()
         outputs["pred_scores"] = normalize(
-            outputs["pred_scores"], pl_module.image_threshold.value, stats.min, stats.max
+            outputs["pred_scores"], pl_module.image_threshold.value.cpu(), stats.min, stats.max
         )
         if "anomaly_maps" in outputs.keys():
             outputs["anomaly_maps"] = normalize(
-                outputs["anomaly_maps"], pl_module.pixel_threshold.value, stats.min, stats.max
+                outputs["anomaly_maps"], pl_module.pixel_threshold.value.cpu(), stats.min, stats.max
             )
diff --git a/anomalib/core/model/anomaly_module.py b/anomalib/core/model/anomaly_module.py
@@ -48,19 +48,19 @@ def __init__(self, params: Union[DictConfig, ListConfig]):
         self.loss: Tensor
         self.callbacks: List[Callback]
 
-        self.image_threshold = AdaptiveThreshold(self.hparams.model.threshold.image_default)
+        self.image_threshold = AdaptiveThreshold(self.hparams.model.threshold.image_default).cpu()
         self.pixel_threshold = AdaptiveThreshold(self.hparams.model.threshold.pixel_default)
 
-        self.training_distribution = AnomalyScoreDistribution()
-        self.min_max = MinMax()
+        self.training_distribution = AnomalyScoreDistribution().cpu()
+        self.min_max = MinMax().cpu()
 
         self.model: nn.Module
 
         # metrics
         auroc = AUROC(num_classes=1, pos_label=1, compute_on_step=False)
         f1_score = F1(num_classes=1, compute_on_step=False)
-        self.image_metrics = MetricCollection([auroc, f1_score], prefix="image_")
-        self.pixel_metrics = self.image_metrics.clone(prefix="pixel_")
+        self.image_metrics = MetricCollection([auroc, f1_score], prefix="image_").cpu()
+        self.pixel_metrics = self.image_metrics.clone(prefix="pixel_").cpu()
 
     def forward(self, batch):  # pylint: disable=arguments-differ
         """Forward-pass input tensor to the module.
@@ -111,11 +111,13 @@ def test_step(self, batch, _):  # pylint: disable=arguments-differ
 
     def validation_step_end(self, val_step_outputs):  # pylint: disable=arguments-differ
         """Called at the end of each validation step."""
+        self._outputs_to_cpu(val_step_outputs)
         self._post_process(val_step_outputs)
         return val_step_outputs
 
     def test_step_end(self, test_step_outputs):  # pylint: disable=arguments-differ
         """Called at the end of each test step."""
+        self._outputs_to_cpu(test_step_outputs)
         self._post_process(test_step_outputs)
         return test_step_outputs
 
@@ -152,8 +154,10 @@ def _compute_adaptive_threshold(self, outputs):
 
     def _collect_outputs(self, image_metric, pixel_metric, outputs):
         for output in outputs:
+            image_metric.cpu()
             image_metric.update(output["pred_scores"], output["label"].int())
             if "mask" in output.keys() and "anomaly_maps" in output.keys():
+                pixel_metric.cpu()
                 pixel_metric.update(output["anomaly_maps"].flatten(), output["mask"].flatten().int())
 
     def _post_process(self, outputs):
@@ -163,6 +167,12 @@ def _post_process(self, outputs):
                 outputs["anomaly_maps"].reshape(outputs["anomaly_maps"].shape[0], -1).max(dim=1).values
             )
 
+    def _outputs_to_cpu(self, output):
+        # for output in outputs:
+        for key, value in output.items():
+            if isinstance(value, Tensor):
+                output[key] = value.cpu()
+
     def _log_metrics(self):
         """Log computed performance metrics."""
         self.log_dict(self.image_metrics)

diff --git a/anomalib/core/model/feature_extractor.py b/anomalib/core/model/feature_extractor.py
@@ -50,10 +50,17 @@ def __init__(self, backbone: nn.Module, layers: Iterable[str]):
         self.backbone = backbone
         self.layers = layers
         self._features = {layer: torch.empty(0) for layer in self.layers}
+        self.out_dims = []
 
         for layer_id in layers:
             layer = dict([*self.backbone.named_modules()])[layer_id]
             layer.register_forward_hook(self.get_features(layer_id))
+            # get output dimension of features if available
+            layer_modules = [*layer.modules()]
+            for idx in reversed(range(len(layer_modules))):
+                if hasattr(layer_modules[idx], "out_channels"):
+                    self.out_dims.append(layer_modules[idx].out_channels)
+                    break
 
     def get_features(self, layer_id: str) -> Callable:
         """Get layer features.

diff --git a/anomalib/models/__init__.py b/anomalib/models/__init__.py
@@ -47,7 +47,7 @@ def get_model(config: Union[DictConfig, ListConfig]) -> AnomalyModule:
         AnomalyModule: Anomaly Model
     """
     openvino_model_list: List[str] = ["stfpm"]
-    torch_model_list: List[str] = ["padim", "stfpm", "dfkde", "dfm", "patchcore"]
+    torch_model_list: List[str] = ["padim", "stfpm", "dfkde", "dfm", "patchcore", "cflow"]
     model: AnomalyModule
 
     if config.openvino:

diff --git a/anomalib/models/cflow/README.md b/anomalib/models/cflow/README.md
@@ -0,0 +1,3 @@
+# Real-Time  Unsupervised Anomaly Detection via Conditional Normalizing Flows
+
+This is the implementation of the [CW-AD](https://arxiv.org/pdf/2107.12571v1.pdf) paper.
diff --git a/anomalib/models/cflow/__init__.py b/anomalib/models/cflow/__init__.py
@@ -0,0 +1,18 @@
+"""Real-Time  Unsupervised Anomaly Detection via Conditional Normalizing Flows.
+
+[CW-AD](https://arxiv.org/pdf/2107.12571v1.pdf)
+"""
+
+# Copyright (C) 2020 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions
+# and limitations under the License.
diff --git a/anomalib/models/cflow/backbone.py b/anomalib/models/cflow/backbone.py
@@ -0,0 +1,100 @@
+"""Helper functions to create backbone model."""
+
+# Copyright (C) 2020 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions
+# and limitations under the License.
+
+import math
+
+import FrEIA.framework as Ff
+import FrEIA.modules as Fm
+import torch
+from FrEIA.framework.sequence_inn import SequenceINN
+from torch import nn
+
+
+def positional_encoding_2d(condition_vector: int, height: int, width: int) -> torch.Tensor:
+    """Creates embedding to store relative position of the feature vector using sine and cosine functions.
+
+    Args:
+        condition_vector (int): Length of the condition vector
+        height (int): H of the positions
+        width (int): W of the positions
+
+    Raises:
+        ValueError: Cannot generate encoding with conditional vector length not as multiple of 4
+
+    Returns:
+        torch.Tensor: condition_vector x HEIGHT x WIDTH position matrix
+    """
+    if condition_vector % 4 != 0:
+        raise ValueError(f"Cannot use sin/cos positional encoding with odd dimension (got dim={condition_vector})")
+    pos_encoding = torch.zeros(condition_vector, height, width)
+    # Each dimension use half of condition_vector
+    condition_vector = condition_vector // 2
+    div_term = torch.exp(torch.arange(0.0, condition_vector, 2) * -(math.log(1e4) / condition_vector))
+    pos_w = torch.arange(0.0, width).unsqueeze(1)
+    pos_h = torch.arange(0.0, height).unsqueeze(1)
+    pos_encoding[0:condition_vector:2, :, :] = (
+        torch.sin(pos_w * div_term).transpose(0, 1).unsqueeze(1).repeat(1, height, 1)
+    )
+    pos_encoding[1:condition_vector:2, :, :] = (
+        torch.cos(pos_w * div_term).transpose(0, 1).unsqueeze(1).repeat(1, height, 1)
+    )
+    pos_encoding[condition_vector::2, :, :] = (
+        torch.sin(pos_h * div_term).transpose(0, 1).unsqueeze(2).repeat(1, 1, width)
+    )
+    pos_encoding[condition_vector + 1 :: 2, :, :] = (
+        torch.cos(pos_h * div_term).transpose(0, 1).unsqueeze(2).repeat(1, 1, width)
+    )
+    return pos_encoding
+
+
+def subnet_fc(dims_in: int, dims_out: int):
+    """Subnetwork which predicts the affine coefficients.
+
+    Args:
+        dims_in (int): input dimensions
+        dims_out (int): output dimensions
+
+    Returns:
+        nn.Sequential: Feed-forward subnetwork
+    """
+    return nn.Sequential(nn.Linear(dims_in, 2 * dims_in), nn.ReLU(), nn.Linear(2 * dims_in, dims_out))
+
+
+def cflow_head(condition_vector: int, coupling_blocks: int, clamp_alpha: float, n_features: int) -> SequenceINN:
+    """Create invertible decoder network.
+
+    Args:
+        condition_vector (int): length of the condition vector
+        coupling_blocks (int): number of coupling blocks to build the decoder
+        clamp_alpha (float): clamping value to avoid exploding values
+        n_features (int): number of decoder features
+
+    Returns:
+        SequenceINN: decoder network block
+    """
+    coder = Ff.SequenceINN(n_features)
+    print("CNF coder:", n_features)
+    for _ in range(coupling_blocks):
+        coder.append(
+            Fm.AllInOneBlock,
+            cond=0,
+            cond_shape=(condition_vector,),
+            subnet_constructor=subnet_fc,
+            affine_clamping=clamp_alpha,
+            global_affine_type="SOFTPLUS",
+            permute_soft=True,
+        )
+    return coder
diff --git a/anomalib/models/cflow/config.yaml b/anomalib/models/cflow/config.yaml
@@ -0,0 +1,96 @@
+dataset:
+  name: mvtec
+  format: mvtec
+  path: ./datasets/MVTec
+  url: ftp://guest:GU.205dldo@ftp.softronics.ch/mvtec_anomaly_detection/mvtec_anomaly_detection.tar.xz
+  category: leather
+  task: segmentation
+  label_format: None
+  image_size: 256
+  train_batch_size: 16
+  test_batch_size: 16
+  inference_batch_size: 16
+  fiber_batch_size: 64
+  num_workers: 36
+
+model:
+  name: cflow
+  backbone: resnet18
+  layers:
+    - layer2
+    - layer3
+    - layer4
+  decoder: freia-cflow
+  condition_vector: 128
+  coupling_blocks: 8
+  clamp_alpha: 1.9
+  lr: 0.0001
+  early_stopping:
+    patience: 3
+    metric: pixel_AUROC
+    mode: max
+  normalization_method: min_max # options: [null, min_max, cdf]
+  threshold:
+    image_default: 0
+    pixel_default: 0
+    adaptive: true
+
+project:
+  seed: 0
+  path: ./results
+  log_images_to: [local]
+  logger: false
+  save_to_csv: false
+
+# PL Trainer Args. Don't add extra parameter here.
+trainer:
+  accelerator: null
+  accumulate_grad_batches: 1
+  amp_backend: native
+  amp_level: O2
+  auto_lr_find: false
+  auto_scale_batch_size: false
+  auto_select_gpus: false
+  benchmark: false
+  check_val_every_n_epoch: 1
+  checkpoint_callback: true
+  default_root_dir: null
+  deterministic: true
+  distributed_backend: null
+  fast_dev_run: false
+  flush_logs_every_n_steps: 100
+  gpus: 1
+  gradient_clip_val: 0
+  limit_predict_batches: 1.0
+  limit_test_batches: 1.0
+  limit_train_batches: 1.0
+  limit_val_batches: 1.0
+  log_every_n_steps: 50
+  log_gpu_memory: null
+  max_epochs: 50
+  max_steps: null
+  min_epochs: null
+  min_steps: null
+  move_metrics_to_cpu: false
+  multiple_trainloader_mode: max_size_cycle
+  num_nodes: 1
+  num_processes: 1
+  num_sanity_val_steps: 0
+  overfit_batches: 0.0
+  plugins: null
+  precision: 32
+  prepare_data_per_node: true
+  process_position: 0
+  profiler: null
+  progress_bar_refresh_rate: null
+  reload_dataloaders_every_epoch: false
+  replace_sampler_ddp: true
+  stochastic_weight_avg: false
+  sync_batchnorm: false
+  terminate_on_nan: false
+  tpu_cores: null
+  track_grad_norm: -1
+  truncated_bptt_steps: null
+  val_check_interval: 1.0
+  weights_save_path: null
+  weights_summary: top