open-edge-platform
diff --git a/‎examples/api/02_data/mvtec_loco.py‎
Lines changed: 71 additions & 0 deletions b/‎examples/api/02_data/mvtec_loco.py‎
Lines changed: 71 additions & 0 deletions
diff --git a/‎examples/configs/data/mvtec_loco.yaml‎
Lines changed: 12 additions & 0 deletions b/‎examples/configs/data/mvtec_loco.yaml‎
Lines changed: 12 additions & 0 deletions
diff --git a/‎src/anomalib/data/__init__.py‎
Lines changed: 4 additions & 1 deletion b/‎src/anomalib/data/__init__.py‎
Lines changed: 4 additions & 1 deletion
diff --git a/‎src/anomalib/data/datamodules/image/__init__.py‎
Lines changed: 18 additions & 9 deletions b/‎src/anomalib/data/datamodules/image/__init__.py‎
Lines changed: 18 additions & 9 deletions
diff --git a/‎src/anomalib/data/datamodules/image/mvtec_loco.py‎
Lines changed: 190 additions & 0 deletions b/‎src/anomalib/data/datamodules/image/mvtec_loco.py‎
Lines changed: 190 additions & 0 deletions
diff --git a/‎src/anomalib/data/datasets/image/__init__.py‎
Lines changed: 3 additions & 0 deletions b/‎src/anomalib/data/datasets/image/__init__.py‎
Lines changed: 3 additions & 0 deletions
@@ -0,0 +1,71 @@
+"""Example showing how to use the MVTec LOCO dataset with Anomalib.
+
+MVTec LOCO is a dataset for detecting logical and structural anomalies in images.
+It contains 5 categories of industrial objects with various types of defects.
+"""
+
+# Copyright (C) 2025 Intel Corporation
+# SPDX-License-Identifier: Apache-2.0
+
+from anomalib.data import MVTecLOCO
+
+# 1. Basic Usage
+# Load a specific category with default settings
+datamodule = MVTecLOCO(
+    root="./datasets/MVTec_LOCO",
+    category="breakfast_box",
+)
+datamodule.prepare_data()
+datamodule.setup()
+data = next(iter(datamodule.test_dataloader()))  # Fetch the first test batch
+
+# 2. Advanced Configuration
+# Customize data loading and preprocessing
+datamodule = MVTecLOCO(
+    root="./datasets/MVTec_LOCO",
+    category="juice_bottle",
+    train_batch_size=32,
+    eval_batch_size=32,
+    num_workers=8,
+    val_split_mode="from_test",  # Create validation set from test set
+    val_split_ratio=0.5,  # Use 50% of test set for validation
+)
+datamodule.prepare_data()
+datamodule.setup()  # Creates the train/val/test datasets that sections 4-6 rely on
+
+# 3. Using Multiple Categories
+# Build one datamodule per category (each one can then be used with its own model)
+for category in ["breakfast_box", "juice_bottle", "pushpins"]:
+    category_data = MVTecLOCO(
+        root="./datasets/MVTec_LOCO",
+        category=category,
+    )
+    # Use category_data with your model...
+
+# 4. Accessing Dataset Properties
+# Get information about the dataset (requires the setup() call from section 2)
+print(f"Number of training samples: {len(datamodule.train_data)}")
+print(f"Number of validation samples: {len(datamodule.val_data)}")
+print(f"Number of test samples: {len(datamodule.test_data)}")
+
+# 5. Working with Data Samples
+# Get a sample from the dataset
+sample = datamodule.train_data[0]
+print("\nSample keys:", list(sample.__dict__.keys()))
+print("Image shape:", sample.image.shape if sample.image is not None else None)
+print("Mask shape:", sample.gt_mask.shape if sample.gt_mask is not None else None)
+print("Label:", sample.gt_label)
+
+# 6. Using with a Model: train and run inference with the datamodule from section 2
+from anomalib.engine import Engine  # noqa: E402
+from anomalib.models import Patchcore  # noqa: E402
+
+# Initialize model
+model = Patchcore(backbone="wide_resnet50_2", layers=["layer3"], coreset_sampling_ratio=0.1)
+
+# Train using the Engine
+engine = Engine()
+engine.fit(model=model, datamodule=datamodule)
+
+# Get predictions
+predictions = engine.predict(model=model, datamodule=datamodule)
@@ -0,0 +1,12 @@
+class_path: anomalib.data.MVTecLOCO  # MVTec LOCO datamodule
+init_args:
+  root: ./datasets/MVTec_LOCO  # Path to the root of the dataset
+  category: breakfast_box  # Category of the MVTec LOCO dataset to load
+  train_batch_size: 32  # Training batch size
+  eval_batch_size: 32  # Test batch size
+  num_workers: 8  # Number of workers
+  test_split_mode: from_dir  # Method to create the test set
+  test_split_ratio: 0.2  # Fraction of data to use for testing
+  val_split_mode: same_as_test  # NOTE(review): the datamodule also loads a dedicated validation split - confirm this mode is intended
+  val_split_ratio: 0.5  # Fraction of data to use for validation
+  seed: null  # Seed for reproducibility (null = not set)
@@ -49,7 +49,7 @@
 # Datamodules
 from .datamodules.base import AnomalibDataModule
 from .datamodules.depth import DepthDataFormat, Folder3D, MVTec3D
-from .datamodules.image import BTech, Datumaro, Folder, ImageDataFormat, Kolektor, MVTec, MVTecAD, Visa
+from .datamodules.image import BTech, Datumaro, Folder, ImageDataFormat, Kolektor, MVTec, MVTecAD, MVTecLOCO, Visa
 from .datamodules.video import Avenue, ShanghaiTech, UCSDped, VideoDataFormat
 
 # Datasets
@@ -61,6 +61,7 @@
     FolderDataset,
     KolektorDataset,
     MVTecADDataset,
+    MVTecLOCODataset,
     VisaDataset,
 )
 from .datasets.video import AvenueDataset, ShanghaiTechDataset, UCSDpedDataset
@@ -163,6 +164,8 @@ def get_datamodule(config: DictConfig | ListConfig | dict) -> AnomalibDataModule
     "MVTec",  # Include MVTec for backward compatibility
     "MVTecAD",
     "MVTecADDataset",
+    "MVTecLOCO",
+    "MVTecLOCODataset",
     "Visa",
     "VisaDataset",
     # Video
 
@@ -8,6 +8,7 @@
 - ``Folder``: Custom folder structure with normal/abnormal images
 - ``Kolektor``: Kolektor Surface-Defect Dataset
 - ``MVTecAD``: MVTec Anomaly Detection Dataset
+- ``MVTecLOCO``: MVTec LOCO Dataset with logical and structural anomalies
 - ``Visa``: Visual Anomaly Dataset
 
 Example:
@@ -29,23 +30,29 @@
 from .datumaro import Datumaro
 from .folder import Folder
 from .kolektor import Kolektor
+from .mvtec_loco import MVTecLOCO
 from .mvtecad import MVTec, MVTecAD
 from .visa import Visa
 
 
 class ImageDataFormat(str, Enum):
     """Supported Image Dataset Types.
 
     The following dataset formats are supported:
 
     - ``BTECH``: BTech Surface Defect Dataset
     - ``DATUMARO``: Dataset in Datumaro format
     - ``FOLDER``: Custom folder structure
     - ``FOLDER_3D``: Custom folder structure for 3D images
     - ``KOLEKTOR``: Kolektor Surface-Defect Dataset
     - ``MVTEC_AD``: MVTec AD Dataset
     - ``MVTEC_3D``: MVTec 3D AD Dataset
+    - ``MVTEC_LOCO``: MVTec LOCO Dataset
     - ``VISA``: Visual Anomaly Dataset
     """
 
     BTECH = "btech"
@@ -55,6 +62,7 @@ class ImageDataFormat(str, Enum):
     KOLEKTOR = "kolektor"
     MVTEC_AD = "mvtecad"
     MVTEC_3D = "mvtec_3d"
+    MVTEC_LOCO = "mvtec_loco"
     VISA = "visa"
 
 
@@ -65,5 +73,6 @@ class ImageDataFormat(str, Enum):
     "Kolektor",
     "MVTecAD",
     "MVTec",  # Include both for backward compatibility
+    "MVTecLOCO",
     "Visa",
 ]
@@ -0,0 +1,190 @@
+"""MVTec LOCO Data Module.
+
+This module provides a PyTorch Lightning DataModule for the MVTec LOCO dataset. The
+dataset contains 5 categories of industrial objects with both normal and
+anomalous samples. Each category includes RGB images and pixel-level ground truth
+masks for anomaly segmentation.
+
+The dataset distinguishes between structural anomalies (local defects) and
+logical anomalies (global defects).
+
+Example:
+    Create a MVTec LOCO datamodule::
+
+        >>> from anomalib.data import MVTecLOCO
+        >>> datamodule = MVTecLOCO(
+        ...     root="./datasets/MVTec_LOCO",
+        ...     category="breakfast_box"
+        ... )
+
+Notes:
+    This module defines no download step, so the dataset is expected to already
+    be available under ``root``. The expected directory structure is::
+
+        datasets/
+        └── MVTec_LOCO/
+            ├── breakfast_box/
+            ├── juice_bottle/
+            └── ...
+
+License:
+    MVTec LOCO dataset is released under the Creative Commons
+    Attribution-NonCommercial-ShareAlike 4.0 International License
+    (CC BY-NC-SA 4.0).
+    https://creativecommons.org/licenses/by-nc-sa/4.0/
+
+Reference:
+    Bergmann, P., Fauser, M., Sattlegger, D., & Steger, C. (2022).
+    MVTec LOCO - A Dataset for Detecting Logical Anomalies in Images.
+    In IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR),
+    2022.
+"""
+
+# Copyright (C) 2025 Intel Corporation
+# SPDX-License-Identifier: Apache-2.0
+
+import logging
+from pathlib import Path
+
+from torchvision.transforms.v2 import Transform
+
+from anomalib.data.datamodules.base.image import AnomalibDataModule
+from anomalib.data.datasets.image.mvtec_loco import MVTecLOCODataset
+from anomalib.data.utils import Split, TestSplitMode, ValSplitMode
+
+logger = logging.getLogger(__name__)
+
+
+class MVTecLOCO(AnomalibDataModule):
+    """MVTec LOCO Datamodule.
+
+    Creates the train, validation and test ``MVTecLOCODataset`` instances for a
+    single category located under ``root``.
+
+    Args:
+        root (Path | str): Path to the root of the dataset.
+            Defaults to ``"./datasets/MVTec_LOCO"``.
+        category (str): Category of the MVTec LOCO dataset (e.g. ``"breakfast_box"`` or
+            ``"juice_bottle"``). Defaults to ``"breakfast_box"``.
+        train_batch_size (int, optional): Training batch size.
+            Defaults to ``32``.
+        eval_batch_size (int, optional): Test batch size.
+            Defaults to ``32``.
+        num_workers (int, optional): Number of workers.
+            Defaults to ``8``.
+        train_augmentations (Transform | None): Augmentations to apply to the training images.
+            Defaults to ``None``.
+        val_augmentations (Transform | None): Augmentations to apply to the validation images.
+            Defaults to ``None``.
+        test_augmentations (Transform | None): Augmentations to apply to the test images.
+            Defaults to ``None``.
+        augmentations (Transform | None): General augmentations to apply if stage-specific
+            augmentations are not provided. Defaults to ``None``.
+        test_split_mode (TestSplitMode | str | None): Method to create test set.
+            Defaults to ``None``.
+        test_split_ratio (float | None): Fraction of data to use for testing.
+            Defaults to ``None``.
+        val_split_mode (ValSplitMode | str | None): Method to create validation set.
+            Defaults to ``None``.
+        val_split_ratio (float | None): Fraction of data to use for validation.
+            Defaults to ``None``.
+        seed (int | None, optional): Seed for reproducibility.
+            Defaults to ``None``.
+
+    Note:
+        The split arguments are forwarded unchanged to ``AnomalibDataModule``;
+        how a ``None`` value is interpreted is decided there, not in this class.
+
+    Example:
+        Create MVTec LOCO datamodule with default settings::
+
+            >>> datamodule = MVTecLOCO()
+            >>> datamodule.setup()
+            >>> i, data = next(enumerate(datamodule.train_dataloader()))
+            >>> data.keys()
+            dict_keys(['image_path', 'label', 'image', 'mask_path', 'mask'])
+
+            >>> data["image"].shape
+            torch.Size([32, 3, 256, 256])
+
+        Change the category::
+
+            >>> datamodule = MVTecLOCO(category="juice_bottle")
+
+        Create validation set from test data::
+
+            >>> datamodule = MVTecLOCO(
+            ...     val_split_mode=ValSplitMode.FROM_TEST,
+            ...     val_split_ratio=0.1
+            ... )
+
+        Create synthetic validation set::
+
+            >>> datamodule = MVTecLOCO(
+            ...     val_split_mode=ValSplitMode.SYNTHETIC,
+            ...     val_split_ratio=0.2
+            ... )
+    """
+
+    def __init__(
+        self,
+        root: Path | str = "./datasets/MVTec_LOCO",
+        category: str = "breakfast_box",
+        train_batch_size: int = 32,
+        eval_batch_size: int = 32,
+        num_workers: int = 8,
+        train_augmentations: Transform | None = None,
+        val_augmentations: Transform | None = None,
+        test_augmentations: Transform | None = None,
+        augmentations: Transform | None = None,
+        test_split_mode: TestSplitMode | str | None = None,
+        test_split_ratio: float | None = None,
+        val_split_mode: ValSplitMode | str | None = None,
+        val_split_ratio: float | None = None,
+        seed: int | None = None,
+    ) -> None:
+        # Everything except ``root`` and ``category`` is handled by the base datamodule.
+        super().__init__(
+            train_batch_size=train_batch_size,
+            eval_batch_size=eval_batch_size,
+            num_workers=num_workers,
+            train_augmentations=train_augmentations,
+            val_augmentations=val_augmentations,
+            test_augmentations=test_augmentations,
+            augmentations=augmentations,
+            test_split_mode=test_split_mode,
+            test_split_ratio=test_split_ratio,
+            val_split_mode=val_split_mode,
+            val_split_ratio=val_split_ratio,
+            seed=seed,
+        )
+
+        # Accept both ``str`` and ``Path`` from callers, but always store a ``Path``.
+        self.root = Path(root)
+        self.category = category
+
+    def _setup(self, _stage: str | None = None) -> None:
+        """Create the train, validation and test datasets for the configured category.
+
+        Instantiates ``MVTecLOCODataset`` once each for ``Split.TRAIN``,
+        ``Split.VAL`` and ``Split.TEST`` using ``self.root`` and ``self.category``,
+        and stores the results in ``self.train_data``, ``self.val_data`` and
+        ``self.test_data``. No subset splitting is performed in this method.
+
+        Args:
+            _stage (str | None): Ignored. All three datasets are created
+                regardless of the requested stage.
+        """
+        # MVTec LOCO provides a training set that contains only normal images.
+        self.train_data = MVTecLOCODataset(
+            split=Split.TRAIN,
+            root=self.root,
+            category=self.category,
+        )
+
+        # MVTec LOCO provides a validation set that contains only normal images.
+        self.val_data = MVTecLOCODataset(
+            split=Split.VAL,
+            root=self.root,
+            category=self.category,
+        )
+
+        # MVTec LOCO provides a test set that contains both normal and anomalous images.
+        # Anomalous images are further divided into structural and logical anomalies.
+        self.test_data = MVTecLOCODataset(
+            split=Split.TEST,
+            root=self.root,
+            category=self.category,
+        )
@@ -8,6 +8,7 @@
 - ``FolderDataset``: Custom dataset from folder structure
 - ``KolektorDataset``: Kolektor surface defect dataset
 - ``MVTecADDataset``: MVTec AD dataset with industrial objects
+- ``MVTecLOCODataset``: MVTec LOCO dataset with logical and structural anomalies
 - ``VisaDataset``: Visual Anomaly dataset
 
 Example:
@@ -26,6 +27,7 @@
 from .datumaro import DatumaroDataset
 from .folder import FolderDataset
 from .kolektor import KolektorDataset
+from .mvtec_loco import MVTecLOCODataset
 from .mvtecad import MVTecADDataset, MVTecDataset
 from .visa import VisaDataset
 
@@ -36,5 +38,6 @@
     "KolektorDataset",
     "MVTecDataset",
     "MVTecADDataset",
+    "MVTecLOCODataset",
     "VisaDataset",
 ]