Spaces:

kengboon
/

anomaly-detection

Running

App Files Files

KB Teo commited on Jan 31, 2024

Commit

098c98c

1 Parent(s): 1c527f9

Create space

Browse files

Files changed (6) hide show

README.md +3 -3
app.py +63 -0
inference/openvino/__init__.py +1 -0
inference/openvino/ov_infer.py +220 -0
inference/openvino/utils.py +79 -0
requirements.txt +5 -0

README.md CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
-title: AD Anomalib
-emoji: 📉
-colorFrom: blue
 colorTo: yellow
 sdk: gradio
 sdk_version: 4.16.0

 ---
+title: Anomaly Detection
+emoji: 🏭
+colorFrom: red
 colorTo: yellow
 sdk: gradio
 sdk_version: 4.16.0

app.py ADDED Viewed

	@@ -0,0 +1,63 @@

+from typing import *
+import importlib
+from pathlib import Path
+import cv2
+import gradio as gr
+import numpy as np
+available_modes = []
+inferencer = None
+last_model_path: str = None
+if importlib.util.find_spec("openvino"):
+    available_modes.append("OpenVINO")
+    from inference.openvino import OpenVINOInferencer
+    def predict_openvino(
+            image: Union[str, Path, np.ndarray],
+            model_path: Union[str, Path],
+            device: str) -> Dict[str, np.ndarray]:
+        global inferencer, last_model_path
+        if not isinstance(inferencer, OpenVINOInferencer) or last_model_path != str(model_path):
+            inferencer = OpenVINOInferencer(
+                path = model_path,
+                device=device.upper()
+            )
+            last_model_path = str(model_path)
+        return inferencer(image)
+def draw_contour(image, mask, color=(255,0,0), thickness=3):
+    contours, _ = cv2.findContours(mask, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_NONE)
+    return cv2.drawContours(image.copy(), contours, -1, color, thickness)
+def convert_to_heatmap(heatmap):
+    heatmap = cv2.applyColorMap((heatmap*255).astype("uint8"), cv2.COLORMAP_HSV)
+    return heatmap
+def predict(image, device, model_dir):
+    outputs = predict_openvino(image, model_dir, device)
+    out_image = draw_contour(image, outputs["pred_mask"])
+    heatmap = convert_to_heatmap(outputs["anomaly_map"])
+    return out_image, heatmap
+def launch():
+    input_image = gr.Image(label="Input image")
+    devices = gr.Radio(
+        label="Device",
+        choices=["AUTO", "CPU", "CUDA"],
+        value="CPU",
+        interactive=False
+    )
+    output_image = gr.Image(label="Output image")
+    output_heatmap = gr.Image(label="Heatmap"),
+    model = gr.Text(label="Model", interactive=False, value="models/default")
+    intf = gr.Interface(
+        title="Anomaly Detection",
+        fn=predict,
+        inputs=[input_image, devices, model],
+        outputs=[output_image, output_heatmap]
+    )
+    intf.launch()
+if __name__ == "__main__":
+    launch()

inference/openvino/__init__.py ADDED Viewed

	@@ -0,0 +1 @@


1	+ from .ov_infer import OpenVINOInferencer

inference/openvino/ov_infer.py ADDED Viewed

	@@ -0,0 +1,220 @@

+from typing import *
+from pathlib import Path
+import importlib
+import albumentations as A
+import cv2
+from omegaconf import DictConfig, OmegaConf
+import numpy as np
+from .utils import read_image, standardize, normalize_cdf, normalize_min_max, get_boxes
+if importlib.util.find_spec("openvino") is not None:
+    import openvino as ov
+else:
+    raise ImportError("OpenVINO is not installed.")
+class OpenVINOInferencer():
+    """For perform inference with OpenVINO.
+    Args:
+        path (str | Path): Folder path to exported OpenVINO model. Must contains
+            model.xml, model.bin, and metadata.json.
+        device (str): Device to run inference on. Defaults to "AUTO".
+        cache_dir (str | Path): Cache directory for OpenVINO
+    """
+    def __init__(self,
+                 path: Union[str, Path],
+                 device: str="AUTO",
+                 cache_dir: Union[str, Path, None]=None
+                 ) -> None:
+        if isinstance(path, str):
+            path = Path(path)
+        self.model = self._load_model(path, device, cache_dir)
+        self.metadata = self._load_metadata(path)
+        # Note: Transformation require Albumentations package
+        self.transform = A.from_dict(self.metadata["transform"])
+        self.metadata["expand_offset"] = self._get_expand_offset(self.transform)
+        # Record input & output blob (key)
+        self.metadata["input_blob"] = self.model.input(0).get_names().pop()
+        self.metadata["output_blob"] = self.model.output(0).get_names().pop()
+    def _load_model(self, path: Path, device: str, cache_dir: Union[str, Path, None]) -> ov.CompiledModel:
+        xml_path = path / "model.xml"
+        bin_path = path / "model.bin"
+        ov_core = ov.Core()
+        model = ov_core.read_model(xml_path, bin_path)
+        # Create cache directory
+        if cache_dir is None:
+            cache_dir = "cache"
+        if isinstance(cache_dir, str):
+            cache_dir = Path(cache_dir)
+        cache_dir.mkdir(parents=True, exist_ok=True)
+        ov_core.set_property({"CACHE_DIR": cache_dir})
+        model = ov_core.compile_model(model=model, device_name=device.upper())
+        return model
+    def _load_metadata(self, path: Path) -> DictConfig:
+        metadata = path / "metadata.json"
+        metadata = OmegaConf.load(metadata)
+        metadata = cast(DictConfig, metadata)
+        return metadata
+    def _get_expand_offset(self, transform):
+        is_center_cropped = False
+        for t in reversed(transform.transforms):
+            if isinstance(t, A.CenterCrop):
+                is_center_cropped = True
+                cropped_h = t.height
+                cropped_w = t.width
+            elif isinstance(t, A.Resize) and is_center_cropped:
+                return (t.height - cropped_h) // 2, (t.width - cropped_w) // 2
+    def predict(self, image: Union[str, Path, np.ndarray]) -> Dict[str, np.ndarray]:
+        if isinstance(image, (str, Path)):
+            image = read_image(image)
+        # Record input image size
+        self.metadata["image_shape"] = image.shape[:2]
+        inputs = self._pre_process(image, self.transform)
+        predictions = self.model(inputs)
+        outputs = self._post_processs(predictions, self.metadata)
+        outputs.update({"image": image})
+        return outputs
+    def __call__(self, image: Union[str, Path, np.ndarray]) -> Dict[str, np.ndarray]:
+        return self.predict(image)
+    def _pre_process(self, image: np.ndarray, transform=None) -> np.ndarray:
+        if transform is not None:
+            image = transform(image=image)["image"]
+        if len(image.shape) == 3:
+            # Add batch_size axis
+            image = np.expand_dims(image, axis=0)
+        if image.shape[3] == 3:
+            # Transpose the color_channel axis
+            # Expected shape: [b, c, h, w]
+            image = image.transpose(0, 3, 1, 2)
+        return image
+    def _post_processs(self, predictions: np.ndarray, metadata: DictConfig) -> Dict[str, np.ndarray]:
+        predictions = predictions[metadata["output_blob"]]
+        anomaly_map: np.ndarray = None
+        pred_label: float = None
+        pred_mask: float = None
+        if metadata["task"] == "classification":
+            pred_score = predictions
+        else:
+            anomaly_map = predictions.squeeze()
+            pred_score = anomaly_map.reshape(-1).max()
+        if "image_threshold" in metadata:
+            # Assign anomalous label to predictions with score >= threshold
+            pred_label = pred_score >= metadata["image_threshold"]
+        if metadata["task"] == "classification":
+            _, pred_score = self._normalize(pred_scores=pred_score, metadata=metadata)
+        else:
+            if "pixel_threshold" in metadata:
+                pred_mask = (anomaly_map >= metadata["pixel_threshold"]).astype(np.uint8)
+            anomaly_map, pred_score = self._normalize(
+                pred_scores=pred_score,
+                metadata=metadata,
+                anomaly_map=anomaly_map
+            )
+            if "image_shape" in metadata and anomaly_map.shape != metadata["image_shape"]:
+                if "expand_offset" in metadata and metadata["expand_offset"] is not None:
+                    anomaly_map = self._expand(anomaly_map, metadata["expand_offset"][0], metadata["expand_offset"][1])
+                    pred_mask = self._expand(pred_mask, metadata["expand_offset"][0], metadata["expand_offset"][1])
+                h, w = metadata["image_shape"] # Fix: cv2.resize take (w, h) as argument
+                anomaly_map = cv2.resize(anomaly_map, (w, h))
+                if pred_mask is not None:
+                    pred_mask = cv2.resize(pred_mask, (w, h))
+        if metadata["task"] == "detection":
+            pred_boxes = get_boxes(pred_mask)
+            box_labels = np.ones(pred_boxes.shape[0])
+        else:
+            pred_boxes: np.ndarray | None = None
+            box_labels: np.ndarray | None = None
+        return {
+            "anomaly_map": anomaly_map,
+            "pred_label": pred_label,
+            "pred_score": pred_score,
+            "pred_mask": pred_mask,
+            "pred_boxes": pred_boxes,
+            "box_labels": box_labels
+        }
+    @staticmethod
+    def _expand(map, offset_h, offset_w):
+        h, w = map.shape
+        if map is not None:
+            expanded_map = np.zeros((h + offset_h * 2, w + offset_w * 2), dtype=map.dtype)
+            expanded_map[offset_h:offset_h+h, offset_w:offset_w+w] = map
+            return expanded_map
+    @staticmethod
+    def _normalize(
+        pred_scores: np.float32,
+        metadata: DictConfig,
+        anomaly_map: np.ndarray | None = None
+        ) -> Tuple[Union[np.ndarray, None], float]:
+        # Min-max normalization
+        if "min" in metadata and "max" in metadata:
+            if anomaly_map is not None:
+                anomaly_map = normalize_min_max(
+                    anomaly_map,
+                    metadata["pixel_threshold"],
+                    metadata["min"],
+                    metadata["max"]
+                )
+            pred_scores = normalize_min_max(
+                pred_scores,
+                metadata["image_threshold"],
+                metadata["min"],
+                metadata["max"]
+            )
+        # Standardize pixel scores
+        if "pixel_mean" in metadata and "pixel_std" in metadata:
+            if anomaly_map is not None:
+                anomaly_map = standardize(
+                    anomaly_map,
+                    metadata["pixel_mean"],
+                    metadata["pixel_std"],
+                    center_at=metadata["image_mean"]
+                )
+                anomaly_map = normalize_cdf(
+                    anomaly_map,
+                    metadata["pixel_threshold"]
+                )
+        # Standardize image scores
+        if "image_mean" in metadata and "image_std" in metadata:
+            pred_scores = standardize(
+                pred_scores,
+                metadata["image_mean"],
+                metadata["image_std"]
+            )
+            pred_scores = normalize_cdf(
+                pred_scores,
+                metadata["image_threshold"]
+            )
+        return anomaly_map, float(pred_scores)

inference/openvino/utils.py ADDED Viewed

	@@ -0,0 +1,79 @@

+from typing import *
+from pathlib import Path
+import cv2
+import numpy as np
+from scipy.stats import norm
+def read_image(
+        path: Union[str, Path],
+        image_size: Union[int, Tuple[int, int], None]=None
+        ) -> np.ndarray:
+    """Read image from file path in RGB format.
+    Args:
+        path (str | Path): Path to image file.
+        image_size (int | tuple[int, int] | None, optional): Resize image.
+    Returns:
+        image (np.ndarray): The image array.
+    Example:
+        >>> read_image("/path/to/image.jpg", 256)
+    """
+    if isinstance(path, Path):
+        path = str(path)
+    image = cv2.imread(path)
+    image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
+    if image_size:
+        if isinstance(image_size, int):
+            image_size = (image_size, image_size)
+        image = cv2.resize(image, image_size, interpolation=cv2.INTER_AREA)
+    return image
+def standardize(
+        targets: np.ndarray,
+        mean: float,
+        std: float,
+        center_at: float | None = None
+    ) -> np.ndarray:
+    """Standardize the targets to the z-domain."""
+    targets = np.log(targets)
+    standardized = (targets - mean) / std
+    if center_at:
+        standardized -= (center_at - mean) / std
+    return standardized
+def normalize_cdf(targets: np.ndarray, threshold: float) -> np.ndarray:
+    return norm.cdf(targets - threshold)
+def normalize_min_max(
+        targets: np.ndarray | np.float32,
+        threshold: float | np.ndarray,
+        min_val: float | np.ndarray,
+        max_val: float | np.ndarray
+    ) -> np.ndarray:
+    normalized = ((targets - threshold) / (max_val - min_val)) + 0.5
+    normalized = np.minimum(normalized, 1)
+    normalized = np.maximum(normalized, 0)
+    return normalized
+def get_boxes(mask: np.ndarray) -> np.ndarray:
+    """Get bounding boxes from masks.
+    Args:
+        masks (np.ndarray): Input mask of shape (H, W).
+    Returns:
+        boxes (np.ndarray): Array of shape (N, 4) containing bounding boxes in xyxy format.
+    """
+    _, comps = cv2.connectedComponents(mask)
+    labels = comps = np.unique(comps)
+    boxes = []
+    for label in labels[labels != 0]:
+        y_loc, x_loc = np.where(comps == label)
+        boxes.append((np.min(x_loc), np.min(y_loc), np.max(x_loc), np.ma(y_loc)))
+    boxes = np.stack(boxes) if boxes else np.empty((0, 4))
+    return boxes

requirements.txt ADDED Viewed

	@@ -0,0 +1,5 @@

+OmegaConf>=2.1.1
+albumentations>=1.1.0,<2.0.0
+opencv-python>=4.5.3.56
+scipy>=1.11.4,<2.0.0
+openvino>=2023.2.0,<2024.0.0