SeldonIO
diff --git a/‎alibi_detect/od/_knn.py
Lines changed: 1 addition & 1 deletion b/‎alibi_detect/od/_knn.py
Lines changed: 1 addition & 1 deletion
diff --git a/‎alibi_detect/od/_mahalanobis.py
Lines changed: 1 addition & 2 deletions b/‎alibi_detect/od/_mahalanobis.py
Lines changed: 1 addition & 2 deletions
diff --git a/‎alibi_detect/od/_pca.py
Lines changed: 206 additions & 0 deletions b/‎alibi_detect/od/_pca.py
Lines changed: 206 additions & 0 deletions
diff --git a/‎alibi_detect/od/pytorch/__init__.py
Lines changed: 1 addition & 0 deletions b/‎alibi_detect/od/pytorch/__init__.py
Lines changed: 1 addition & 0 deletions
diff --git a/‎alibi_detect/od/pytorch/base.py
Lines changed: 5 additions & 1 deletion b/‎alibi_detect/od/pytorch/base.py
Lines changed: 5 additions & 1 deletion
diff --git a/‎alibi_detect/od/pytorch/knn.py
Lines changed: 2 additions & 2 deletions b/‎alibi_detect/od/pytorch/knn.py
Lines changed: 2 additions & 2 deletions
diff --git a/‎alibi_detect/od/pytorch/mahalanobis.py
Lines changed: 4 additions & 4 deletions b/‎alibi_detect/od/pytorch/mahalanobis.py
Lines changed: 4 additions & 4 deletions
@@ -1,9 +1,9 @@
 from typing import Callable, Union, Optional, Dict, Any, List, Tuple
 from typing import TYPE_CHECKING
+from typing_extensions import Literal
 
 import numpy as np
 
-from typing_extensions import Literal
 from alibi_detect.base import outlier_prediction_dict
 from alibi_detect.exceptions import _catch_error as catch_error
 from alibi_detect.od.base import TransformProtocol, TransformProtocolType
 
@@ -1,11 +1,10 @@
 from typing import Union, Optional, Dict, Any
 from typing import TYPE_CHECKING
 from alibi_detect.exceptions import _catch_error as catch_error
-
+from typing_extensions import Literal
 
 import numpy as np
 
-from alibi_detect.utils._types import Literal
 from alibi_detect.base import BaseDetector, FitMixin, ThresholdMixin, outlier_prediction_dict
 from alibi_detect.od.pytorch import MahalanobisTorch
 from alibi_detect.utils.frameworks import BackendValidator
 
@@ -0,0 +1,206 @@
+from typing import Union, Optional, Callable, Dict, Any
+from typing import TYPE_CHECKING
+from typing_extensions import Literal
+
+import numpy as np
+
+from alibi_detect.base import outlier_prediction_dict
+from alibi_detect.base import BaseDetector, ThresholdMixin, FitMixin
+from alibi_detect.od.pytorch import KernelPCATorch, LinearPCATorch
+from alibi_detect.utils.frameworks import BackendValidator
+from alibi_detect.version import __version__
+from alibi_detect.exceptions import _catch_error as catch_error
+
+
+if TYPE_CHECKING:
+    import torch
+
+
+backends = {
+    'pytorch': (KernelPCATorch, LinearPCATorch)  # order: (kernel variant, linear variant)
+}
+
+
+class PCA(BaseDetector, ThresholdMixin, FitMixin):
+    def __init__(
+        self,
+        n_components: int,
+        kernel: Optional[Callable] = None,
+        backend: Literal['pytorch'] = 'pytorch',
+        device: Optional[Union[Literal['cuda', 'gpu', 'cpu'], 'torch.device']] = None,
+    ) -> None:
+        """Principal Component Analysis (PCA) outlier detector.
+
+        The detector is based on the Principal Component Analysis (PCA) algorithm. There are two variants of PCA:
+        linear PCA and kernel PCA. Linear PCA computes the eigenvectors of the covariance matrix of the data. Kernel
+        PCA computes the eigenvectors of the kernel matrix of the data.
+
+        When scoring a test instance using the linear variant we compute the distance to the principal subspace
+        spanned by the first `n_components` eigenvectors.
+
+        When scoring a test instance using the kernel variant we project it onto the largest eigenvectors and
+        compute its score using the L2 norm.
+
+        If a threshold is fitted we use this to determine whether the instance is an outlier or not.
+
+        Parameters
+        ----------
+        n_components
+            The number of dimensions in the principal subspace. For linear PCA should have
+            ``1 <= n_components < dim(data)``. For kernel PCA should have ``1 <= n_components < len(data)``.
+        kernel
+            Kernel function to use for outlier detection. If ``None``, linear PCA is used instead of the
+            kernel variant.
+        backend
+            Backend used for outlier detection. Defaults to ``'pytorch'``. Options are ``'pytorch'``.
+        device
+            Device type used. The default tries to use the GPU and falls back on CPU if needed. Can be specified by
+            passing either ``'cuda'``, ``'gpu'``, ``'cpu'`` or an instance of ``torch.device``.
+
+        Raises
+        ------
+        NotImplementedError
+            If choice of `backend` is not implemented.
+        ValueError
+            If `n_components` is less than 1.
+        """
+        super().__init__()
+
+        backend_str: str = backend.lower()
+        BackendValidator(
+            backend_options={'pytorch': ['pytorch']},
+            construct_name=self.__class__.__name__
+        ).verify_backend(backend_str)
+
+        kernel_backend_cls, linear_backend_cls = backends[backend_str]  # use the validated, lower-cased name
+
+        self.backend: Union[KernelPCATorch, LinearPCATorch]
+        if kernel is not None:
+            self.backend = kernel_backend_cls(
+                n_components=n_components,
+                device=device,
+                kernel=kernel
+            )
+        else:
+            self.backend = linear_backend_cls(
+                n_components=n_components,
+                device=device,
+            )
+
+    def fit(self, x_ref: np.ndarray) -> None:
+        """Fit the detector on reference data.
+
+        In the linear case we compute the principal components of the reference data using the
+        covariance matrix and then remove the largest `n_components` eigenvectors. The remaining
+        eigenvectors correspond to the invariant dimensions of the data. Changes in these
+        dimensions are used to compute the outlier score which is the distance to the principal
+        subspace spanned by the first `n_components` eigenvectors.
+
+        In the kernel case we compute the principal components of the reference data using the
+        kernel matrix and then return the largest `n_components` eigenvectors. These are then
+        normalized to have length equal to `1/eigenvalue`. Note that this differs from the
+        linear case where we remove the largest eigenvectors.
+
+        In both cases we then store the computed components to use later when we score test
+        instances.
+
+        Parameters
+        ----------
+        x_ref
+            Reference data used to fit the detector.
+
+        Raises
+        ------
+        ValueError
+            If using linear pca variant and `n_components` is greater than or equal to number of
+            features or if using kernel pca variant and `n_components` is greater than or equal
+            to number of instances.
+        """
+        self.backend.fit(self.backend._to_tensor(x_ref))
+
+    @catch_error('NotFittedError')
+    def score(self, x: np.ndarray) -> np.ndarray:
+        """Score `x` instances using the detector.
+
+        Project `x` onto the eigenvectors and compute the score using the L2 norm.
+
+        Parameters
+        ----------
+        x
+            Data to score. The shape of `x` should be `(n_instances, n_features)`.
+
+        Returns
+        -------
+        Outlier scores. The shape of the scores is `(n_instances,)`. The higher the score, the more anomalous the \
+        instance.
+
+        Raises
+        ------
+        NotFittedError
+            If called before detector has been fit.
+        """
+        score = self.backend.score(self.backend._to_tensor(x))
+        return self.backend._to_numpy(score)
+
+    @catch_error('NotFittedError')
+    def infer_threshold(self, x: np.ndarray, fpr: float) -> None:
+        """Infer the threshold for the PCA detector.
+
+        The threshold is computed so that the outlier detector would incorrectly classify `fpr` proportion of the
+        reference data as outliers.
+
+        Parameters
+        ----------
+        x
+            Reference data used to infer the threshold.
+        fpr
+            False positive rate used to infer the threshold. The false positive rate is the proportion of
+            instances in `x` that are incorrectly classified as outliers. The false positive rate should
+            be in the range ``(0, 1)``.
+
+        Raises
+        ------
+        ValueError
+            Raised if `fpr` is not in ``(0, 1)``.
+        NotFittedError
+            If called before detector has been fit.
+        """
+        self.backend.infer_threshold(self.backend._to_tensor(x), fpr)
+
+    @catch_error('NotFittedError')
+    def predict(self, x: np.ndarray) -> Dict[str, Any]:
+        """Predict whether the instances in `x` are outliers or not.
+
+        Scores the instances in `x` and if the threshold was inferred, returns the outlier labels and p-values as well.
+
+        Parameters
+        ----------
+        x
+            Data to predict. The shape of `x` should be `(n_instances, n_features)`.
+
+        Returns
+        -------
+        Dictionary with keys 'data' and 'meta'. 'data' contains the outlier scores. If threshold inference was \
+        performed, 'data' also contains the threshold value, outlier labels and p-values. The shape of the scores is \
+        `(n_instances,)`. The higher the score, the more anomalous the instance. 'meta' contains information about \
+        the detector.
+
+        Raises
+        ------
+        NotFittedError
+            If called before detector has been fit.
+        """
+        outputs = self.backend.predict(self.backend._to_tensor(x))
+        output = outlier_prediction_dict()
+        output['data'] = {
+            **output['data'],
+            **self.backend._to_numpy(outputs)
+        }
+        output['meta'] = {
+            **output['meta'],
+            'name': self.__class__.__name__,
+            'detector_type': 'outlier',
+            'online': False,
+            'version': __version__,
+        }
+        return output
@@ -2,4 +2,5 @@
 
 KNNTorch = import_optional('alibi_detect.od.pytorch.knn', ['KNNTorch'])
 MahalanobisTorch = import_optional('alibi_detect.od.pytorch.mahalanobis', ['MahalanobisTorch'])
+KernelPCATorch, LinearPCATorch = import_optional('alibi_detect.od.pytorch.pca', ['KernelPCATorch', 'LinearPCATorch'])
 Ensembler = import_optional('alibi_detect.od.pytorch.ensemble', ['Ensembler'])
@@ -1,4 +1,5 @@
 from typing import List, Union, Optional, Dict
+from typing_extensions import Literal
 from dataclasses import dataclass, asdict
 from abc import ABC, abstractmethod
 
@@ -60,7 +61,10 @@ class TorchOutlierDetector(torch.nn.Module, FitMixinTorch, ABC):
     threshold_inferred = False
     threshold = None
 
-    def __init__(self, device: Optional[Union[str, torch.device]] = None):
+    def __init__(
+            self,
+            device: Optional[Union[Literal['cuda', 'gpu', 'cpu'], 'torch.device']] = None,
+            ):
         self.device = get_device(device)
         super().__init__()
 
 
@@ -1,5 +1,5 @@
 from typing import Optional, Union, List, Tuple
-
+from typing_extensions import Literal
 import numpy as np
 import torch
 
@@ -13,7 +13,7 @@ def __init__(
             k: Union[np.ndarray, List, Tuple, int],
             kernel: Optional[torch.nn.Module] = None,
             ensembler: Optional[Ensembler] = None,
-            device: Optional[Union[str, torch.device]] = None
+            device: Optional[Union[Literal['cuda', 'gpu', 'cpu'], 'torch.device']] = None,
             ):
         """PyTorch backend for KNN detector.
 
 
@@ -1,5 +1,5 @@
 from typing import Optional, Union
-
+from typing_extensions import Literal
 import torch
 
 from alibi_detect.od.pytorch.base import TorchOutlierDetector
@@ -11,7 +11,7 @@ class MahalanobisTorch(TorchOutlierDetector):
     def __init__(
             self,
             min_eigenvalue: float = 1e-6,
-            device: Optional[Union[str, torch.device]] = None
+            device: Optional[Union[Literal['cuda', 'gpu', 'cpu'], 'torch.device']] = None,
             ):
         """PyTorch backend for Mahalanobis detector.
 
@@ -20,8 +20,8 @@ def __init__(
         min_eigenvalue
             Eigenvectors with eigenvalues below this value will be discarded.
         device
-            Device type used. The default None tries to use the GPU and falls back on CPU if needed.
-            Can be specified by passing either ``'cuda'``, ``'gpu'`` or ``'cpu'``.
+            Device type used. The default tries to use the GPU and falls back on CPU if needed. Can be specified by
+            passing either ``'cuda'``, ``'gpu'``, ``'cpu'`` or an instance of ``torch.device``.
         """
         super().__init__(device=device)
         self.min_eigenvalue = min_eigenvalue