from typing import TYPE_CHECKING, Any, Dict, Optional, Tuple, Union

import numpy as np

from alibi_detect.base import (BaseDetector, FitMixin, ThresholdMixin,
                               outlier_prediction_dict)
from alibi_detect.exceptions import _catch_error as catch_error
from alibi_detect.od.pytorch import SgdSVMTorch, BgdSVMTorch
from alibi_detect.utils._types import Literal
from alibi_detect.utils.frameworks import BackendValidator
from alibi_detect.version import __version__


if TYPE_CHECKING:
    import torch

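# Maps each backend name to the optimization-specific detector implementations.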
backends = {
    'pytorch': {
        'sgd': SgdSVMTorch,
        'bgd': BgdSVMTorch
    }
}

class SVM(BaseDetector, ThresholdMixin, FitMixin):
    def __init__(
        self,
        nu: float,
        n_components: Optional[int] = None,
        kernel: Optional['torch.nn.Module'] = None,
        optimization: Literal['sgd', 'bgd'] = 'sgd',
        backend: Literal['pytorch'] = 'pytorch',
        device: Optional[Union[Literal['cuda', 'gpu', 'cpu'], 'torch.device']] = None,
    ) -> None:
        """One-Class Support Vector Machine (OCSVM) outlier detector.

        The one-class support vector machine outlier detector fits a one-class SVM to the reference data.

        Rather than the typical approach of optimizing the exact kernel OCSVM objective through its dual
        formulation, here we instead map the data into the kernel's RKHS and solve the linear optimization
        problem directly through its primal formulation. The Nystroem approximation is used to speed up
        training and inference by approximating the kernel's RKHS.

        We provide two options for optimizing the one-class SVM, specified by the `optimization` parameter.
        ``'sgd'`` wraps the `SGDOneClassSVM` class from the scikit-learn package, while ``'bgd'`` uses a
        custom implementation in PyTorch tailored for operation on GPUs. Instead of applying stochastic
        gradient descent (one data point at a time) with a fixed learning rate schedule, it performs full
        gradient descent with the step size chosen at each iteration via line search. Note that on a CPU this
        would not necessarily be preferable to SGD, as we would have to iterate through both data points and
        candidate step sizes, whereas on a GPU all of these operations are vectorized/parallelized. Moreover,
        the Nystroem approximation has complexity `O(n^2m)`, where `n` is the number of reference instances
        and `m` is the number of inducing points. It can therefore be expensive for large reference sets and
        benefits from a GPU implementation.

        In general, if using a small dataset then the ``'cpu'`` device with the ``'sgd'`` optimization is the
        best choice, whereas for a large dataset the ``'gpu'`` device with the ``'bgd'`` optimization is
        preferable.

        Parameters
        ----------
        nu
            The proportion of the training data that should be considered outliers. Note that this does not
            necessarily correspond to the false positive rate on test data, which is still defined when
            calling the `infer_threshold` method. `nu` should be thought of as a regularization parameter
            that affects how smooth the SVM decision boundary is.
        n_components
            Number of components in the Nystroem approximation. By default uses all of them.
        kernel
            Kernel function to use for outlier detection. Should be an instance of a subclass of
            `torch.nn.Module`. If not specified then defaults to the `GaussianRBF`.
        optimization
            Optimization method to use. Choose from ``'sgd'`` or ``'bgd'``. Defaults to ``'sgd'``.
        backend
            Backend used for outlier detection. Defaults to ``'pytorch'``. Options are ``'pytorch'``.
        device
            Device type used. The default tries to use the GPU and falls back on CPU if needed. Can be
            specified by passing either ``'cuda'``, ``'gpu'``, ``'cpu'`` or an instance of ``torch.device``.

        Raises
        ------
        NotImplementedError
            If choice of `backend` is not implemented.
        ValueError
            If choice of `optimization` is not valid.
        ValueError
            If `n_components` is not a positive integer.
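
        Examples
        --------
        A minimal usage sketch on synthetic data. The `alibi_detect.od` import path is an assumption based on
        this module's location; the calls follow the API defined below:

        >>> import numpy as np
        >>> from alibi_detect.od import SVM
        >>> x_ref = np.random.default_rng(0).normal(size=(100, 4)).astype(np.float32)
        >>> svm = SVM(nu=0.1, n_components=50, optimization='sgd')
        >>> svm.fit(x_ref)
        >>> svm.infer_threshold(x_ref, fpr=0.05)
        >>> preds = svm.predict(np.ones((8, 4), dtype=np.float32))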
        """
        super().__init__()

        if optimization not in ('sgd', 'bgd'):
            raise ValueError(f'Optimization {optimization} not recognized. Choose from `sgd` or `bgd`.')

        if n_components is not None and n_components <= 0:
            raise ValueError(f'n_components must be a positive integer, got {n_components}.')

        backend_str: str = backend.lower()
        BackendValidator(
            backend_options={'pytorch': ['pytorch']},
            construct_name=self.__class__.__name__
        ).verify_backend(backend_str)

        backend_cls = backends[backend_str][optimization]
        args: Dict[str, Any] = {
            'n_components': n_components,
            'kernel': kernel,
            'nu': nu,
            'device': device
        }
        self.backend = backend_cls(**args)

    def fit(
        self,
        x_ref: np.ndarray,
        tol: float = 1e-6,
        max_iter: int = 1000,
        step_size_range: Tuple[float, float] = (1e-8, 1.0),
        n_step_sizes: int = 16,
        n_iter_no_change: int = 25,
        verbose: int = 0,
    ) -> None:
        """Fit the detector on reference data.

        Uses the choice of optimization method to fit the SVM model to the data.

        Parameters
        ----------
        x_ref
            Reference data used to fit the detector.
        tol
            Convergence threshold used to fit the detector. Used for both ``'sgd'`` and ``'bgd'``
            optimizations. Defaults to ``1e-6``.
        max_iter
            The maximum number of optimization steps. Used for both ``'sgd'`` and ``'bgd'`` optimizations.
        step_size_range
            The range of values to be considered for the gradient descent step size at each iteration. This
            is specified as a tuple of the form `(min_eta, max_eta)` and only used for the ``'bgd'``
            optimization.
        n_step_sizes
            The number of step sizes in the defined range to be tested for loss reduction. This many points
            are spaced evenly along the range in log space. This is only used for the ``'bgd'`` optimization.
        n_iter_no_change
            The number of iterations over which the loss must decrease by `tol` in order for optimization to
            continue. This is only used for the ``'bgd'`` optimization.
        verbose
            Verbosity level during training. ``0`` is silent, ``1`` prints fit status. If using ``'bgd'``,
            the fit displays a progress bar. Otherwise, if using ``'sgd'``, the scikit-learn
            `SGDOneClassSVM.fit()` logs are output.
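
        Examples
        --------
        An illustrative sketch of the candidate step-size grid described above. The backend's exact
        construction is not shown here; this only demonstrates the even spacing in log space over
        `(min_eta, max_eta)`:

        >>> import numpy as np
        >>> min_eta, max_eta = 1e-8, 1.0
        >>> candidates = np.logspace(np.log10(min_eta), np.log10(max_eta), num=16)
        >>> len(candidates)
        16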
        """
        self.backend.fit(
            self.backend._to_tensor(x_ref),
            **self.backend.format_fit_kwargs(locals())
        )

    @catch_error('NotFittedError')
    def score(self, x: np.ndarray) -> np.ndarray:
        """Score `x` instances using the detector.

        Scores the data using the fitted SVM model. The higher the score, the more anomalous the instance.

        Parameters
        ----------
        x
            Data to score. The shape of `x` should be `(n_instances, n_features)`.

        Returns
        -------
        Outlier scores. The shape of the scores is `(n_instances,)`. The higher the score, the more anomalous \
        the instance.

        Raises
        ------
        NotFittedError
            If called before detector has been fit.
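
        Examples
        --------
        A minimal sketch, assuming a fitted detector `svm` (see the class docstring for a full example):

        >>> scores = svm.score(np.ones((8, 4), dtype=np.float32))
        >>> scores.shape
        (8,)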
        """
        score = self.backend.score(self.backend._to_tensor(x))
        return self.backend._to_numpy(score)

    @catch_error('NotFittedError')
    def infer_threshold(self, x: np.ndarray, fpr: float) -> None:
        """Infer the threshold for the SVM detector.

        The threshold is computed so that the outlier detector would incorrectly classify `fpr` proportion of
        the reference data as outliers.

        Parameters
        ----------
        x
            Reference data used to infer the threshold.
        fpr
            False positive rate used to infer the threshold. The false positive rate is the proportion of
            instances in `x` that are incorrectly classified as outliers. The false positive rate should
            be in the range ``(0, 1)``.

        Raises
        ------
        ValueError
            Raised if `fpr` is not in ``(0, 1)``.
        NotFittedError
            If called before detector has been fit.
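
        Examples
        --------
        A minimal sketch, assuming a fitted detector `svm` and reference data `x_ref`; with ``fpr=0.05``,
        roughly 5% of `x_ref` will be flagged as outliers:

        >>> svm.infer_threshold(x_ref, fpr=0.05)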
        """
        self.backend.infer_threshold(self.backend._to_tensor(x), fpr)

    @catch_error('NotFittedError')
    def predict(self, x: np.ndarray) -> Dict[str, Any]:
        """Predict whether the instances in `x` are outliers or not.

        Scores the instances in `x` and, if the threshold was inferred, returns the outlier labels and
        p-values as well.

        Parameters
        ----------
        x
            Data to predict. The shape of `x` should be `(n_instances, n_features)`.

        Returns
        -------
        Dictionary with keys 'data' and 'meta'. 'data' contains the outlier scores. If threshold inference \
        was performed, 'data' also contains the threshold value, outlier labels and p-values. The shape of \
        the scores is `(n_instances,)`. The higher the score, the more anomalous the instance. 'meta' \
        contains information about the detector.

        Raises
        ------
        NotFittedError
            If called before detector has been fit.
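
        Examples
        --------
        A sketch of the returned structure, assuming a fitted detector `svm` (the contents of 'data' depend
        on whether `infer_threshold` has been called):

        >>> preds = svm.predict(np.ones((8, 4), dtype=np.float32))
        >>> sorted(preds.keys())
        ['data', 'meta']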
        """
        outputs = self.backend.predict(self.backend._to_tensor(x))
        output = outlier_prediction_dict()
        output['data'] = {
            **output['data'],
            **self.backend._to_numpy(outputs)
        }
        output['meta'] = {
            **output['meta'],
            'name': self.__class__.__name__,
            'detector_type': 'outlier',
            'online': False,
            'version': __version__,
        }
        return output