learnables · 210057zzh · Oct 17, 2022 · Oct 18, 2022 · Oct 18, 2022 · Oct 18, 2022
diff --git a/tests/unit/svm/__init__.py b/tests/unit/svm/__init__.py
diff --git a/tests/unit/svm/linear_svc_test.py b/tests/unit/svm/linear_svc_test.py
@@ -0,0 +1,55 @@
+import unittest
+import numpy as np
+import torch
+from sklearn.datasets import make_classification
+import sklearn.svm as svm
+import time
+
+from torchml.svm import LinearSVC
+
+n_samples = 5000  # rows in the synthetic data set
+n_features = 10  # total feature columns
+n_classes = 5  # more than two labels, so the multi-class path is exercised
+n_informative = 7  # informative features; the remaining ones are redundant
+
+
+class TestLinearSVC(unittest.TestCase):
+    """Check torchml's LinearSVC against scikit-learn's implementation."""
+
+    def test_LinearSVC(self):
+        """Fit both models on the same data and compare parameters and outputs.
+
+        The data set is generated from a fixed seed so that a failure is
+        reproducible. Floating-point results are compared with atol=1e-2 and
+        rtol=1e-5; predicted labels must agree exactly.
+        """
+        x, y = make_classification(
+            n_samples=n_samples,
+            n_features=n_features,
+            n_classes=n_classes,
+            n_informative=n_informative,
+            n_redundant=n_features - n_informative,
+            random_state=0,
+        )
+        x_t, y_t = torch.from_numpy(x), torch.from_numpy(y)
+
+        lsvc = LinearSVC(max_iter=1000)
+        lsvc.fit(x_t, y_t)
+        # Reference fit with scikit-learn on the same NumPy arrays.
+        reflsvc = svm.LinearSVC(max_iter=100000)
+        reflsvc.fit(x, y)
+
+        tol = dict(rtol=1e-5, atol=1e-2)
+        np.testing.assert_allclose(lsvc.coef_.numpy(), reflsvc.coef_, **tol)
+        np.testing.assert_allclose(
+            lsvc.intercept_.numpy(), reflsvc.intercept_, **tol
+        )
+        np.testing.assert_allclose(
+            lsvc.decision_function(x_t).numpy(), reflsvc.decision_function(x), **tol
+        )
+        # Labels are discrete, so they must match exactly.
+        np.testing.assert_array_equal(lsvc.predict(x_t).numpy(), reflsvc.predict(x))
+
+
+if __name__ == "__main__":
+    unittest.main()  # run the tests when this file is executed directly
diff --git a/torchml/neighbors/nearest_centroid.py b/torchml/neighbors/nearest_centroid.py
@@ -116,8 +116,7 @@ def predict(self, X: torch.tensor) -> torch.tensor:
 
         for i in range(X.size(dim=0)):
             ret[i] = self.classes_[
-                torch.argmin(torch.nn.PairwiseDistance(p=2)
-                             (X[i], self.centroids_))
+                torch.argmin(torch.nn.PairwiseDistance(p=2)(X[i], self.centroids_))
             ]
 
         # return ret.to(self.y_type)

diff --git a/torchml/svm/__init__.py b/torchml/svm/__init__.py
@@ -0,0 +1 @@
+from .linear_svc import LinearSVC
diff --git a/torchml/svm/linear_svc.py b/torchml/svm/linear_svc.py
@@ -0,0 +1,217 @@
+import torch
+
+import torchml as ml
+import cvxpy as cp
+
+
+class LinearSVC(ml.Model):
+    """
+    ## Description
+
+    Linear support vector classifier (one-vs-rest) solved with cvxpy.
+
+    ## References
+
+    1. Bernhard E. Boser, Isabelle M. Guyon, and Vladimir N. Vapnik. 1992. A training algorithm for optimal margin classifiers. In Proceedings of the fifth annual workshop on Computational learning theory (COLT '92). Association for Computing Machinery, New York, NY, USA, 144–152. https://doi.org/10.1145/130385.130401
+    2. MIT 6.034 Artificial Intelligence, Fall 2010, [16. Learning: Support Vector Machines](https://youtu.be/_PwhiWxHK8o)
+    3. The scikit-learn [documentation page](https://scikit-learn.org/stable/modules/generated/sklearn.svm.LinearSVC.html) for LinearSVC.
+
+    ## Arguments
+
+    * `penalty` (str {'l1', 'l2'}, default='l2'):
+        Norm used in the penalization: `0.5 * ||w||^2` for 'l2', `||w||_1` for 'l1'.
+
+    * `loss` (str {'hinge', 'squared_hinge'}, default='squared_hinge'):
+        Specifies the loss function. 'hinge' is the standard SVM loss.
+
+    * `dual` (bool, default=True):
+        Ignored (kept for sklearn API parity); the primal problem is always solved.
+
+    * `tol` (float, default=1e-4):
+        Absolute tolerance handed to the convex solver as its stopping criterion.
+
+    * `C` (float, default=1.0):
+        Regularization parameter. The strength of the regularization is inversely proportional to C. Must be strictly positive.
+
+    * `multi_class` (str {'ovr', 'crammer_singer'}, default='ovr'):
+        Ignored; the one-vs-rest ('ovr') scheme is always used.
+
+    * `fit_intercept` (bool, default=True):
+        Whether to calculate the intercept for this model.
+
+    * `intercept_scaling` (float, default=1):
+        Ignored; kept to mimic the sklearn API.
+
+    * `class_weight` (dict or str 'balanced', default=None):
+        Ignored; kept to mimic the sklearn API.
+
+    * `verbose` (int, default=0):
+        Ignored; kept to mimic the sklearn API.
+
+    * `random_state` (int, RandomState instance or None, default=None):
+        Ignored; kept to mimic the sklearn API.
+
+    * `max_iter` (int, default=1000):
+        The maximum number of iterations run by the underlying convex solver.
+
+    ## Example
+
+    ~~~python
+    import torch
+    from torchml.svm import LinearSVC
+    from sklearn.datasets import make_classification
+
+    x, y = make_classification(
+        n_samples=500,
+        n_features=10,
+        n_classes=5,
+        n_informative=7,
+        n_redundant=3,
+    )
+    svc = LinearSVC(max_iter=1000)
+    svc.fit(torch.from_numpy(x), torch.from_numpy(y))
+    svc.decision_function(torch.from_numpy(x))
+    svc.predict(torch.from_numpy(x))
+    ~~~
+    """
+
+    def __init__(
+        self,
+        penalty="l2",
+        loss="squared_hinge",
+        *,
+        dual=True,
+        tol=1e-4,
+        C=1.0,
+        multi_class="ovr",
+        fit_intercept=True,
+        intercept_scaling=1,
+        class_weight=None,
+        verbose=0,
+        random_state=None,
+        max_iter=1000,
+    ):
+        super().__init__()
+        self.coef_ = None  # one weight row per fitted separator, set by fit()
+        self.intercept_ = None  # one offset per fitted separator, set by fit()
+        self.classes_ = None  # unique labels seen by fit()
+        self.dual = dual
+        self.tol = tol
+        self.C = C
+        self.multi_class = multi_class
+        self.fit_intercept = fit_intercept
+        self.intercept_scaling = intercept_scaling
+        self.class_weight = class_weight
+        self.verbose = verbose
+        self.random_state = random_state
+        self.max_iter = max_iter
+        self.penalty = penalty
+        self.loss = loss
+
+    def fit(self, X: torch.Tensor, y: torch.Tensor, sample_weight=None):
+        """
+        ## Description
+
+        Fit one linear separator per class (one-vs-rest); a two-class problem
+        needs a single separator, fitted for `classes_[1]`.
+
+        ## Arguments
+        * `X` (torch.Tensor): the training samples, one row per sample.
+        * `y` (torch.Tensor): the class label of each sample.
+        * `sample_weight`: accepted for sklearn API compatibility; currently unused.
+
+        Returns `self`; raises `ValueError` for invalid hyper-parameters or shapes.
+        """
+        if self.C <= 0:
+            raise ValueError("Penalty term must be positive; got (C=%r)" % self.C)
+        if self.penalty not in ("l1", "l2"):
+            raise ValueError("Unsupported penalty: %r" % (self.penalty,))
+        if self.loss not in ("hinge", "squared_hinge"):
+            raise ValueError("Unsupported loss: %r" % (self.loss,))
+        if X.shape[0] != y.shape[0]:
+            raise ValueError("Number of X and y rows don't match")
+        self.classes_ = torch.unique(y)
+        # float64 matches the dtype of the solver output appended per class.
+        self.coef_ = torch.empty((0, X.shape[1]), dtype=torch.float64)
+        self.intercept_ = torch.empty((0,), dtype=torch.float64)
+        binary = self.classes_.shape[0] == 2
+        for label in self.classes_[1:] if binary else self.classes_:
+            self._fit_with_one_class(X, y, label, sample_weight=sample_weight)
+        return self
+
+    def decision_function(self, X: torch.Tensor) -> torch.Tensor:
+        """
+        ## Description
+
+        Predict confidence scores for samples, one column per fitted separator.
+
+        ## Arguments
+        * `X` (torch.Tensor): the data set for which we want to get the confidence scores.
+        """
+        return X.to(self.coef_.dtype) @ self.coef_.T + self.intercept_
+
+    def predict(self, X: torch.Tensor) -> torch.Tensor:
+        """
+        ## Description
+
+        Predict the class labels for the provided data.
+
+        ## Arguments
+
+        * `X` (torch.Tensor): the samples to classify, one row per sample.
+        """
+        scores = self.decision_function(X)
+        if self.classes_.shape[0] == 2:
+            # Single separator fitted for classes_[1]: a positive score picks it.
+            indices = (scores.reshape(-1) > 0).long()
+        else:
+            indices = scores.argmax(dim=1)
+        return self.classes_[indices]
+
+    def _fit_with_one_class(
+        self, X: torch.Tensor, y: torch.Tensor, fitting_class: torch.Tensor, sample_weight=None
+    ):
+        """
+        Solve the binary problem `fitting_class` vs. the rest and append the
+        resulting weight row and intercept to `coef_` / `intercept_`.
+
+        `sample_weight` is accepted but not used. Returns `self`; raises
+        `RuntimeError` when the solver yields no solution.
+        """
+        m, n = X.shape
+        # Targets as an (m, 1) column: +1 for `fitting_class`, -1 otherwise.
+        signs = (torch.unsqueeze(y, 1) == fitting_class).double() * 2 - 1
+
+        w = cp.Variable((n, 1))
+        b = cp.Variable() if self.fit_intercept else 0.0
+        X_param = cp.Parameter((m, n))
+        y_param = cp.Parameter((m, 1))
+        C_param = cp.Parameter(nonneg=True)
+
+        if self.penalty == "l1":
+            objective = cp.norm1(w)
+        else:
+            # 0.5 * ||w||^2 is the regulariser of the L2 SVM primal; the plain
+            # (unsquared) norm would solve a different problem.
+            objective = 0.5 * cp.sum_squares(w)
+        hinge = cp.pos(1 - cp.multiply(y_param, X_param @ w + b))
+        if self.loss == "squared_hinge":
+            objective += C_param * cp.sum(cp.square(hinge))
+        else:
+            objective += C_param * cp.sum(hinge)
+
+        prob = cp.Problem(cp.Minimize(objective))
+        X_param.value = X.detach().cpu().numpy()
+        y_param.value = signs.cpu().numpy()
+        C_param.value = self.C
+        prob.solve(solver="ECOS", abstol=self.tol, max_iters=self.max_iter)
+        if w.value is None:
+            raise RuntimeError("Solver found no solution (status=%s)" % prob.status)
+
+        self.coef_ = torch.cat((self.coef_, torch.from_numpy(w.value).T))
+        # Without an intercept, store 0 so `intercept_` keeps one entry per row.
+        bias = float(b.value) if self.fit_intercept else 0.0
+        offset = torch.tensor([bias], dtype=torch.float64)
+        self.intercept_ = torch.cat((self.intercept_, offset))
+        return self