# subgradients_semisparse.py
import numpy
from utils import S, norm_non0, discard_group
from sklearn.base import BaseEstimator
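
# Helpers imported from the local `utils` module. Judging from how they are
# used below, they are assumed to behave as follows (an inference from this
# file, not a documented spec):
#   S(z, t)            -- soft-thresholding operator sign(z) * max(|z| - t, 0)
#   norm_non0(v)       -- l2 norm of v, guarded so that it is never exactly 0
#   discard_group(...) -- subgradient condition deciding whether a whole
#                         group of coefficients can be zeroed out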
__author__ = 'Romain Tavenard romain.tavenard[at]univ-rennes2.fr'


class SGL(BaseEstimator):
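    # This estimator appears to minimize a semi-sparse group-lasso objective:
    #   (1 / 2n) * ||y - X beta||_2^2
    #     + (1 - alpha) * lbda * sum_l sqrt(p_l) * ||beta_l||_2
    #     + alpha * lbda * ||ind_sparse * beta||_1
    # where beta_l is the coefficient sub-vector of group l and p_l its size
    # (cf. Simon et al., "A Sparse-Group Lasso", 2013). ind_sparse acts as a
    # per-feature mask: entries set to 0 exempt the corresponding coefficient
    # from the l1 penalty, hence "semi-sparse".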
    def __init__(self, groups, alpha, lbda, ind_sparse, max_iter=10000,
                 rtol=1e-6):
        self.ind_sparse = numpy.array(ind_sparse)
        self.groups = numpy.array(groups)
        self.alpha = alpha
        self.lbda = lbda
        self.max_iter = max_iter
        self.rtol = rtol
        self.coef_ = None
    def fit(self, X, y):
        # Assumption: group ids are contiguous integers between 0 and
        # max(groups).
        # Other assumption: ind_sparse has dimension X.shape[1] and holds 0
        # for dimensions that should not be pushed towards sparsity and 1 for
        # those that should.
        n_groups = numpy.max(self.groups) + 1
        n, d = X.shape
        assert d == self.ind_sparse.shape[0]

        alpha_lambda = self.alpha * self.lbda * self.ind_sparse
        self.coef_ = numpy.random.randn(d)
        for it in range(self.max_iter):
            beta_old = self.coef_.copy()
            for gr in range(n_groups):
                # 1- Should the group be zeroed out?
                indices_group_k = self.groups == gr
                if discard_group(X, y, self.coef_, self.alpha, self.lbda,
                                 alpha_lambda, indices_group_k):
                    self.coef_[indices_group_k] = 0.
                else:
                    # 2- If the group is not zeroed out, update each of its
                    # components in turn
                    p_l = numpy.sqrt(numpy.sum(indices_group_k))
                    for i in range(d):
                        if self.groups[i] == gr:
                            norm2_beta_k = norm_non0(
                                self.coef_[indices_group_k])
                            X_i_k = X[:, i]
                            # Partial residual excluding the contribution of
                            # feature i
                            r_no_i = (y - numpy.dot(X, self.coef_)
                                      + self.coef_[i] * X_i_k)
                            denom = (numpy.dot(X_i_k.T, X_i_k) / n
                                     + (1 - self.alpha) * self.lbda
                                     * p_l / norm2_beta_k)
                            self.coef_[i] = S(numpy.dot(X_i_k.T, r_no_i) / n,
                                              alpha_lambda[i]) / denom
            # Stop once the relative change of the coefficient vector falls
            # below rtol
            norm_beta = norm_non0(self.coef_)
            if numpy.linalg.norm(self.coef_ - beta_old) / norm_beta \
                    < self.rtol:
                break
        return self
    def predict(self, X):
        return numpy.dot(X, self.coef_)

    def fit_predict(self, X, y):
        return self.fit(X, y).predict(X)
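

# A minimal usage sketch, assuming the `utils` helpers behave as described
# above; the data, group layout and hyper-parameter values are purely
# illustrative.
if __name__ == '__main__':
    numpy.random.seed(0)
    n, d = 100, 6
    X = numpy.random.randn(n, d)
    # Three groups of two features each; only group 0 is informative
    groups = [0, 0, 1, 1, 2, 2]
    true_beta = numpy.array([2., -1., 0., 0., 0., 0.])
    y = numpy.dot(X, true_beta) + .1 * numpy.random.randn(n)
    # Apply the l1 penalty to every dimension
    ind_sparse = numpy.ones((d, ))

    model = SGL(groups=groups, alpha=.5, lbda=.1, ind_sparse=ind_sparse)
    y_pred = model.fit_predict(X, y)
    print(model.coef_)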