Source code for abess.linear

import warnings
import numpy as np
from sklearn.metrics import r2_score, ndcg_score
from .metrics import concordance_index_censored
from .bess_base import bess_base
from .utilities import new_data_check
from .functions import BreslowEstimator
# from .nonparametric import _compute_counts
try:
    from sklearn.metrics import d2_tweedie_score
except ImportError:
    from .functions import d2_tweedie_score


def fix_docs(cls):
    # Inherit the docstring from the base class so that shared parameter
    # descriptions are not duplicated in every subclass.
    index = cls.__doc__.find("Examples\n    --------\n")
    if index != -1:
        cls.__doc__ = cls.__doc__[:index] + \
            cls.__bases__[0].__doc__ + cls.__doc__[index:]
    return cls
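
# For example, LogisticRegression.__doc__ below ends up reading as
#   <subclass header and parameters> + <bess_base parameters> + <Examples>,
# because the base-class docstring is spliced in immediately before the
# subclass's "Examples" section.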


@fix_docs
class LogisticRegression(bess_base):
    r"""
    Adaptive Best-Subset Selection (ABESS) algorithm for logistic
    regression.

    Parameters
    ----------
    splicing_type: {0, 1}, optional, default=0
        The type of splicing: "0" for decreasing by half, "1" for
        decreasing by one.
    important_search : int, optional, default=128
        The size of the inactive set used when updating the active set
        during splicing. It should be a non-negative integer; if
        important_search=0, it is set to the size of the whole inactive
        set.

    Examples
    --------
    >>> ### Sparsity known
    >>>
    >>> from abess.linear import LogisticRegression
    >>> from abess.datasets import make_glm_data
    >>> import numpy as np
    >>> np.random.seed(12345)
    >>> data = make_glm_data(n = 100, p = 50, k = 10, family = 'binomial')
    >>> model = LogisticRegression(support_size = 10)
    >>> model.fit(data.x, data.y)
    LogisticRegression(always_select=[], support_size=10)
    >>> model.predict(data.x)[1:10]
    array([0., 0., 1., 1., 0., 1., 0., 1., 0.])

    >>> ### Sparsity unknown
    >>>
    >>> # path_type="seq"
    >>> model = LogisticRegression(path_type = "seq")
    >>> model.fit(data.x, data.y)
    LogisticRegression(always_select=[])
    >>> model.predict(data.x)[:10]
    array([0., 1., 0., 0., 1., 0., 1., 0., 1., 1.])
    >>>
    >>> # path_type="gs"
    >>> model = LogisticRegression(path_type="gs")
    >>> model.fit(data.x, data.y)
    LogisticRegression(always_select=[], path_type='gs')
    >>> model.predict(data.x)[:10]
    array([0., 0., 0., 1., 1., 0., 1., 0., 1., 0.])
    """

    def __init__(self, max_iter=20, exchange_num=5, path_type="seq",
                 is_warm_start=True, support_size=None, alpha=None,
                 s_min=None, s_max=None, ic_type="ebic", ic_coef=1.0,
                 cv=1, screening_size=-1, always_select=None,
                 primary_model_fit_max_iter=10,
                 primary_model_fit_epsilon=1e-8,
                 approximate_Newton=False, thread=1, sparse_matrix=False,
                 splicing_type=0, important_search=128):
        super().__init__(
            algorithm_type="abess", model_type="Logistic", normalize_type=2,
            path_type=path_type, max_iter=max_iter,
            exchange_num=exchange_num, is_warm_start=is_warm_start,
            support_size=support_size, alpha=alpha, s_min=s_min, s_max=s_max,
            ic_type=ic_type, ic_coef=ic_coef, cv=cv,
            screening_size=screening_size, always_select=always_select,
            primary_model_fit_max_iter=primary_model_fit_max_iter,
            primary_model_fit_epsilon=primary_model_fit_epsilon,
            approximate_Newton=approximate_Newton, thread=thread,
            sparse_matrix=sparse_matrix, splicing_type=splicing_type,
            important_search=important_search,
            _estimator_type='classifier')

    def _more_tags(self):
        return {'binary_only': True, 'no_validation': True}

    def predict_proba(self, X):
        r"""
        Give the probabilities of new samples being assigned to the two
        classes.

        Parameters
        ----------
        X : array-like, shape(n_samples, p_features)
            Sample matrix to be predicted.

        Returns
        -------
        proba : array-like, shape(n_samples, 2)
            Returns the probabilities for classes "0" and "1" on given X.
        """
        X = new_data_check(self, X)
        intercept_ = np.ones(X.shape[0]) * self.intercept_
        xbeta = X.dot(self.coef_) + intercept_
        proba = np.exp(xbeta) / (1 + np.exp(xbeta))
        return np.vstack((np.ones(X.shape[0]) - proba, proba)).T
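
    # Sanity-check sketch (hypothetical `model` and `data` names): each row
    # of predict_proba is [P(y=0 | x), P(y=1 | x)] and therefore sums to 1.
    #   proba = model.predict_proba(data.x)
    #   assert np.allclose(proba.sum(axis=1), 1.0)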

    def predict(self, X):
        r"""
        Predict class labels for given data.

        Parameters
        ----------
        X : array-like, shape(n_samples, p_features)
            Sample matrix to be predicted.

        Returns
        -------
        y : array-like, shape(n_samples,)
            Predicted class labels (0 or 1) for samples in X.
        """
        X = new_data_check(self, X)
        intercept_ = np.ones(X.shape[0]) * self.intercept_
        xbeta = X.dot(self.coef_) + intercept_
        y = np.repeat(self.classes_[0], xbeta.size)
        if self.classes_.size == 2:
            y[xbeta > 0] = self.classes_[1]
        return y
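
    # Note: the decision rule ``xbeta > 0`` above is equivalent to
    # thresholding the predicted probability at 0.5, since the logistic
    # function maps 0 to exactly 0.5.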

    def score(self, X, y):
        r"""
        Given new data, return the mean prediction accuracy.

        Parameters
        ----------
        X : array-like, shape(n_samples, p_features)
            Sample matrix.
        y : array-like, shape(n_samples,)
            Real class labels (0 or 1) for X.

        Returns
        -------
        score : float
            The mean prediction accuracy on the given data.
        """
        X, y = new_data_check(self, X, y)
        # intercept_ = np.ones(X.shape[0]) * self.intercept_
        # xbeta = X.dot(self.coef_) + intercept_
        # xbeta[xbeta > 30] = 30
        # xbeta[xbeta < -30] = -30
        # pr = np.exp(xbeta) / (1 + np.exp(xbeta))
        # return (y * np.log(pr) +
        #         (np.ones(X.shape[0]) - y) *
        #         np.log(np.ones(X.shape[0]) - pr)).sum()
        y_pred = self.predict(X)
        return (y == y_pred).mean()


@fix_docs
class LinearRegression(bess_base):
    r"""
    Adaptive Best-Subset Selection (ABESS) algorithm for linear regression.

    Parameters
    ----------
    splicing_type: {0, 1}, optional, default=0
        The type of splicing: "0" for decreasing by half, "1" for
        decreasing by one.
    important_search : int, optional, default=128
        The size of the inactive set used when updating the active set
        during splicing. It should be a non-negative integer; if
        important_search=0, it is set to the size of the whole inactive
        set.

    Examples
    --------
    >>> ### Sparsity known
    >>>
    >>> from abess.linear import LinearRegression
    >>> from abess.datasets import make_glm_data
    >>> import numpy as np
    >>> np.random.seed(12345)
    >>> data = make_glm_data(n = 100, p = 50, k = 10, family = 'gaussian')
    >>> model = LinearRegression(support_size = 10)
    >>> model.fit(data.x, data.y)
    LinearRegression(always_select=[], support_size=10)
    >>> model.predict(data.x)[:4]
    array([   1.42163813,  -43.23929886, -139.79509191,  141.45138403])

    >>> ### Sparsity unknown
    >>>
    >>> # path_type="seq"
    >>> model = LinearRegression(path_type = "seq")
    >>> model.fit(data.x, data.y)
    LinearRegression(always_select=[])
    >>> model.predict(data.x)[:4]
    array([   1.42163813,  -43.23929886, -139.79509191,  141.45138403])
    >>>
    >>> # path_type="gs"
    >>> model = LinearRegression(path_type="gs")
    >>> model.fit(data.x, data.y)
    LinearRegression(always_select=[], path_type='gs')
    >>> model.predict(data.x)[:4]
    array([   1.42163813,  -43.23929886, -139.79509191,  141.45138403])
    """

    def __init__(self, max_iter=20, exchange_num=5, path_type="seq",
                 is_warm_start=True, support_size=None, alpha=None,
                 s_min=None, s_max=None, ic_type="ebic", ic_coef=1.0,
                 cv=1, screening_size=-1, always_select=None,
                 thread=1, covariance_update=False, sparse_matrix=False,
                 splicing_type=0, important_search=128,
                 # primary_model_fit_max_iter=10,
                 # primary_model_fit_epsilon=1e-8,
                 # approximate_Newton=False
                 ):
        super().__init__(
            algorithm_type="abess", model_type="Lm", normalize_type=1,
            path_type=path_type, max_iter=max_iter,
            exchange_num=exchange_num, is_warm_start=is_warm_start,
            support_size=support_size, alpha=alpha, s_min=s_min, s_max=s_max,
            ic_type=ic_type, ic_coef=ic_coef, cv=cv,
            screening_size=screening_size, always_select=always_select,
            thread=thread, covariance_update=covariance_update,
            sparse_matrix=sparse_matrix, splicing_type=splicing_type,
            important_search=important_search,
            _estimator_type='regressor')

    def _more_tags(self):
        return {'multioutput': False}

    def predict(self, X):
        r"""
        Predict on given data.

        Parameters
        ----------
        X : array-like, shape(n_samples, p_features)
            Sample matrix to be predicted.

        Returns
        -------
        y : array-like, shape(n_samples,)
            Prediction of the mean on given X.
        """
        X = new_data_check(self, X)
        intercept_ = np.ones(X.shape[0]) * self.intercept_
        return X.dot(self.coef_) + intercept_

    def score(self, X, y):
        r"""
        Given new data, return the coefficient of determination.

        Parameters
        ----------
        X : array-like, shape(n_samples, p_features)
            Sample matrix.
        y : array-like, shape(n_samples,)
            Real response for given X.

        Returns
        -------
        score : float
            :math:`R^2` score.
        """
        X, y = new_data_check(self, X, y)
        y_pred = self.predict(X)
        # return ((y - y_pred) * (y - y_pred)).sum()
        return r2_score(y, y_pred)


@fix_docs
class CoxPHSurvivalAnalysis(bess_base, BreslowEstimator):
    r"""
    Adaptive Best-Subset Selection (ABESS) algorithm for the Cox
    proportional hazards model.

    Parameters
    ----------
    splicing_type: {0, 1}, optional, default=0
        The type of splicing: "0" for decreasing by half, "1" for
        decreasing by one.
    important_search : int, optional, default=128
        The size of the inactive set used when updating the active set
        during splicing. It should be a non-negative integer; if
        important_search=0, it is set to the size of the whole inactive
        set.

    Examples
    --------
    >>> ### Sparsity known
    >>>
    >>> from abess.linear import CoxPHSurvivalAnalysis
    >>> from abess.datasets import make_glm_data
    >>> import numpy as np
    >>> np.random.seed(12345)
    >>> data = make_glm_data(n = 100, p = 50, k = 10, family = 'cox')
    censoring rate:0.65
    >>> model = CoxPHSurvivalAnalysis(support_size = 10)
    >>> model.fit(data.x, data.y)
    CoxPHSurvivalAnalysis(always_select=[], support_size=10)
    >>> model.predict(data.x)[:4]
    array([1.08176927e+00, 6.37029117e-04, 3.64112556e-06, 4.09523406e+05])

    >>> ### Sparsity unknown
    >>>
    >>> # path_type="seq"
    >>> model = CoxPHSurvivalAnalysis(path_type = "seq")
    >>> model.fit(data.x, data.y)
    CoxPHSurvivalAnalysis(always_select=[])
    >>> model.predict(data.x)[:4]
    array([1.08176927e+00, 6.37029117e-04, 3.64112556e-06, 4.09523406e+05])
    >>>
    >>> # path_type="gs"
    >>> model = CoxPHSurvivalAnalysis(path_type="gs")
    >>> model.fit(data.x, data.y)
    CoxPHSurvivalAnalysis(always_select=[], path_type='gs')
    >>> model.predict(data.x)[:4]
    array([1.07629689e+00, 6.47263126e-04, 4.30660826e-06, 3.66389638e+05])
    """

    def __init__(self, max_iter=20, exchange_num=5, path_type="seq",
                 is_warm_start=True, support_size=None, alpha=None,
                 s_min=None, s_max=None, ic_type="ebic", ic_coef=1.0,
                 cv=1, screening_size=-1, always_select=None,
                 primary_model_fit_max_iter=10,
                 primary_model_fit_epsilon=1e-8,
                 approximate_Newton=False, thread=1, sparse_matrix=False,
                 splicing_type=0, important_search=128):
        super().__init__(
            algorithm_type="abess", model_type="Cox", normalize_type=3,
            path_type=path_type, max_iter=max_iter,
            exchange_num=exchange_num, is_warm_start=is_warm_start,
            support_size=support_size, alpha=alpha, s_min=s_min, s_max=s_max,
            ic_type=ic_type, ic_coef=ic_coef, cv=cv,
            screening_size=screening_size, always_select=always_select,
            primary_model_fit_max_iter=primary_model_fit_max_iter,
            primary_model_fit_epsilon=primary_model_fit_epsilon,
            approximate_Newton=approximate_Newton, thread=thread,
            sparse_matrix=sparse_matrix, splicing_type=splicing_type,
            important_search=important_search,
            baseline_model=BreslowEstimator())

    def _more_tags(self):
        # Note: we skip scikit-learn's estimator checks here because they
        # pass a 1-column `y` for testing, while `CoxPHSurvivalAnalysis`
        # requires a 2-column `y` (one column for time, another for
        # censoring).
        return {'_skip_test': True}

    def predict(self, X):
        r"""
        Return the time-independent part of the hazard function, i.e.
        :math:`\exp(X\beta)`, on given data.

        Parameters
        ----------
        X : array-like, shape(n_samples, p_features)
            Sample matrix to be predicted.

        Returns
        -------
        y : array-like, shape(n_samples,)
            Return :math:`\exp(X\beta)`.
        """
        X = new_data_check(self, X)
        return np.exp(X.dot(self.coef_))
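
    # Under the proportional-hazards assumption, the value exp(x' beta)
    # returned above is the multiplicative factor that scales the baseline
    # hazard for a sample with features x.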

    def score(self, X, y):
        r"""
        Given new data, return the C-index.

        Parameters
        ----------
        X : array-like, shape(n_samples, p_features)
            Sample matrix.
        y : array-like, shape(n_samples, 2)
            Real response for given X: the first column is the survival
            time, the second column is the censoring (event) indicator.

        Returns
        -------
        score : float
            C-index.
        """
        X, y = new_data_check(self, X, y)
        risk_score = X.dot(self.coef_)
        y = np.array(y)
        result = concordance_index_censored(
            np.array(y[:, 1], np.bool_), y[:, 0], risk_score)
        return result[0]

    def predict_survival_function(self, X):
        r"""
        Predict survival function.

        The survival function for an individual with feature vector
        :math:`x` is defined as

        .. math::
            S(t \mid x) = S_0(t)^{\exp(x^\top \beta)} ,

        where :math:`S_0(t)` is the baseline survival function,
        estimated by Breslow's estimator.

        Parameters
        ----------
        X : array-like, shape = (n_samples, n_features)
            Data matrix.

        Returns
        -------
        survival : ndarray of :class:`StepFunction`, shape = (n_samples,)
            Predicted survival functions.
        """
        return self.baseline_model.get_survival_function(
            np.log(self.predict(X)))
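
    # Usage sketch (assuming, as in scikit-survival, that the returned
    # StepFunction objects are callable at given time points):
    #   surv_fns = model.predict_survival_function(data.x)
    #   times = np.linspace(1, 10, 5)
    #   probs = np.asarray([fn(times) for fn in surv_fns])  # (n_samples, 5)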


@fix_docs
class PoissonRegression(bess_base):
    r"""
    Adaptive Best-Subset Selection (ABESS) algorithm for Poisson
    regression.

    Parameters
    ----------
    splicing_type: {0, 1}, optional, default=0
        The type of splicing: "0" for decreasing by half, "1" for
        decreasing by one.
    important_search : int, optional, default=128
        The size of the inactive set used when updating the active set
        during splicing. It should be a non-negative integer; if
        important_search=0, it is set to the size of the whole inactive
        set.

    Examples
    --------
    >>> ### Sparsity known
    >>>
    >>> from abess.linear import PoissonRegression
    >>> from abess.datasets import make_glm_data
    >>> import numpy as np
    >>> np.random.seed(12345)
    >>> data = make_glm_data(n = 100, p = 50, k = 10, family = 'poisson')
    >>> model = PoissonRegression(support_size = 10)
    >>> model.fit(data.x, data.y)
    PoissonRegression(always_select=[], support_size=10)
    >>> model.predict(data.x)[:4]
    array([1.06757251e+00, 8.92711312e-01, 5.64414159e-01, 1.35820866e+00])

    >>> ### Sparsity unknown
    >>>
    >>> # path_type="seq"
    >>> model = PoissonRegression(path_type = "seq")
    >>> model.fit(data.x, data.y)
    PoissonRegression(always_select=[])
    >>> model.predict(data.x)[:4]
    array([1.03373139e+00, 4.32229653e-01, 4.48811009e-01, 2.27170366e+00])
    >>>
    >>> # path_type="gs"
    >>> model = PoissonRegression(path_type="gs")
    >>> model.fit(data.x, data.y)
    PoissonRegression(always_select=[], path_type='gs')
    >>> model.predict(data.x)[:4]
    array([1.03373139e+00, 4.32229653e-01, 4.48811009e-01, 2.27170366e+00])
    """

    def __init__(self, max_iter=20, exchange_num=5, path_type="seq",
                 is_warm_start=True, support_size=None, alpha=None,
                 s_min=None, s_max=None, ic_type="ebic", ic_coef=1.0,
                 cv=1, screening_size=-1, always_select=None,
                 primary_model_fit_max_iter=10,
                 primary_model_fit_epsilon=1e-8,
                 thread=1, sparse_matrix=False,
                 splicing_type=0, important_search=128):
        super().__init__(
            algorithm_type="abess", model_type="Poisson", normalize_type=2,
            path_type=path_type, max_iter=max_iter,
            exchange_num=exchange_num, is_warm_start=is_warm_start,
            support_size=support_size, alpha=alpha, s_min=s_min, s_max=s_max,
            ic_type=ic_type, ic_coef=ic_coef, cv=cv,
            screening_size=screening_size, always_select=always_select,
            primary_model_fit_max_iter=primary_model_fit_max_iter,
            primary_model_fit_epsilon=primary_model_fit_epsilon,
            thread=thread, sparse_matrix=sparse_matrix,
            splicing_type=splicing_type,
            important_search=important_search,
            _estimator_type='regressor')

    def _more_tags(self):
        return {"poor_score": True}

    def predict(self, X):
        r"""
        Predict on given data.

        Parameters
        ----------
        X : array-like, shape(n_samples, p_features)
            Sample matrix to be predicted.

        Returns
        -------
        y : array-like, shape(n_samples,)
            Prediction of the mean on X.
        """
        X = new_data_check(self, X)
        intercept_ = np.ones(X.shape[0]) * self.intercept_
        xbeta_exp = np.exp(X.dot(self.coef_) + intercept_)
        return xbeta_exp

    def score(self, X, y):
        r"""
        Given new data, return the :math:`D^2` score.

        Parameters
        ----------
        X : array-like, shape(n_samples, p_features)
            Sample matrix.
        y : array-like, shape(n_samples,)
            Real response for given X.

        Returns
        -------
        score : float
            :math:`D^2` score.
        """
        X, y = new_data_check(self, X, y)
        # intercept_ = np.ones(X.shape[0]) * self.intercept_
        # eta = X.dot(self.coef_) + intercept_
        # exp_eta = np.exp(eta)
        # return (y * eta - exp_eta).sum()
        y_pred = self.predict(X)
        return d2_tweedie_score(y, y_pred, power=1)


@fix_docs
class MultiTaskRegression(bess_base):
    r"""
    Adaptive Best-Subset Selection (ABESS) algorithm for multitask
    learning.

    Parameters
    ----------
    splicing_type: {0, 1}, optional, default=0
        The type of splicing: "0" for decreasing by half, "1" for
        decreasing by one.
    important_search : int, optional, default=128
        The size of the inactive set used when updating the active set
        during splicing. It should be a non-negative integer; if
        important_search=0, it is set to the size of the whole inactive
        set.

    Examples
    --------
    >>> ### Sparsity known
    >>>
    >>> from abess.linear import MultiTaskRegression
    >>> from abess.datasets import make_multivariate_glm_data
    >>> import numpy as np
    >>> np.random.seed(12345)
    >>> data = make_multivariate_glm_data(
    ...     n = 100, p = 50, k = 10, M = 3, family = 'multigaussian')
    >>> model = MultiTaskRegression(support_size = 10)
    >>> model.fit(data.x, data.y)
    MultiTaskRegression(always_select=[], support_size=10)
    >>> model.predict(data.x)[:5, ]
    array([[1., 0., 0.],
           [0., 0., 1.],
           [1., 0., 0.],
           [1., 0., 0.],
           [0., 0., 1.]])

    >>> ### Sparsity unknown
    >>>
    >>> # path_type="seq"
    >>> model = MultiTaskRegression(path_type = "seq")
    >>> model.fit(data.x, data.y)
    MultiTaskRegression(always_select=[])
    >>> model.predict(data.x)[:5, ]
    array([[1., 0., 0.],
           [0., 0., 1.],
           [1., 0., 0.],
           [1., 0., 0.],
           [0., 0., 1.]])
    >>>
    >>> # path_type="gs"
    >>> model = MultiTaskRegression(path_type="gs")
    >>> model.fit(data.x, data.y)
    MultiTaskRegression(always_select=[], path_type='gs')
    >>> model.predict(data.x)[:5, ]
    array([[1., 0., 0.],
           [0., 0., 1.],
           [1., 0., 0.],
           [1., 0., 0.],
           [0., 0., 1.]])
    """

    def __init__(self, max_iter=20, exchange_num=5, path_type="seq",
                 is_warm_start=True, support_size=None, alpha=None,
                 s_min=None, s_max=None, ic_type="ebic", ic_coef=1.0,
                 cv=1, screening_size=-1, always_select=None,
                 thread=1, covariance_update=False, sparse_matrix=False,
                 splicing_type=0, important_search=128):
        super().__init__(
            algorithm_type="abess", model_type="Multigaussian",
            normalize_type=1, path_type=path_type, max_iter=max_iter,
            exchange_num=exchange_num, is_warm_start=is_warm_start,
            support_size=support_size, alpha=alpha, s_min=s_min, s_max=s_max,
            ic_type=ic_type, ic_coef=ic_coef, cv=cv,
            screening_size=screening_size, always_select=always_select,
            thread=thread, covariance_update=covariance_update,
            sparse_matrix=sparse_matrix, splicing_type=splicing_type,
            important_search=important_search,
            _estimator_type='regressor')

    def _more_tags(self):
        return {'multioutput': True, 'multioutput_only': True}

    def predict(self, X):
        r"""
        Predict the mean of each response on given data.

        Parameters
        ----------
        X : array-like, shape(n_samples, p_features)
            Sample matrix to be predicted.

        Returns
        -------
        y : array-like, shape(n_samples, M_responses)
            Prediction of the mean of each response on given X.
            Each column indicates one response.
        """
        X = new_data_check(self, X)
        intercept_ = np.repeat(
            self.intercept_[np.newaxis, ...], X.shape[0], axis=0)
        y_pred = X.dot(self.coef_) + intercept_
        if len(y_pred.shape) == 1:
            y_pred = y_pred[:, np.newaxis]
        return y_pred

    def score(self, X, y):
        r"""
        Given new data, return the coefficient of determination.

        Parameters
        ----------
        X : array-like, shape(n_samples, p_features)
            Sample matrix.
        y : array-like, shape(n_samples, M_responses)
            Real responses for given X.

        Returns
        -------
        score : float
            :math:`R^2` score.
        """
        X, y = new_data_check(self, X, y)
        y_pred = self.predict(X)
        # return -((y - y_pred) * (y - y_pred)).sum()
        return r2_score(y, y_pred)


@fix_docs
class MultinomialRegression(bess_base):
    r"""
    Adaptive Best-Subset Selection (ABESS) algorithm for the multiclass
    classification problem.

    Parameters
    ----------
    splicing_type: {0, 1}, optional, default=0
        The type of splicing: "0" for decreasing by half, "1" for
        decreasing by one.
    important_search : int, optional, default=128
        The size of the inactive set used when updating the active set
        during splicing. It should be a non-negative integer; if
        important_search=0, it is set to the size of the whole inactive
        set.

    Examples
    --------
    >>> ### Sparsity known
    >>>
    >>> from abess.linear import MultinomialRegression
    >>> from abess.datasets import make_multivariate_glm_data
    >>> import numpy as np
    >>> np.random.seed(12345)
    >>> data = make_multivariate_glm_data(
    ...     n = 100, p = 50, k = 10, M = 3, family = 'multinomial')
    >>> model = MultinomialRegression(support_size = 10)
    >>> model.fit(data.x, data.y)
    MultinomialRegression(always_select=[], support_size=10)
    >>> model.predict(data.x)[0:10, ]
    array([1, 0, 0, 0, 1, 1, 1, 2, 1, 2])

    >>> ### Sparsity unknown
    >>>
    >>> # path_type="seq"
    >>> model = MultinomialRegression(path_type = "seq")
    >>> model.fit(data.x, data.y)
    MultinomialRegression(always_select=[])
    >>> model.predict(data.x)[0:10, ]
    array([1, 2, 0, 0, 1, 1, 1, 2, 1, 2])
    >>>
    >>> # path_type="gs"
    >>> model = MultinomialRegression(path_type="gs")
    >>> model.fit(data.x, data.y)
    MultinomialRegression(always_select=[], path_type='gs')
    >>> model.predict(data.x)[0:10, ]
    array([1, 2, 0, 0, 1, 1, 1, 2, 1, 2])
    """

    def __init__(self, max_iter=20, exchange_num=5, path_type="seq",
                 is_warm_start=True, support_size=None, alpha=None,
                 s_min=None, s_max=None, ic_type="ebic", ic_coef=1.0,
                 cv=1, screening_size=-1, always_select=None,
                 primary_model_fit_max_iter=10,
                 primary_model_fit_epsilon=1e-8,
                 # approximate_Newton=False,
                 thread=1, sparse_matrix=False,
                 splicing_type=0, important_search=128):
        super().__init__(
            algorithm_type="abess", model_type="Multinomial",
            normalize_type=2, path_type=path_type, max_iter=max_iter,
            exchange_num=exchange_num, is_warm_start=is_warm_start,
            support_size=support_size, alpha=alpha, s_min=s_min, s_max=s_max,
            ic_type=ic_type, ic_coef=ic_coef, cv=cv,
            screening_size=screening_size, always_select=always_select,
            primary_model_fit_max_iter=primary_model_fit_max_iter,
            primary_model_fit_epsilon=primary_model_fit_epsilon,
            approximate_Newton=True, thread=thread,
            sparse_matrix=sparse_matrix, splicing_type=splicing_type,
            important_search=important_search,
            _estimator_type='classifier')

    def _more_tags(self):
        return {'multilabel': False,
                # 'multioutput_only': True,
                'no_validation': True,
                'poor_score': True}

    def predict_proba(self, X):
        r"""
        Give the probabilities of new samples being assigned to the
        different classes.

        Parameters
        ----------
        X : array-like, shape(n_samples, p_features)
            Sample matrix to be predicted.

        Returns
        -------
        proba : array-like, shape(n_samples, M_responses)
            Returns the probability of the given samples for each class.
            Each column indicates one class.
        """
        X = new_data_check(self, X)
        intercept_ = np.repeat(
            self.intercept_[np.newaxis, ...], X.shape[0], axis=0)
        xbeta = X.dot(self.coef_) + intercept_
        eta = np.exp(xbeta)
        pr = np.zeros_like(xbeta)
        for i in range(X.shape[0]):
            pr[i, :] = eta[i, :] / np.sum(eta[i, :])
        return pr
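
    # Note: the per-sample loop above is the softmax normalization and is
    # equivalent to the vectorized form
    #   pr = eta / eta.sum(axis=1, keepdims=True)
    # which avoids Python-level iteration over samples.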

    def predict(self, X):
        r"""
        Return the most probable class for given data.

        Parameters
        ----------
        X : array-like, shape(n_samples, p_features)
            Sample matrix to be predicted.

        Returns
        -------
        y : array-like, shape(n_samples,)
            Predicted class label for each sample in X.
        """
        X = new_data_check(self, X)
        intercept_ = np.repeat(
            self.intercept_[np.newaxis, ...], X.shape[0], axis=0)
        xbeta = X.dot(self.coef_) + intercept_
        max_item = np.argmax(xbeta, axis=1)
        # y_pred = np.zeros_like(xbeta)
        # for i in range(X.shape[0]):
        #     y_pred[i, max_item[i]] = 1
        cl = getattr(self, "classes_", np.arange(self.coef_.shape[1]))
        return cl[max_item]

    def score(self, X, y):
        """
        Given new data, return the mean prediction accuracy.

        Parameters
        ----------
        X : array-like, shape(n_samples, p_features)
            Test data.
        y : array-like, shape(n_samples,) or shape(n_samples, M_responses)
            Test response, either class labels or dummy variables of the
            real classes.

        Returns
        -------
        score : float
            The mean prediction accuracy.
        """
        X, y = new_data_check(self, X, y)
        # if (len(y.shape) == 1 or y.shape[1] == 1):
        #     y, _ = categorical_to_dummy(y.squeeze())
        # pr = self.predict_proba(X)
        # return np.sum(y * np.log(pr))
        y_real = np.zeros(X.shape[0])
        if (len(y.shape) > 1 and y.shape[1] == self.coef_.shape[1]):
            # if given dummy y
            y_real = np.nonzero(y)[1]
        else:
            y_real = y
        y_pred = self.predict(X)
        return (y_real == y_pred).mean()


@fix_docs
class GammaRegression(bess_base):
    r"""
    Adaptive Best-Subset Selection (ABESS) algorithm for Gamma regression.

    Parameters
    ----------
    splicing_type: {0, 1}, optional, default=0
        The type of splicing: "0" for decreasing by half, "1" for
        decreasing by one.
    important_search : int, optional, default=128
        The size of the inactive set used when updating the active set
        during splicing. It should be a non-negative integer; if
        important_search=0, it is set to the size of the whole inactive
        set.

    Examples
    --------
    >>> ### Sparsity known
    >>>
    >>> from abess.linear import GammaRegression
    >>> from abess.datasets import make_glm_data
    >>> import numpy as np
    >>> np.random.seed(12345)
    >>> data = make_glm_data(n = 100, p = 50, k = 10, family = 'gamma')
    >>> model = GammaRegression(support_size = 10)
    >>> model.fit(data.x, data.y)
    GammaRegression(always_select=[], support_size=10)
    >>> model.predict(data.x)[:4]
    array([1.34510045e+22, 2.34908508e+30, 1.91570199e+21, 1.29563315e+25])

    >>> ### Sparsity unknown
    >>>
    >>> # path_type="seq"
    >>> model = GammaRegression(path_type = "seq")
    >>> model.fit(data.x, data.y)
    GammaRegression(always_select=[])
    >>> model.predict(data.x)[:4]
    array([7.03065424e+19, 7.03065424e+19, 7.03065424e+19, 7.03065424e+19])
    >>>
    >>> # path_type="gs"
    >>> model = GammaRegression(path_type="gs")
    >>> model.fit(data.x, data.y)
    GammaRegression(always_select=[], path_type='gs')
    >>> model.predict(data.x)[:4]
    array([7.03065424e+19, 7.03065424e+19, 7.03065424e+19, 7.03065424e+19])
    """

    def __init__(self, max_iter=20, exchange_num=5, path_type="seq",
                 is_warm_start=True, support_size=None, alpha=None,
                 s_min=None, s_max=None, ic_type="ebic", ic_coef=1.0,
                 cv=1, screening_size=-1, always_select=None,
                 primary_model_fit_max_iter=10,
                 primary_model_fit_epsilon=1e-8,
                 thread=1, sparse_matrix=False,
                 splicing_type=0, important_search=128):
        super().__init__(
            algorithm_type="abess", model_type="Gamma", normalize_type=2,
            path_type=path_type, max_iter=max_iter,
            exchange_num=exchange_num, is_warm_start=is_warm_start,
            support_size=support_size, alpha=alpha, s_min=s_min, s_max=s_max,
            ic_type=ic_type, ic_coef=ic_coef, cv=cv,
            screening_size=screening_size, always_select=always_select,
            primary_model_fit_max_iter=primary_model_fit_max_iter,
            primary_model_fit_epsilon=primary_model_fit_epsilon,
            thread=thread, sparse_matrix=sparse_matrix,
            splicing_type=splicing_type,
            important_search=important_search,
            _estimator_type='regressor')

    def _more_tags(self):
        return {'poor_score': True}

    def predict(self, X):
        r"""
        Predict on given data.

        Parameters
        ----------
        X : array-like, shape(n_samples, p_features)
            Sample matrix to be predicted.

        Returns
        -------
        y : array-like, shape(n_samples,)
            Prediction of the mean on given X.
        """
        X = new_data_check(self, X)
        intercept_ = np.ones(X.shape[0]) * self.intercept_
        xbeta_exp = np.exp(X.dot(self.coef_) + intercept_)
        return xbeta_exp

    def score(self, X, y, weights=None):
        r"""
        Given new data, return the :math:`D^2` score, i.e. the fraction
        of Gamma deviance explained.

        Parameters
        ----------
        X : array-like, shape(n_samples, p_features)
            Sample matrix.
        y : array-like, shape(n_samples,)
            Real response for given X.
        weights : array-like, shape(n_samples,), optional, default=None
            Sample weights. If None, all samples are weighted equally.

        Returns
        -------
        score : float
            :math:`D^2` score.
        """
        if weights is None:
            X = np.array(X)
            weights = np.ones(X.shape[0])
        X, y, weights = new_data_check(self, X, y, weights)

        def deviance(y, y_pred):
            dev = 2 * (np.log(y_pred / y) + y / y_pred - 1)
            return np.sum(weights * dev)

        y_pred = self.predict(X)
        y_mean = np.average(y, weights=weights)
        dev = deviance(y, y_pred)
        dev_null = deviance(y, y_mean)
        return 1 - dev / dev_null
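
    # The value returned above is the fraction of Gamma deviance explained,
    #   D^2 = 1 - dev(y, y_pred) / dev(y, y_mean),
    # i.e. the Gamma analogue of ``d2_tweedie_score(y, y_pred, power=2)``.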


@fix_docs
class OrdinalRegression(bess_base):
    r"""
    Adaptive Best-Subset Selection (ABESS) algorithm for the ordinal
    regression problem.

    Parameters
    ----------
    splicing_type: {0, 1}, optional, default=0
        The type of splicing: "0" for decreasing by half, "1" for
        decreasing by one.
    important_search : int, optional, default=128
        The size of the inactive set used when updating the active set
        during splicing. It should be a non-negative integer; if
        important_search=0, it is set to the size of the whole inactive
        set.

    Examples
    --------
    >>> ### Sparsity known
    >>>
    >>> from abess.linear import OrdinalRegression
    >>> from abess.datasets import make_glm_data
    >>> import numpy as np
    >>> np.random.seed(12345)
    >>> data = make_glm_data(n = 1000, p = 50, k = 10, family = 'ordinal')
    >>> print(np.nonzero(data.coef_)[0])
    [ 0  4 10 14 26 29 34 38 47 48]
    >>> model = OrdinalRegression(support_size = 10)
    >>> model.fit(data.x, data.y)
    classes: [0. 1. 2.]
    OrdinalRegression(support_size=10)
    >>> print(np.nonzero(model.coef_)[0])
    [ 0  4 10 14 26 29 38 40 47 48]

    >>> ### Sparsity unknown
    >>>
    >>> # path_type="seq"
    >>> model = OrdinalRegression(path_type = "seq")
    >>> model.fit(data.x, data.y)
    classes: [0. 1. 2.]
    OrdinalRegression()
    >>> print(np.nonzero(model.coef_)[0])
    [ 0  4  8 10 14 26 29 38 40 47 48]
    >>>
    >>> # path_type="gs"
    >>> model = OrdinalRegression(path_type="gs")
    >>> model.fit(data.x, data.y)
    classes: [0. 1. 2.]
    OrdinalRegression(path_type='gs')
    >>> print(np.nonzero(model.coef_)[0])
    [ 0  4 10 14 26 29 38 47 48]
    """

    def __init__(self, max_iter=20, exchange_num=5, path_type="seq",
                 is_warm_start=True, support_size=None, alpha=None,
                 s_min=None, s_max=None, ic_type="ebic", ic_coef=1.0,
                 cv=1, screening_size=-1, always_select=None,
                 primary_model_fit_max_iter=10,
                 primary_model_fit_epsilon=1e-8,
                 approximate_Newton=False, thread=1, sparse_matrix=False,
                 splicing_type=0, important_search=128):
        super().__init__(
            algorithm_type="abess", model_type="Ordinal", normalize_type=2,
            path_type=path_type, max_iter=max_iter,
            exchange_num=exchange_num, is_warm_start=is_warm_start,
            support_size=support_size, alpha=alpha, s_min=s_min, s_max=s_max,
            ic_type=ic_type, ic_coef=ic_coef, cv=cv,
            screening_size=screening_size, always_select=always_select,
            primary_model_fit_max_iter=primary_model_fit_max_iter,
            primary_model_fit_epsilon=primary_model_fit_epsilon,
            approximate_Newton=approximate_Newton, thread=thread,
            sparse_matrix=sparse_matrix, splicing_type=splicing_type,
            important_search=important_search,
            # _estimator_type="regressor"
            )

    def predict_proba(self, X):
        r"""
        Give the probabilities of new samples being assigned to the
        different classes.

        Parameters
        ----------
        X : array-like, shape(n_samples, p_features)
            Sample matrix to be predicted.

        Returns
        -------
        proba : array-like, shape(n_samples, M_classes)
            Returns the probabilities for each class on given X.
        """
        X = new_data_check(self, X)
        M = len(self.intercept_)
        cdf = (X @ self.coef_)[:, np.newaxis] + self.intercept_
        cdf = 1 / (1 + np.exp(-cdf))
        proba = np.zeros_like(cdf)
        proba[:, 0] = cdf[:, 0]
        proba[:, 1:(M - 1)] = cdf[:, 1:(M - 1)] - cdf[:, 0:(M - 2)]
        proba[:, M - 1] = 1 - cdf[:, M - 1]
        return proba

    def predict(self, X):
        r"""
        Return the most probable class label (starting from 0) for given
        data.

        Parameters
        ----------
        X : array-like, shape(n_samples, p_features)
            Sample matrix to be predicted.

        Returns
        -------
        y : array-like, shape(n_samples,)
            Predicted class labels for samples in X.
        """
        proba = self.predict_proba(X)
        return np.argmax(proba, axis=1)

    # def score(self, X, y):
    #     """
    #     Give new data, and it returns the entropy function.
    #
    #     Parameters
    #     ----------
    #     X : array-like, shape(n_samples, p_features)
    #         Test data.
    #     y : array-like, shape(n_samples, M_responses)
    #         Test response (dummy variables of real class).
    #
    #     Returns
    #     -------
    #     score : float
    #         entropy function
    #     """
    #     X, y = new_data_check(self, X, y)
    #     if len(y.shape) == 1:
    #         y = categorical_to_dummy(y)
    #     return ???

    def score(self, X, y, k=None, sample_weight=None, ignore_ties=False):
        """
        Given new data, return the normalized discounted cumulative gain
        (NDCG).

        Parameters
        ----------
        X : array-like, shape(n_samples, p_features)
            Test data.
        y : array-like, shape(n_samples,)
            Test response (class labels for samples in X).
        k : int, default=None
            Only consider the highest k scores in the ranking.
            If None, use all outputs.
        sample_weight : ndarray of shape (n_samples,), default=None
            If None, all samples are given the same weight.
        ignore_ties : bool, default=False
            Assume that there are no ties in y_pred (which is likely to
            be the case if the predictions are continuous) for
            efficiency gains.

        Returns
        -------
        score : float
            Normalized discounted cumulative gain.
        """
        X, y = new_data_check(self, X, y)
        y_pred = self.predict(X)
        ndcg = ndcg_score(y_true=y.reshape(1, -1),
                          y_score=y_pred.reshape(1, -1),
                          k=k, sample_weight=sample_weight,
                          ignore_ties=ignore_ties)
        return ndcg


class abessLogistic(LogisticRegression):
    warning_msg = ("Class ``abessLogistic`` has been renamed to "
                   "``LogisticRegression``. "
                   "The former will be deprecated in version 0.6.0.")
    __doc__ = warning_msg + '\n' + LogisticRegression.__doc__

    def __init__(self, max_iter=20, exchange_num=5, path_type="seq",
                 is_warm_start=True, support_size=None, alpha=None,
                 s_min=None, s_max=None, ic_type="ebic", ic_coef=1.0,
                 cv=1, screening_size=-1, always_select=None,
                 primary_model_fit_max_iter=10,
                 primary_model_fit_epsilon=1e-8,
                 approximate_Newton=False, thread=1, sparse_matrix=False,
                 splicing_type=0, important_search=128):
        warnings.warn(self.warning_msg, FutureWarning)
        super().__init__(
            path_type=path_type, max_iter=max_iter,
            exchange_num=exchange_num, is_warm_start=is_warm_start,
            support_size=support_size, alpha=alpha, s_min=s_min, s_max=s_max,
            ic_type=ic_type, ic_coef=ic_coef, cv=cv,
            screening_size=screening_size, always_select=always_select,
            primary_model_fit_max_iter=primary_model_fit_max_iter,
            primary_model_fit_epsilon=primary_model_fit_epsilon,
            approximate_Newton=approximate_Newton, thread=thread,
            sparse_matrix=sparse_matrix, splicing_type=splicing_type,
            important_search=important_search)


class abessLm(LinearRegression):
    warning_msg = ("Class ``abessLm`` has been renamed to"
                   " ``LinearRegression``. "
                   "The former will be deprecated in version 0.6.0.")
    __doc__ = warning_msg + '\n' + LinearRegression.__doc__

    def __init__(self, max_iter=20, exchange_num=5, path_type="seq",
                 is_warm_start=True, support_size=None, alpha=None,
                 s_min=None, s_max=None, ic_type="ebic", ic_coef=1.0,
                 cv=1, screening_size=-1, always_select=None,
                 thread=1, covariance_update=False, sparse_matrix=False,
                 splicing_type=0, important_search=128,
                 # primary_model_fit_max_iter=10,
                 # primary_model_fit_epsilon=1e-8,
                 approximate_Newton=False  # kept for compatibility; unused
                 ):
        warnings.warn(self.warning_msg, FutureWarning)
        super().__init__(
            path_type=path_type, max_iter=max_iter,
            exchange_num=exchange_num, is_warm_start=is_warm_start,
            support_size=support_size, alpha=alpha, s_min=s_min, s_max=s_max,
            ic_type=ic_type, ic_coef=ic_coef, cv=cv,
            screening_size=screening_size, always_select=always_select,
            thread=thread, covariance_update=covariance_update,
            sparse_matrix=sparse_matrix, splicing_type=splicing_type,
            important_search=important_search)


class abessCox(CoxPHSurvivalAnalysis):
    warning_msg = ("Class ``abessCox`` has been renamed to "
                   "``CoxPHSurvivalAnalysis``. "
                   "The former will be deprecated in version 0.6.0.")
    __doc__ = warning_msg + '\n' + CoxPHSurvivalAnalysis.__doc__

    def __init__(self, max_iter=20, exchange_num=5, path_type="seq",
                 is_warm_start=True, support_size=None, alpha=None,
                 s_min=None, s_max=None, ic_type="ebic", ic_coef=1.0,
                 cv=1, screening_size=-1, always_select=None,
                 primary_model_fit_max_iter=10,
                 primary_model_fit_epsilon=1e-8,
                 approximate_Newton=False, thread=1, sparse_matrix=False,
                 splicing_type=0, important_search=128):
        warnings.warn(self.warning_msg, FutureWarning)
        super().__init__(
            path_type=path_type, max_iter=max_iter,
            exchange_num=exchange_num, is_warm_start=is_warm_start,
            support_size=support_size, alpha=alpha, s_min=s_min, s_max=s_max,
            ic_type=ic_type, ic_coef=ic_coef, cv=cv,
            screening_size=screening_size, always_select=always_select,
            primary_model_fit_max_iter=primary_model_fit_max_iter,
            primary_model_fit_epsilon=primary_model_fit_epsilon,
            approximate_Newton=approximate_Newton, thread=thread,
            sparse_matrix=sparse_matrix, splicing_type=splicing_type,
            important_search=important_search)


class abessPoisson(PoissonRegression):
    warning_msg = ("Class ``abessPoisson`` has been renamed to "
                   "``PoissonRegression``. "
                   "The former will be deprecated in version 0.6.0.")
    __doc__ = warning_msg + '\n' + PoissonRegression.__doc__

    def __init__(self, max_iter=20, exchange_num=5, path_type="seq",
                 is_warm_start=True, support_size=None, alpha=None,
                 s_min=None, s_max=None, ic_type="ebic", ic_coef=1.0,
                 cv=1, screening_size=-1, always_select=None,
                 primary_model_fit_max_iter=10,
                 primary_model_fit_epsilon=1e-8,
                 thread=1, sparse_matrix=False,
                 splicing_type=0, important_search=128):
        warnings.warn(self.warning_msg, FutureWarning)
        super().__init__(
            path_type=path_type, max_iter=max_iter,
            exchange_num=exchange_num, is_warm_start=is_warm_start,
            support_size=support_size, alpha=alpha, s_min=s_min, s_max=s_max,
            ic_type=ic_type, ic_coef=ic_coef, cv=cv,
            screening_size=screening_size, always_select=always_select,
            primary_model_fit_max_iter=primary_model_fit_max_iter,
            primary_model_fit_epsilon=primary_model_fit_epsilon,
            thread=thread, sparse_matrix=sparse_matrix,
            splicing_type=splicing_type,
            important_search=important_search)


class abessMultigaussian(MultiTaskRegression):
    warning_msg = ("Class ``abessMultigaussian`` has been renamed to "
                   "``MultiTaskRegression``. "
                   "The former will be deprecated in version 0.6.0.")
    __doc__ = warning_msg + '\n' + MultiTaskRegression.__doc__

    def __init__(self, max_iter=20, exchange_num=5, path_type="seq",
                 is_warm_start=True, support_size=None, alpha=None,
                 s_min=None, s_max=None, ic_type="ebic", ic_coef=1.0,
                 cv=1, screening_size=-1, always_select=None,
                 thread=1, covariance_update=False, sparse_matrix=False,
                 splicing_type=0, important_search=128):
        warnings.warn(self.warning_msg, FutureWarning)
        super().__init__(
            path_type=path_type, max_iter=max_iter,
            exchange_num=exchange_num, is_warm_start=is_warm_start,
            support_size=support_size, alpha=alpha, s_min=s_min, s_max=s_max,
            ic_type=ic_type, ic_coef=ic_coef, cv=cv,
            screening_size=screening_size, always_select=always_select,
            thread=thread, covariance_update=covariance_update,
            sparse_matrix=sparse_matrix, splicing_type=splicing_type,
            important_search=important_search)


class abessMultinomial(MultinomialRegression):
    warning_msg = ("Class ``abessMultinomial`` has been renamed to "
                   "``MultinomialRegression``. "
                   "The former will be deprecated in version 0.6.0.")
    __doc__ = warning_msg + '\n' + MultinomialRegression.__doc__

    def __init__(self, max_iter=20, exchange_num=5, path_type="seq",
                 is_warm_start=True, support_size=None, alpha=None,
                 s_min=None, s_max=None, ic_type="ebic", ic_coef=1.0,
                 cv=1, screening_size=-1, always_select=None,
                 primary_model_fit_max_iter=10,
                 primary_model_fit_epsilon=1e-8,
                 # approximate_Newton=False,
                 thread=1, sparse_matrix=False,
                 splicing_type=0, important_search=128):
        warnings.warn(self.warning_msg, FutureWarning)
        super().__init__(
            path_type=path_type, max_iter=max_iter,
            exchange_num=exchange_num, is_warm_start=is_warm_start,
            support_size=support_size, alpha=alpha, s_min=s_min, s_max=s_max,
            ic_type=ic_type, ic_coef=ic_coef, cv=cv,
            screening_size=screening_size, always_select=always_select,
            primary_model_fit_max_iter=primary_model_fit_max_iter,
            primary_model_fit_epsilon=primary_model_fit_epsilon,
            # approximate_Newton=approximate_Newton,
            thread=thread, sparse_matrix=sparse_matrix,
            splicing_type=splicing_type,
            important_search=important_search)


class abessGamma(GammaRegression):
    warning_msg = ("Class ``abessGamma`` has been renamed to "
                   "``GammaRegression``. "
                   "The former will be deprecated in version 0.6.0.")
    __doc__ = warning_msg + '\n' + GammaRegression.__doc__

    def __init__(self, max_iter=20, exchange_num=5, path_type="seq",
                 is_warm_start=True, support_size=None, alpha=None,
                 s_min=None, s_max=None, ic_type="ebic", ic_coef=1.0,
                 cv=1, screening_size=-1, always_select=None,
                 primary_model_fit_max_iter=10,
                 primary_model_fit_epsilon=1e-8,
                 thread=1, sparse_matrix=False,
                 splicing_type=0, important_search=128):
        warnings.warn(self.warning_msg, FutureWarning)
        super().__init__(
            path_type=path_type, max_iter=max_iter,
            exchange_num=exchange_num, is_warm_start=is_warm_start,
            support_size=support_size, alpha=alpha, s_min=s_min, s_max=s_max,
            ic_type=ic_type, ic_coef=ic_coef, cv=cv,
            screening_size=screening_size, always_select=always_select,
            primary_model_fit_max_iter=primary_model_fit_max_iter,
            primary_model_fit_epsilon=primary_model_fit_epsilon,
            thread=thread, sparse_matrix=sparse_matrix,
            splicing_type=splicing_type,
            important_search=important_search)