libslope/slope_8h_source.html

#pragma once


#include "logger.h"

#include "screening.h"

#include "slope_fit.h"

#include "slope_path.h"

#include "solvers/hybrid_cd.h"

#include "timer.h"

#include <Eigen/Core>

#include <Eigen/SparseCore>

#include <cassert>

#include <optional>


namespace slope {


/// The SLOPE model.
///
/// Holds the configuration used when fitting (solver, loss, normalization,
/// tolerances, iteration limits, ...) together with the centers and scales
/// used to normalize the design matrix. Most setters, as well as path() and
/// fit(), are only declared here; relax() is defined inline below.
class Slope
{
public:
  Slope() = default;

  /// Sets the numerical solver used to fit the model.
  void setSolver(const std::string& solver);

  /// Sets the intercept flag.
  void setIntercept(bool intercept);

  /// Sets normalization type for the design matrix.
  void setNormalization(const std::string& type);

  /// Sets the update clusters flag.
  void setUpdateClusters(bool update_clusters);

  /// Sets the return clusters flag.
  void setReturnClusters(const bool return_clusters);

  /// Sets the alpha min ratio.
  void setAlphaMinRatio(double alpha_min_ratio);

  /// Sets the alpha type.
  void setAlphaType(const std::string& alpha_type);

  /// Sets the learning rate decrement.
  void setLearningRateDecr(double learning_rate_decr);

  /// Sets the q value.
  void setQ(double q);

  /// Sets OSCAR parameters.
  void setOscarParameters(const double theta1, const double theta2);

  /// Sets the tolerance value.
  void setTol(double tol);

  /// Sets the tolerance value for the relaxed SLOPE solver.
  void setRelaxTol(double tol);

  /// Sets the maximum number of outer (IRLS) iterations for the relaxed
  /// solver.
  void setRelaxMaxOuterIterations(int max_it);

  /// Sets the maximum number of inner iterations for the relaxed solver.
  void setRelaxMaxInnerIterations(int max_it);

  /// Sets the maximum number of iterations.
  void setMaxIterations(int max_it);

  /// Sets the path length.
  void setPathLength(int path_length);

  /// Sets the frequency of proximal gradient descent steps.
  void setHybridCdIterations(int cd_iterations);

  /// Sets the lambda type for regularization weights.
  void setLambdaType(const std::string& lambda_type);

  /// Sets the loss function type.
  void setLoss(const std::string& loss_type);

  /// Sets the type of feature screening used, which discards predictors that
  /// are unlikely to be active.
  void setScreening(const std::string& screening_type);

  /// Controls if x should be modified-in-place.
  void setModifyX(const bool modify_x);

  /// Sets tolerance in deviance change for early stopping.
  void setDevChangeTol(const double dev_change_tol);

  /// Sets the deviance-ratio tolerance for early stopping.
  // NOTE(review): exact stopping rule lives in slope.cpp -- confirm wording.
  void setDevRatioTol(const double dev_ratio_tol);

  /// Sets the maximum number of clusters.
  void setMaxClusters(const int max_clusters);

  /// Sets the centering type.
  void setCentering(const std::string& type);

  /// Sets the center points for feature normalization.
  void setCentering(const Eigen::VectorXd& x_centers);

  /// Sets the scaling type.
  void setScaling(const std::string& type);

  /// Toggles collection of diagnostics.
  void setDiagnostics(const bool collect_diagnostics);

  /// Sets the scales for feature normalization.
  // NOTE(review): presumably the vector counterpart of setScaling(type);
  // the definition is not visible from this header.
  void setScaling(const Eigen::VectorXd& x_scales);

  /// Sets the maximum number of iterations for the alpha estimation
  /// procedure.
  void setAlphaEstimationMaxIterations(const int alpha_est_maxit);

  /// Gets the maximum number of iterations allowed for the alpha estimation
  /// procedure.
  int getAlphaEstimationMaxIterations() const;

  /// Returns the intercept flag.
  bool getFitIntercept() const;

  /// Get currently defined loss type.
  // NOTE(review): not const-qualified although it looks like a pure getter;
  // changing that requires touching the definition in slope.cpp.
  const std::string& getLossType();

  /// Computes SLOPE regression solution path for multiple alpha and lambda
  /// values.
  ///
  /// @param x Design matrix.
  /// @param y_in Response.
  /// @param alpha Sequence of alpha values; defaults to an empty array.
  /// @param lambda Sequence of lambda values; defaults to an empty array.
  /// @return The fitted path.
  template<typename T>
  SlopePath path(T& x,
                 const Eigen::MatrixXd& y_in,
                 Eigen::ArrayXd alpha = Eigen::ArrayXd::Zero(0),
                 Eigen::ArrayXd lambda = Eigen::ArrayXd::Zero(0));

  /// Fits a single SLOPE regression model for given alpha and lambda values.
  ///
  /// @param x Design matrix.
  /// @param y_in Response.
  /// @param alpha Alpha value (default 1.0).
  /// @param lambda Lambda values; defaults to an empty array.
  /// @return The fitted model.
  template<typename T>
  SlopeFit fit(T& x,
               const Eigen::MatrixXd& y_in,
               const double alpha = 1.0,
               Eigen::ArrayXd lambda = Eigen::ArrayXd::Zero(0));

  /// Relaxes a fitted SLOPE model.
  ///
  /// Re-estimates the coefficients with an all-zero lambda sequence while
  /// keeping the clusters of @p fit fixed, using an outer IRLS loop (at most
  /// `max_it_outer_relax` iterations) around coordinate descent passes (at
  /// most `max_it_inner_relax` per outer iteration). Both loops stop early
  /// once the relevant gradient measure drops below `tol_relax`.
  ///
  /// @param fit Previously fitted model supplying the clusters, the null
  ///   deviance and (unless overridden) the starting values.
  /// @param x Design matrix; passed to normalize(), which receives the
  ///   `modify_x` flag.
  /// @param y_in Response.
  /// @param gamma Mixing weight. When positive, the returned coefficients are
  ///   `(1 - gamma) * relaxed + gamma * original`.
  /// @param beta0 Warm start for the intercepts; taken from @p fit when empty.
  /// @param beta Warm start for the coefficients; taken from @p fit when
  ///   empty.
  /// @return The relaxed fit, stored with alpha = 0 and an all-zero lambda.
  template<typename T>
  SlopeFit relax(const SlopeFit& fit,
                 T& x,
                 const Eigen::VectorXd& y_in,
                 const double gamma = 0.0,
                 Eigen::VectorXd beta0 = Eigen::VectorXd(0),
                 Eigen::VectorXd beta = Eigen::VectorXd(0))
  {
    using Eigen::MatrixXd;
    using Eigen::VectorXd;

    const int n = x.rows();
    const int p = x.cols();

    // Fall back to the (normalized-scale) estimates of the supplied fit when
    // no warm starts were given.
    if (beta0.size() == 0) {
      beta0 = fit.getIntercepts(false);
    }

    if (beta.size() == 0) {
      beta = fit.getCoefs(false);
    }

    // The relaxed problem carries no penalty, so alpha is reported as zero.
    const double alpha = 0;

    Timer timer;

    std::vector<double> primals, duals, time;
    timer.start();

    auto jit_normalization =
      normalize(x, x_centers, x_scales, centering_type, scaling_type, modify_x);

    // Clusters are taken from the original fit and must stay fixed, so the
    // member flag of the same purpose is deliberately not used here.
    const bool update_clusters_relax = false;

    std::unique_ptr<Loss> loss = setupLoss(this->loss_type);

    MatrixXd y = loss->preprocessResponse(y_in);

    const int m = y.cols();

    // All-zero penalty weights: coordinate descent runs unpenalized.
    Eigen::ArrayXd lambda_relax = Eigen::ArrayXd::Zero(p * m);

    auto working_set = activeSet(beta);

    Eigen::MatrixXd eta = linearPredictor(x,
                                          working_set,
                                          beta0,
                                          beta,
                                          x_centers,
                                          x_scales,
                                          jit_normalization,
                                          intercept);

    VectorXd residual(n);
    VectorXd working_residual(n);

    VectorXd w = VectorXd::Ones(n);
    VectorXd w_ones = VectorXd::Ones(n);
    VectorXd z = y;

    Clusters clusters = fit.getClusters();

    int passes = 0;
    bool converged = false;

    for (int irls_it = 0; irls_it < max_it_outer_relax; irls_it++) {
      residual = loss->residual(eta, y);

      if (collect_diagnostics) {
        primals.push_back(loss->loss(eta, y));
        duals.push_back(0.0);
        time.push_back(timer.elapsed());
      }

      // Convergence is judged on the cluster-level gradient computed with
      // unit weights.
      Eigen::VectorXd cluster_gradient = clusterGradient(beta,
                                                         residual,
                                                         clusters,
                                                         x,
                                                         w_ones,
                                                         x_centers,
                                                         x_scales,
                                                         jit_normalization);

      const double norm_grad = cluster_gradient.lpNorm<Eigen::Infinity>();

      if (norm_grad < tol_relax) {
        converged = true;
        break;
      }

      loss->updateWeightsAndWorkingResponse(w, z, eta, y);
      working_residual = eta - z;

      for (int inner_it = 0; inner_it < max_it_inner_relax; ++inner_it) {
        passes++;

        const double max_abs_gradient =
          coordinateDescent(beta0,
                            beta,
                            working_residual,
                            clusters,
                            lambda_relax,
                            x,
                            w,
                            x_centers,
                            x_scales,
                            intercept,
                            jit_normalization,
                            update_clusters_relax);

        if (max_abs_gradient < tol_relax) {
          break;
        }
      }

      eta = working_residual + z;
    }

    // The loop index never equals max_it_outer_relax inside the loop body, so
    // exhaustion of the iteration budget has to be detected afterwards.
    if (!converged) {
      WarningLogger::addWarning(WarningCode::MAXIT_REACHED,
                                "Maximum number of IRLS iterations reached.");
    }

    const double dev = loss->deviance(eta, y);

    if (gamma > 0) {
      // Blend the relaxed coefficients with those of the original fit.
      // NOTE(review): the intercept (beta0) and the deviance computed above
      // are not blended -- confirm whether that is intended.
      Eigen::VectorXd old_coefs = fit.getCoefs(false);
      beta = (1 - gamma) * beta + gamma * old_coefs;
    }

    SlopeFit fit_out{ beta0,
                      beta.reshaped(p, m).sparseView(),
                      clusters,
                      alpha,
                      lambda_relax,
                      dev,
                      fit.getNullDeviance(),
                      primals,
                      duals,
                      time,
                      passes,
                      centering_type,
                      scaling_type,
                      intercept,
                      x_centers,
                      x_scales };

    return fit_out;
  }

  /// Relaxes a fitted SLOPE path.
  ///
  /// Calls the single-fit relax() on every solution in @p path, using the
  /// previous relaxed solution as warm start for the next one. An empty path
  /// yields an empty result.
  ///
  /// @param path Previously fitted path.
  /// @param x Design matrix.
  /// @param y Response.
  /// @param gamma Mixing weight forwarded to the single-fit relax().
  /// @return A path built from the relaxed fits.
  template<typename T>
  SlopePath relax(const SlopePath& path,
                  T& x,
                  const Eigen::VectorXd& y,
                  const double gamma = 0.0)
  {
    std::vector<SlopeFit> fits;

    // path(0) below is only valid for a non-empty path.
    if (path.size() == 0) {
      return fits;
    }

    fits.reserve(path.size());

    Eigen::VectorXd beta0 = path(0).getIntercepts(false);
    Eigen::VectorXd beta = path(0).getCoefs(false);

    for (size_t i = 0; i < path.size(); i++) {
      fits.emplace_back(relax(path(i), x, y, gamma, beta0, beta));

      // Update warm starts
      // TODO: Maybe be more clever about whether to use the
      // previous values or the regularized estimates and warm starts.
      // Maybe just pick the solution with larger coefficients?
      beta0 = fits.back().getIntercepts(false);
      beta = fits.back().getCoefs(false);
    }

    return fits;
  }

private:
  // Parameters (defaults shown; each is changed through the matching setter)
  bool collect_diagnostics = false; // record primals/duals/time in relax()
  bool intercept = true;
  bool modify_x = false; // forwarded to normalize()
  bool return_clusters = true;
  bool update_clusters = false;
  double alpha_min_ratio = -1;
  double dev_change_tol = 1e-5;
  double dev_ratio_tol = 0.999;
  double learning_rate_decr = 0.5;
  double q = 0.1;
  double theta1 = 1.0; // OSCAR parameter
  double theta2 = 0.5; // OSCAR parameter
  double tol = 1e-4;
  double tol_relax = 1e-4; // stopping tolerance used by relax()
  int alpha_est_maxit = 1000;
  int cd_iterations = 10;
  int max_it = 1e4;
  int max_it_inner_relax = 1e5; // coordinate descent passes per IRLS step
  int max_it_outer_relax = 50;  // IRLS iterations in relax()
  int path_length = 100;
  std::optional<int> max_clusters = std::nullopt;
  std::string alpha_type = "path";
  std::string centering_type = "mean";
  std::string lambda_type = "bh";
  std::string loss_type = "quadratic";
  std::string scaling_type = "sd";
  std::string screening_type = "strong";
  std::string solver_type = "auto";

  // Data
  Eigen::VectorXd x_centers; // passed to normalize() by non-const reference
  Eigen::VectorXd x_scales;  // passed to normalize() by non-const reference
};


} // namespace slope

slope::Clusters
Representation of the clusters in SLOPE.
Definition clusters.h:18

slope::SlopeFit
A class representing the results of SLOPE (Sorted L1 Penalized Estimation) fitting.
Definition slope_fit.h:27

slope::SlopeFit::getClusters
const Clusters & getClusters() const
Gets the clusters.
Definition slope_fit.h:151

slope::SlopeFit::getIntercepts
Eigen::VectorXd getIntercepts(const bool original_scale=true) const
Gets the intercept terms for this SLOPE fit.
Definition slope_fit.h:113

slope::SlopeFit::getCoefs
Eigen::SparseMatrix< double > getCoefs(const bool original_scale=true) const
Gets the sparse coefficient matrix for this fit.
Definition slope_fit.h:133

slope::SlopeFit::getNullDeviance
double getNullDeviance() const
Gets the null model deviance.
Definition slope_fit.h:176

slope::SlopePath
Container class for SLOPE regression solution paths.
Definition slope_path.h:31

slope::SlopePath::getIntercepts
std::vector< Eigen::VectorXd > getIntercepts(const bool original_scale=true) const
Returns the vector of intercept terms for each solution in the path.
Definition slope_path.h:74

slope::SlopePath::size
std::size_t size() const
Gets the number of solutions in the path.
Definition slope_path.h:255

slope::SlopePath::getCoefs
std::vector< Eigen::SparseMatrix< double > > getCoefs(const bool original_scale=true) const
Returns the vector of coefficient matrices for each solution in the path.
Definition slope_path.h:96

slope::Slope
The SLOPE model.
Definition slope.h:33

slope::Slope::setSolver
void setSolver(const std::string &solver)
Sets the numerical solver used to fit the model.
Definition slope.cpp:341

slope::Slope::setAlphaMinRatio
void setAlphaMinRatio(double alpha_min_ratio)
Sets the alpha min ratio.
Definition slope.cpp:423

slope::Slope::setMaxIterations
void setMaxIterations(int max_it)
Sets the maximum number of iterations.
Definition slope.cpp:502

slope::Slope::setAlphaEstimationMaxIterations
void setAlphaEstimationMaxIterations(const int alpha_est_maxit)
Sets the maximum number of iterations for the alpha estimation procedure.
Definition slope.cpp:596

slope::Slope::setRelaxMaxInnerIterations
void setRelaxMaxInnerIterations(int max_it)
Sets the maximum number of inner iterations for the relaxed solver.
Definition slope.cpp:493

slope::Slope::path
SlopePath path(T &x, const Eigen::MatrixXd &y_in, Eigen::ArrayXd alpha=Eigen::ArrayXd::Zero(0), Eigen::ArrayXd lambda=Eigen::ArrayXd::Zero(0))
Computes SLOPE regression solution path for multiple alpha and lambda values.
Definition slope.cpp:27

slope::Slope::setDevRatioTol
void setDevRatioTol(const double dev_ratio_tol)
Sets the tolerance on the deviance ratio for early stopping.
Definition slope.cpp:570

slope::Slope::setScaling
void setScaling(const std::string &type)
Sets the scaling type.
Definition slope.cpp:389

slope::Slope::fit
SlopeFit fit(T &x, const Eigen::MatrixXd &y_in, const double alpha=1.0, Eigen::ArrayXd lambda=Eigen::ArrayXd::Zero(0))
Fits a single SLOPE regression model for given alpha and lambda values.
Definition slope.cpp:328

slope::Slope::setDevChangeTol
void setDevChangeTol(const double dev_change_tol)
Sets tolerance in deviance change for early stopping.
Definition slope.cpp:560

slope::Slope::getLossType
const std::string & getLossType()
Get currently defined loss type.
Definition slope.cpp:614

slope::Slope::setReturnClusters
void setReturnClusters(const bool return_clusters)
Sets the return clusters flag.
Definition slope.cpp:410

slope::Slope::setRelaxMaxOuterIterations
void setRelaxMaxOuterIterations(int max_it)
Sets the maximum number of outer (IRLS) iterations for the relaxed solver.
Definition slope.cpp:484

slope::Slope::setMaxClusters
void setMaxClusters(const int max_clusters)
Sets the maximum number of clusters.
Definition slope.cpp:580

slope::Slope::setIntercept
void setIntercept(bool intercept)
Sets the intercept flag.
Definition slope.cpp:348

slope::Slope::getFitIntercept
bool getFitIntercept() const
Returns the intercept flag.
Definition slope.cpp:608

slope::Slope::setDiagnostics
void setDiagnostics(const bool collect_diagnostics)
Toggles collection of diagnostics.
Definition slope.cpp:590

slope::Slope::setNormalization
void setNormalization(const std::string &type)
Sets normalization type for the design matrix.
Definition slope.cpp:354

slope::Slope::relax
SlopeFit relax(const SlopeFit &fit, T &x, const Eigen::VectorXd &y_in, const double gamma=0.0, Eigen::VectorXd beta0=Eigen::VectorXd(0), Eigen::VectorXd beta=Eigen::VectorXd(0))
Relaxes a fitted SLOPE model.
Definition slope.h:373

slope::Slope::getAlphaEstimationMaxIterations
int getAlphaEstimationMaxIterations() const
Gets the maximum number of iterations allowed for the alpha estimation procedure.
Definition slope.cpp:602

slope::Slope::setScreening
void setScreening(const std::string &screening_type)
Sets the type of feature screening used, which discards predictors that are unlikely to be active.
Definition slope.cpp:547

slope::Slope::setOscarParameters
void setOscarParameters(const double theta1, const double theta2)
Sets OSCAR parameters.
Definition slope.cpp:450

slope::Slope::setLambdaType
void setLambdaType(const std::string &lambda_type)
Sets the lambda type for regularization weights.
Definition slope.cpp:529

slope::Slope::setAlphaType
void setAlphaType(const std::string &alpha_type)
Sets the alpha type.
Definition slope.cpp:416

slope::Slope::setModifyX
void setModifyX(const bool modify_x)
Controls if x should be modified-in-place.
Definition slope.cpp:554

slope::Slope::setCentering
void setCentering(const std::string &type)
Sets the centering type for feature normalization.
Definition slope.cpp:375

slope::Slope::Slope
Slope()=default

slope::Slope::setLearningRateDecr
void setLearningRateDecr(double learning_rate_decr)
Sets the learning rate decrement.
Definition slope.cpp:432

slope::Slope::setLoss
void setLoss(const std::string &loss_type)
Sets the loss function type.
Definition slope.cpp:538

slope::Slope::relax
SlopePath relax(const SlopePath &path, T &x, const Eigen::VectorXd &y, const double gamma=0.0)
Relaxes a fitted SLOPE path.
Definition slope.h:533

slope::Slope::setRelaxTol
void setRelaxTol(double tol)
Sets the tolerance value for the relaxed SLOPE solver.
Definition slope.cpp:474

slope::Slope::setPathLength
void setPathLength(int path_length)
Sets the path length.
Definition slope.cpp:511

slope::Slope::setHybridCdIterations
void setHybridCdIterations(int cd_iterations)
Sets the frequency of proximal gradient descent steps.
Definition slope.cpp:520

slope::Slope::setTol
void setTol(double tol)
Sets the tolerance value.
Definition slope.cpp:465

slope::Slope::setQ
void setQ(double q)
Sets the q value.
Definition slope.cpp:441

slope::Slope::setUpdateClusters
void setUpdateClusters(bool update_clusters)
Sets the update clusters flag.
Definition slope.cpp:404

slope::Timer
Timer class for measuring elapsed time with high resolution.
Definition timer.h:19

slope::Timer::start
void start()
Starts the timer by recording the current time point.
Definition timer.cpp:6

slope::Timer::elapsed
double elapsed() const
Returns the elapsed time in seconds since start() was called.
Definition timer.cpp:34

slope::WarningLogger::addWarning
static void addWarning(WarningCode code, const std::string &message)
Log a new warning.
Definition logger.cpp:31

hybrid_cd.h
An implementation of the coordinate descent step in the hybrid algorithm for solving SLOPE.

logger.h
Thread-safe warning logging facility for the slope library.

slope
Namespace containing SLOPE regression implementation.
Definition clusters.cpp:5

slope::coordinateDescent
double coordinateDescent(Eigen::VectorXd &beta0, Eigen::VectorXd &beta, Eigen::VectorXd &residual, Clusters &clusters, const Eigen::ArrayXd &lambda, const T &x, const Eigen::VectorXd &w, const Eigen::VectorXd &x_centers, const Eigen::VectorXd &x_scales, const bool intercept, const JitNormalization jit_normalization, const bool update_clusters)
Definition hybrid_cd.h:188

slope::setupLoss
std::unique_ptr< Loss > setupLoss(const std::string &loss)
Factory function to create the appropriate loss function based on the distribution family.
Definition setup_loss.cpp:10

slope::linearPredictor
Eigen::MatrixXd linearPredictor(const T &x, const std::vector< int > &active_set, const Eigen::VectorXd &beta0, const Eigen::VectorXd &beta, const Eigen::VectorXd &x_centers, const Eigen::VectorXd &x_scales, const JitNormalization jit_normalization, const bool intercept)
Definition math.h:146

slope::normalize
JitNormalization normalize(Eigen::MatrixXd &x, Eigen::VectorXd &x_centers, Eigen::VectorXd &x_scales, const std::string &centering_type, const std::string &scaling_type, const bool modify_x)
Definition normalize.cpp:6

slope::WarningCode::MAXIT_REACHED
@ MAXIT_REACHED
Maximum iterations reached without convergence.

slope::activeSet
std::vector< int > activeSet(const Eigen::VectorXd &beta)
Identifies previously active variables.
Definition screening.cpp:19

screening.h
Screening rules for SLOPE regression optimization.

slope_fit.h
SLOPE (Sorted L-One Penalized Estimation) fitting results.

slope_path.h
Defines the SlopePath class for storing and accessing SLOPE regression solution paths.

timer.h
Simple high-resolution timer class for performance measurements.