// Copyright (C) 2016  Davis E. King (davis@dlib.net)
// License: Boost Software License   See LICENSE.txt for the full license.
#undef DLIB_ElASTIC_NET_ABSTRACT_Hh_
#ifdef DLIB_ElASTIC_NET_ABSTRACT_Hh_

#include "../matrix.h"

namespace dlib
{

// ----------------------------------------------------------------------------------------

    class elastic_net
    {
        /*!
            WHAT THIS OBJECT REPRESENTS
                This object is a tool for solving the following optimization problem:

                    min_w:      length_squared(X*w - Y) + ridge_lambda*length_squared(w)
                    such that:  sum(abs(w)) <= lasso_budget

                That is, it solves the elastic net optimization problem.  This object also
                has the special property that you can quickly obtain different solutions
                for different settings of ridge_lambda, lasso_budget, and target Y values.

                This is because a large amount of work is precomputed in the constructor.
                The solver will also remember the previous solution and will use that to
                warm start subsequent invocations.  Therefore, you can efficiently get
                solutions for a wide range of regularization parameters.
                
                
                The particular algorithm used to solve it is described in the paper:
                    Zhou, Quan, et al. "A reduction of the elastic net to support vector
                    machines with an application to gpu computing." arXiv preprint
                    arXiv:1409.1976 (2014).  APA 

                And for the SVM solver sub-component we use the algorithm from:
                    Hsieh, Cho-Jui, et al. "A dual coordinate descent method for large-scale
                    linear SVM." Proceedings of the 25th international conference on Machine
                    learning. ACM, 2008. 
        !*/

    public:

        template <typename EXP>
        explicit elastic_net(
            const matrix_exp<EXP>& XX
        ); 
        /*!
            requires
                - XX.size() != 0
                - XX.nr() == XX.nc()
            ensures
                - #get_epsilon() == 1e-5
                - #get_max_iterations() == 50000
                - This object will not be verbose unless be_verbose() is called.
                - #size() == XX.nc()
                - #have_target_values() == false
                - We interpret XX as trans(X)*X where X is as defined in the objective
                  function discussed above in WHAT THIS OBJECT REPRESENTS.
        !*/

        template <typename EXP1, typename EXP2>
        elastic_net(
            const matrix_exp<EXP1>& XX,
            const matrix_exp<EXP2>& XY
        ); 
        /*!
            requires
                - XX.size() != 0
                - XX.nr() == XX.nc()
                - is_col_vector(XY)
                - XX.nc() == Y.size()
            ensures
                - constructs this object by calling the elastic_net(XX) constructor and
                  then calling this->set_xy(XY).
                - #have_target_values() == true 
                - We interpret XX as trans(X)*X where X is as defined in the objective
                  function discussed above in WHAT THIS OBJECT REPRESENTS.  Similarly, XY
                  should be trans(X)*Y.
        !*/

        long size (
        ) const; 
        /*!
            ensures
                - returns the dimensionality of the data loaded into this object.  That is,
                  how many elements are in the optimal w vector?  This function returns
                  that number.
        !*/

        bool have_target_values (
        ) const;
        /*!
            ensures
                - returns true if set_xy() has been called and false otherwise.
        !*/

        template <typename EXP>
        void set_xy(
            const matrix_exp<EXP>& XY
        );
        /*!
            requires
                - is_col_vector(Y)
                - Y.size() == size()
            ensures
                - #have_target_values() == true
                - Sets the target values of the regression.  Note that we expect the given
                  matrix, XY, to be equal to trans(X)*Y, where X and Y have the definitions
                  discussed above in WHAT THIS OBJECT REPRESENTS.
        !*/

        void set_epsilon(
            double eps
        );
        /*!
            requires
                - eps > 0
            ensures
                - #get_epsilon() == eps
        !*/

        double get_epsilon (
        ) const;
        /*!
            ensures
                - returns the error epsilon that determines when the solver should stop.
                  Smaller values may result in a more accurate solution but take longer to
                  execute.  
        !*/

        unsigned long get_max_iterations (
        ) const; 
        /*!
            ensures
                - returns the maximum number of iterations the optimizer is allowed to run
                  before it is required to stop and return a result.
        !*/

        void set_max_iterations (
            unsigned long max_iter
        );
        /*!
            ensures
                - #get_max_iterations() == max_iter
        !*/

        void be_verbose (
        );
        /*!
            ensures
                - This object will print status messages to standard out so that a 
                  user can observe the progress of the algorithm.
        !*/

        void be_quiet (
        );
        /*!
            ensures
                - this object will not print anything to standard out.
        !*/


        matrix<double,0,1> operator() (
            double ridge_lambda,
            double lasso_budget = std::numeric_limits<double>::infinity()
        );
        /*!
            requires
                - have_target_values() == true
                - ridge_lambda > 0
                - lasso_budget > 0
            ensures
                - Solves the optimization problem described in the WHAT THIS OBJECT
                  REPRESENTS section above and returns the optimal w.
                - The returned vector has size() elements.
                - if (lasso_budget == infinity) then
                    - The lasso constraint is ignored 
        !*/

    };

// ----------------------------------------------------------------------------------------

}

#endif // DLIB_ElASTIC_NET_ABSTRACT_Hh_