Commit 00e5312

is_gradient_based_opt_v and is_gradient_free_opt_v concepts, nelder_mead callbacks support, gradient-free optimizers expose x_curr and obj_curr
1 parent 0cfddd2 commit 00e5312

10 files changed (+102 / -213 lines)

fdaPDE/optimization.h

Lines changed: 33 additions & 0 deletions
@@ -24,6 +24,39 @@
 #include "utility.h"
 #include "fields.h"
 
+namespace fdapde {
+
+template <typename Opt> struct is_gradient_based_opt {
+   private:
+    using Opt_ = std::decay_t<Opt>;
+    static constexpr int N = Opt_::static_input_size;
+    using vector_t = std::conditional_t<N == Dynamic, Eigen::Matrix<double, Dynamic, 1>, Eigen::Matrix<double, N, 1>>;
+   public:
+    static constexpr bool value = !Opt_::gradient_free && requires(Opt_ opt) {
+        { opt.x_old    } -> std::convertible_to<vector_t>;
+        { opt.x_new    } -> std::convertible_to<vector_t>;
+        { opt.update   } -> std::convertible_to<vector_t>;
+        { opt.grad_old } -> std::convertible_to<vector_t>;
+        { opt.grad_new } -> std::convertible_to<vector_t>;
+    };
+};
+template <typename Opt> static constexpr bool is_gradient_based_opt_v = is_gradient_based_opt<Opt>::value;
+
+template <typename Opt> struct is_gradient_free_opt {
+   private:
+    using Opt_ = std::decay_t<Opt>;
+    static constexpr int N = Opt_::static_input_size;
+    using vector_t = std::conditional_t<N == Dynamic, Eigen::Matrix<double, Dynamic, 1>, Eigen::Matrix<double, N, 1>>;
+   public:
+    static constexpr bool value = Opt_::gradient_free && requires(Opt_ opt) {
+        { opt.x_curr   } -> std::convertible_to<vector_t>;
+        { opt.obj_curr } -> std::convertible_to<double>;
+    };
+};
+template <typename Opt> static constexpr bool is_gradient_free_opt_v = is_gradient_free_opt<Opt>::value;
+
+}   // namespace fdapde
+
 // callbacks
 #include "src/optimization/callbacks.h"
 #include "src/optimization/backtracking.h"

fdaPDE/src/optimization/backtracking.h

Lines changed: 2 additions & 1 deletion
@@ -21,7 +21,7 @@
 
 namespace fdapde {
 
-// implementation of the backatracking line search method for step selection
+// backtracking line search method for adaptive step size
 class BacktrackingLineSearch {
   private:
    double alpha_, beta_, gamma_;
@@ -32,6 +32,7 @@ class BacktrackingLineSearch {
 
    // backtracking based step search
    template <typename Opt, typename Obj> bool adapt_hook(Opt& opt, Obj& obj) {
+       fdapde_static_assert(is_gradient_based_opt_v<Opt>, THIS_METHOD_IS_FOR_GRADIENT_BASED_OPTIMIZATION_ONLY);
        double alpha = alpha_;   // restore to user defined settings
        double m = opt.grad_old.dot(opt.update);
        if (m < 0) {   // descent direction

fdaPDE/src/optimization/bfgs.h

Lines changed: 2 additions & 0 deletions
@@ -37,6 +37,8 @@ template <int N> class BFGS {
    double tol_;    // tolerance on error before forced stop
    double step_;   // update step
   public:
+   static constexpr bool gradient_free = false;
+   static constexpr int static_input_size = N;
    vector_t x_old, x_new, update, grad_old, grad_new;
    double h;
    // constructor

fdaPDE/src/optimization/conjugate_gradient.h

Lines changed: 2 additions & 0 deletions
@@ -37,6 +37,8 @@ template <int N, typename DirectionUpdate> class conjugate_gradient_impl {
    double tol_;    // tolerance on error before forced stop
    double step_;   // update step
   public:
+   static constexpr bool gradient_free = false;
+   static constexpr int static_input_size = N;
    vector_t x_old, x_new, update, grad_old, grad_new;
    double h;
    // constructor

fdaPDE/src/optimization/gradient_descent.h

Lines changed: 2 additions & 0 deletions
@@ -36,6 +36,8 @@ template <int N> class GradientDescent {
    double tol_;    // tolerance on error before forced stop
    double step_;   // update step
   public:
+   static constexpr bool gradient_free = false;
+   static constexpr int static_input_size = N;
    vector_t x_old, x_new, update, grad_old, grad_new;
    double h;
    // constructor
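
BFGS, conjugate gradient, gradient descent (and LBFGS below) all gain the same two static members, which is exactly what is_gradient_based_opt inspects. A hypothetical third-party optimizer could opt into the same trait machinery by exposing the same surface; a minimal skeleton (state members only, no optimize() logic), assuming fdapde::Dynamic is the sentinel used in the trait definitions, might look like:

// hypothetical optimizer skeleton exposing the members inspected by is_gradient_based_opt
#include <fdaPDE/optimization.h>
#include <Eigen/Dense>
#include <type_traits>

template <int N> struct MyDescent {
    using vector_t = std::conditional_t<N == fdapde::Dynamic, Eigen::Matrix<double, Eigen::Dynamic, 1>,
                                        Eigen::Matrix<double, N, 1>>;
    static constexpr bool gradient_free = false;   // marks the optimizer as gradient-based
    static constexpr int static_input_size = N;    // static problem size (or Dynamic)
    vector_t x_old, x_new, update, grad_old, grad_new;   // state read by line-search callbacks
    double h;                                            // current step size
};
static_assert(fdapde::is_gradient_based_opt_v<MyDescent<2>>);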

fdaPDE/src/optimization/grid_search.h

Lines changed: 19 additions & 22 deletions
@@ -31,13 +31,13 @@ template <int N> class GridSearch {
    std::vector<double> values_;   // explored objective values during optimization
    int size_;
   public:
-   vector_t x_old, x_new;
-   double obj_old, obj_new;
+   static constexpr bool gradient_free = true;
+   static constexpr int static_input_size = N;
+   vector_t x_curr;
+   double obj_curr;
    // constructor
-   GridSearch()
-       requires(N != Dynamic)
-       : size_(N) { }
-   GridSearch(int size) : size_(N == Dynamic ? size : N) { }
+   GridSearch() : size_(N) { fdapde_static_assert(N != Dynamic, THIS_METHOD_IS_FOR_STATIC_SIZED_GRID_SEARCH_ONLY); }
+   GridSearch(int size) : size_(N == Dynamic ? size : N) { fdapde_assert(N == Dynamic || size == N); }
    GridSearch(const GridSearch& other) : size_(other.size_) { }
    GridSearch& operator=(const GridSearch& other) {
        size_ = other.size_;
@@ -61,29 +61,26 @@ template <int N> class GridSearch {
            grid_ = grid_t(grid.data(), grid.rows(), size_);
        }
        bool stop = false;   // asserted true in case of forced stop
-       grid_.row(0).assign_to(x_old);
-       x_new = vector_t::Constant(size_, NaN);
-       obj_old = objective(x_old);
-       obj_new = NaN;
+       grid_.row(0).assign_to(x_curr);
+       obj_curr = objective(x_curr);
        stop |= internals::exec_eval_hooks(*this, objective, callbacks_);
-       values_.push_back(obj_old);
-       if (obj_old < value_) {
-           value_ = obj_old;
-           optimum_ = x_old;
+       values_.push_back(obj_curr);
+       if (obj_curr < value_) {
+           value_ = obj_curr;
+           optimum_ = x_curr;
        }
        // optimize field over supplied grid
        for (std::size_t i = 1; i < grid_.rows() && !stop; ++i) {
-           grid_.row(i).assign_to(x_new);
-           obj_new = objective(x_new);
+           grid_.row(i).assign_to(x_curr);
+           obj_curr = objective(x_curr);
            stop |= internals::exec_eval_hooks(*this, objective, callbacks_);
-           values_.push_back(obj_new);
+           values_.push_back(obj_curr);
            // update minimum if better optimum found
-           if (obj_new < value_) {
-               value_ = obj_new;
-               optimum_ = x_new;
+           if (obj_curr < value_) {
+               value_ = obj_curr;
+               optimum_ = x_curr;
            }
-           obj_old = obj_new;
-           x_old = x_new;
+           stop |= internals::exec_stop_if(*this, objective);
        }
        return optimum_;
    }
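
GridSearch now publishes its running state as x_curr and obj_curr, which is what is_gradient_free_opt checks for and what the evaluation hooks (internals::exec_eval_hooks above) fire on. A hypothetical monitoring callback could read that state at every explored grid point, as in the sketch below; the hook name eval_hook is an assumption inferred from exec_eval_hooks, and the bool return value is again treated as a forced-stop flag.

// hypothetical callback: print the objective at every explored grid point and
// request an early stop once a target value is reached
#include <iostream>

struct PrintEvaluations {
    double target = 1e-6;   // illustrative early-stop threshold
    template <typename Opt, typename Obj> bool eval_hook(Opt& opt, Obj& /* obj */) {
        static_assert(fdapde::is_gradient_free_opt_v<Opt>);   // requires x_curr / obj_curr
        std::cout << "f(" << opt.x_curr.transpose() << ") = " << opt.obj_curr << std::endl;
        return opt.obj_curr < target;   // true requests a forced stop
    }
};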

fdaPDE/src/optimization/lbfgs.h

Lines changed: 2 additions & 181 deletions
@@ -38,6 +38,8 @@ template <int N> class LBFGS {
    int mem_size_ = 10;   // number of vector used for approximating the objective hessian
    Eigen::Matrix<double, Dynamic, Dynamic> grad_mem_, x_mem_;
   public:
+   static constexpr bool gradient_free = false;
+   static constexpr int static_input_size = N;
    vector_t x_old, x_new, update, grad_old, grad_new;
    double h;
    // constructors
@@ -127,184 +129,3 @@ template <int N> class LBFGS {
 } // namespace fdapde
 
 #endif // __FDAPDE_LBFGS_H__
(181 deleted trailing lines not reproduced here: a fully commented-out legacy copy of the LBFGS implementation, including its GPL license header and leftover std::cout debug statements)
