Commit 73e55bc

adjusted nonlinear conjugate gradient optimizers (FletcherReevesCG, PolakRibiereCG), NelderMead refactoring. fdapde::matrix redux loop (introduced redux operations: sum(), mean(), prod(), max(), min())

1 parent 9363efe commit 73e55bc

File tree

4 files changed: +223 −252 lines changed


fdaPDE/src/optimization/conjugate_gradient.h

Lines changed: 62 additions & 44 deletions
@@ -21,13 +21,14 @@

 namespace fdapde {

+namespace internals {
+
 // implementation of Conjugate Gradient method for unconstrained nonlinear optimization
-template <int N, typename... Args> class ConjugateGradient {
+template <int N, typename DirectionMethod, typename... Args> class conjugate_gradient_impl {
    private:
-    using vector_t =
-      std::conditional_t<N == Dynamic, Eigen::Matrix<double, Dynamic, 1>, Eigen::Matrix<double, N, 1>>;
+    using vector_t = std::conditional_t<N == Dynamic, Eigen::Matrix<double, Dynamic, 1>, Eigen::Matrix<double, N, 1>>;
     using matrix_t =
-      std::conditional_t<N == Dynamic, Eigen::Matrix<double, Dynamic, Dynamic>, Eigen::Matrix<double, N, N>>;
+      std::conditional_t<N == Dynamic, Eigen::Matrix<double, Dynamic, Dynamic>, Eigen::Matrix<double, N, N>>;

     std::tuple<Args...> callbacks_ {};
     vector_t optimum_;
@@ -36,89 +37,106 @@ template <int N, typename... Args> class ConjugateGradient {
     double tol_;       // tolerance on error before forced stop
     double step_;      // update step
     int n_iter_ = 0;   // current iteration number
-    bool use_polak_ribiere_ = true;   // If set to false, use Fletcher-Reave, else use Polak-Ribière to calculate beta
-
    public:
-    vector_t x_old, x_new, update, dir, grad_old, grad_new;
+    vector_t x_old, x_new, update, grad_old, grad_new;
     double h;
-
     // constructor
-    ConjugateGradient() = default;
-
-    ConjugateGradient(int max_iter, double tol, double step, bool use_polak_ribiere = true)
+    conjugate_gradient_impl() = default;
+    conjugate_gradient_impl(int max_iter, double tol, double step)
         requires(sizeof...(Args) != 0)
-        : max_iter_(max_iter), tol_(tol), step_(step), use_polak_ribiere_(use_polak_ribiere) { }
-
-    ConjugateGradient(int max_iter, double tol, double step, bool use_polak_ribiere, Args&&... callbacks) :
-        callbacks_(std::make_tuple(std::forward<Args>(callbacks)...)), max_iter_(max_iter), tol_(tol), step_(step), use_polak_ribiere_(use_polak_ribiere) { }
-
+        : max_iter_(max_iter), tol_(tol), step_(step) { }
+    conjugate_gradient_impl(int max_iter, double tol, double step, Args&&... callbacks) :
+        callbacks_(std::make_tuple(std::forward<Args>(callbacks)...)), max_iter_(max_iter), tol_(tol), step_(step) { }
     // copy semantic
-    ConjugateGradient(const ConjugateGradient& other) :
-        callbacks_(other.callbacks_), max_iter_(other.max_iter_), tol_(other.tol_), step_(other.step_), use_polak_ribiere_(other.use_polak_ribiere_) { }
-
-    ConjugateGradient& operator=(const ConjugateGradient& other) {
+    conjugate_gradient_impl(const conjugate_gradient_impl& other) :
+        callbacks_(other.callbacks_), max_iter_(other.max_iter_), tol_(other.tol_), step_(other.step_) { }
+    conjugate_gradient_impl& operator=(const conjugate_gradient_impl& other) {
         max_iter_ = other.max_iter_;
         tol_ = other.tol_;
         step_ = other.step_;
         callbacks_ = other.callbacks_;
-        use_polak_ribiere_ = other.use_polak_ribiere_;
         return *this;
     }
-
     template <typename ObjectiveT, typename... Functor>
         requires(sizeof...(Functor) < 2) && ((requires(Functor f, double value) { f(value); }) && ...)
     vector_t optimize(ObjectiveT&& objective, const vector_t& x0, Functor&&... func) {
         fdapde_static_assert(
-            std::is_same<decltype(std::declval<ObjectiveT>().operator()(vector_t())) FDAPDE_COMMA double>::value,
-            INVALID_CALL_TO_OPTIMIZE__OBJECTIVE_FUNCTOR_NOT_ACCEPTING_VECTORTYPE
-        );
-
+          std::is_same<decltype(std::declval<ObjectiveT>().operator()(vector_t())) FDAPDE_COMMA double>::value,
+          INVALID_CALL_TO_OPTIMIZE__OBJECTIVE_FUNCTOR_NOT_ACCEPTING_VECTORTYPE);
         bool stop = false;   // asserted true in case of forced stop
         double error = std::numeric_limits<double>::max();
-        double beta = 0.0;
-        h = step_;
+        DirectionMethod beta;
+        auto grad = objective.gradient();
         n_iter_ = 0;
+        h = step_;
         x_old = x0, x_new = x0;
-        auto grad = objective.gradient();
         grad_old = grad(x_old);
-        dir = -grad_old;
+        update = -grad_old;

         while (n_iter_ < max_iter_ && error > tol_ && !stop) {
-            update = dir;
             stop |= execute_pre_update_step(*this, objective, callbacks_);
-
             // update along descent direction
             x_new = x_old + h * update;
             grad_new = grad(x_new);
             if constexpr (sizeof...(Functor) == 1) { (func(objective(x_old)), ...); }
-            if( use_polak_ribiere_ )
-                beta = grad_new.dot(grad_new - grad_old) / grad_old.dot(grad_old);   // Polak Ribière
-            else
-                beta = grad_new.dot(grad_new) / grad_old.dot(grad_old);   // Fletcher-Reeves
-
-            dir = -grad_new + beta * dir;
-
-            // prepare next iteration
+            // prepare next iteration
+            update = -grad_new + std::max(0.0, beta(*this)) * update;   // update conjugate direction
             error = grad_new.norm();
             stop |=
               (execute_post_update_step(*this, objective, callbacks_) || execute_stopping_criterion(*this, objective));
             x_old = x_new;
             grad_old = grad_new;
-
             n_iter_++;
         }
         optimum_ = x_old;
         value_ = objective(optimum_);
-        if constexpr (sizeof...(Functor) == 1) { (func(value_), ...); }
+        if constexpr (sizeof...(Functor) == 1) { (func(value_), ...); }
         return optimum_;
     }
-
     // getters
     vector_t optimum() const { return optimum_; }
     double value() const { return value_; }
     int n_iter() const { return n_iter_; }
 };

+struct fletcher_reeves_impl {
+    template <typename Opt> double operator()(const Opt& opt) {
+        return opt.grad_new.squaredNorm() / opt.grad_old.squaredNorm();
+    }
+};
+struct polak_ribiere_impl {
+    template <typename Opt> double operator()(const Opt& opt) {
+        return opt.grad_new.dot(opt.grad_new - opt.grad_old) / opt.grad_old.squaredNorm();
+    }
+};
+
+}   // namespace internals
+
+// public CG optimizers
+template <int N, typename... Args>
+class FletcherReevesCG : public internals::conjugate_gradient_impl<N, internals::fletcher_reeves_impl, Args...> {
+   private:
+    using Base = internals::conjugate_gradient_impl<N, internals::fletcher_reeves_impl, Args...>;
+   public:
+    FletcherReevesCG() = default;
+    FletcherReevesCG(int max_iter, double tol, double step)
+        requires(sizeof...(Args) != 0)
+        : Base(max_iter, tol, step) { }
+    FletcherReevesCG(int max_iter, double tol, double step, Args&&... callbacks) :
+        Base(max_iter, tol, step, callbacks...) { }
+};
+
+template <int N, typename... Args>
+class PolakRibiereCG : public internals::conjugate_gradient_impl<N, internals::polak_ribiere_impl, Args...> {
+   private:
+    using Base = internals::conjugate_gradient_impl<N, internals::polak_ribiere_impl, Args...>;
+   public:
+    PolakRibiereCG() = default;
+    PolakRibiereCG(int max_iter, double tol, double step)
+        requires(sizeof...(Args) != 0)
+        : Base(max_iter, tol, step) { }
+    PolakRibiereCG(int max_iter, double tol, double step, Args&&... callbacks) :
+        Base(max_iter, tol, step, callbacks...) { }
+};
+
 } // namespace fdapde

-#endif // __FDAPDE_CONJUGATE_GRADIENT_H__
+#endif   // __FDAPDE_CONJUGATE_GRADIENT_H__
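For reference, the direction-update rules factored out into fletcher_reeves_impl and polak_ribiere_impl are the standard conjugate-gradient beta coefficients. Writing g_k = ∇f(x_k), in LaTeX:

\beta_k^{FR} = \frac{\lVert g_{k+1} \rVert^2}{\lVert g_k \rVert^2},
\qquad
\beta_k^{PR} = \frac{g_{k+1}^\top \,(g_{k+1} - g_k)}{\lVert g_k \rVert^2}

and the loop's update = -grad_new + std::max(0.0, beta(*this)) * update realizes the direction recursion d_{k+1} = -g_{k+1} + \max(0, \beta_k)\, d_k. Clamping beta at zero is the usual PR+ safeguard: whenever beta would turn negative, the method restarts along the steepest-descent direction.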

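A minimal usage sketch of the new public optimizers, based only on the constructor and optimize() signatures visible in this diff. The quadratic objective below, its gradient() accessor, and the chosen parameter values are hypothetical stand-ins, not part of the commit:

#include <Eigen/Dense>

// hypothetical objective f(x) = 0.5 * ||x||^2, exposing the operator() and
// gradient() interface that optimize() requires
struct quadratic {
    double operator()(const Eigen::Vector2d& x) const { return 0.5 * x.squaredNorm(); }
    auto gradient() const {
        return [](const Eigen::Vector2d& x) -> Eigen::Vector2d { return x; };   // ∇f(x) = x
    }
};

int main() {
    // N = 2, no callbacks; max_iter = 500, tol = 1e-7, step = 0.01 are illustrative values
    fdapde::PolakRibiereCG<2> opt(500, 1e-7, 0.01);
    Eigen::Vector2d x0(1.0, -1.0);
    opt.optimize(quadratic(), x0);
    // opt.optimum(), opt.value() and opt.n_iter() expose the result
    return 0;
}

FletcherReevesCG is constructed identically; the two classes differ only in the DirectionMethod policy injected into internals::conjugate_gradient_impl.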
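The fdapde::matrix redux operations named in the commit message (sum(), mean(), prod(), max(), min()) live in one of the other three changed files and are not shown above. For a sense of what such whole-matrix reductions compute, here is a sketch written against Eigen's analogous API for concreteness (Eigen spells the last two maxCoeff() and minCoeff()); it does not exercise the fdapde::matrix API itself:

#include <Eigen/Dense>
#include <iostream>

int main() {
    Eigen::MatrixXd M(2, 2);
    M << 1.0, 2.0,
         3.0, 4.0;
    // whole-matrix reductions, analogous to the redux operations introduced by this commit
    std::cout << M.sum()      << '\n';   // 10   (sum of all coefficients)
    std::cout << M.mean()     << '\n';   // 2.5  (arithmetic mean)
    std::cout << M.prod()     << '\n';   // 24   (product of all coefficients)
    std::cout << M.maxCoeff() << '\n';   // 4    (largest coefficient)
    std::cout << M.minCoeff() << '\n';   // 1    (smallest coefficient)
    return 0;
}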