NNFS
Neural network library from scratch
Adagrad.hpp
#pragma once

#include <memory> // std::shared_ptr

#include <Eigen/Dense>
#include "Optimizer.hpp"

namespace NNFS
{
    /**
     * @brief Adagrad optimizer (Adaptive Gradient)
     *
     * Adapts the learning rate of each parameter individually by dividing it
     * by the square root of that parameter's accumulated squared gradients.
     */
    class Adagrad : public Optimizer
    {
    public:
        /**
         * @brief Construct a new Adagrad object
         *
         * @param lr Learning rate
         * @param decay Learning rate decay
         * @param epsilon Small constant added to the denominator to avoid division by zero
         */
        Adagrad(double lr, double decay = 0.0, double epsilon = 1e-7) : Optimizer(lr, decay),
                                                                        _epsilon(epsilon) {}

        /**
         * @brief Update the parameters of the layer
         *
         * @param layer Dense layer whose weights and biases are updated in place
         */
        void update_params(std::shared_ptr<Dense> &layer)
        {
            Eigen::MatrixXd weights = layer->weights();
            Eigen::MatrixXd biases = layer->biases();
            Eigen::MatrixXd dweights = layer->dweights();
            Eigen::MatrixXd dbiases = layer->dbiases();

            // Per-parameter caches of accumulated squared gradients.
            Eigen::MatrixXd weights_cache = layer->weights_optimizer();
            Eigen::MatrixXd biases_cache = layer->biases_optimizer();

            // Accumulate the elementwise square of the current gradients
            // (cwiseAbs2() is the elementwise square for real matrices).
            weights_cache += dweights.cwiseAbs2();
            biases_cache += dbiases.cwiseAbs2();

            // Step each parameter, scaled by the inverse square root of its cache.
            weights += (-_current_lr * dweights.array() / (weights_cache.array().sqrt() + _epsilon)).matrix();
            biases += (-_current_lr * dbiases.array() / (biases_cache.array().sqrt() + _epsilon)).matrix();

            layer->weights_optimizer(weights_cache);
            layer->biases_optimizer(biases_cache);

            layer->weights(weights);
            layer->biases(biases);
        }

    private:
        double _epsilon; // Small constant to avoid division by zero
    };
} // namespace NNFS
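In symbols, update_params applies the standard Adagrad rule to every parameter θ, where g is its current gradient (dweights or dbiases), c is its accumulated cache (weights_optimizer or biases_optimizer), η is the current learning rate _current_lr, and ε is _epsilon:

    c \leftarrow c + g^{2}, \qquad \theta \leftarrow \theta - \frac{\eta\,g}{\sqrt{c} + \epsilon}

Because c only ever grows, each parameter's effective step size shrinks monotonically over the course of training.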
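For context, a minimal sketch of how this optimizer might be driven from a training step. The Dense constructor arguments below are hypothetical (its real signature lives in Dense.hpp, which is not part of this listing), and the forward/backward passes that populate dweights/dbiases are omitted:

#include <memory>
#include "Adagrad.hpp"

int main()
{
    // Hypothetical construction: the real Dense constructor is declared
    // in Dense.hpp, not shown in this file.
    auto layer = std::make_shared<NNFS::Dense>(/* n_input */ 2, /* n_output */ 4);

    // Learning rate 0.01 with a small decay; epsilon keeps its 1e-7 default.
    NNFS::Adagrad optimizer(0.01, /* decay */ 1e-4);

    // ... forward pass and backpropagation fill in layer's dweights/dbiases ...

    // Apply one Adagrad step in place on the layer's weights and biases.
    optimizer.update_params(layer);
}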