dismecpp/pointwise_8h_source.html

 // Copyright (c) 2021, Aalto University, developed by Erik Schultheis

 // All rights reserved.

 //

 // SPDX-License-Identifier: MIT


 #ifndef DISMEC_POINTWISE_H

 #define DISMEC_POINTWISE_H


 #include "objective.h"

 #include "utils/hash_vector.h"

 #include "utils/throw_error.h"


 namespace dismec::objective {

     /**
      * \brief Base class for pointwise regularization functions.
      * \details The objective value is `scale * sum_i f(w_i)`, where the scalar function `f` and its
      * derivative information are supplied by the implementing class through static (CRTP) dispatch.
      * If the regularizer is constructed with `ignore_bias == true`, the last entry of every weight
      * vector is excluded from the sum, and the corresponding output entry is set to zero.
      *
      * \tparam CRTP The implementing class. This base class calls the const member functions
      * `point_wise_value(real_t)`, `point_wise_grad(real_t)` and `point_wise_quad(real_t)` on it,
      * each of which has to return something convertible to `real_t`.
      */
     template<class CRTP>
     class PointWiseRegularizer : public Objective {
     public:
         /**
          * \param scale Common factor applied to all values, gradients and curvature terms.
          * Negative values are rejected in the constructor.
          * \param ignore_bias If true, the last weight is treated as a bias and is not regularized.
          */
         explicit PointWiseRegularizer(real_t scale = 1, bool ignore_bias = false);

         /// The pointwise regularizer can act on arbitrarily sized vectors, so `num_variables() == -1`.
         [[nodiscard]] long num_variables() const noexcept final { return -1; }

         /// Sum of the pointwise values over all regularized weights, multiplied by the scale.
         [[nodiscard]] real_t value_unchecked(const HashVector& location) override;

         /// Writes the product of the (diagonal) curvature at `location` with `direction` into `target`.
         void hessian_times_direction_unchecked(const HashVector& location,
                                                const DenseRealVector& direction,
                                                Eigen::Ref<DenseRealVector> target) override;

         /// Writes the scaled pointwise gradient at `location` into `target`.
         void gradient_unchecked(const HashVector& location, Eigen::Ref<DenseRealVector> target) override;

         /// Writes the scaled pointwise gradient evaluated at the zero vector into `target`.
         void gradient_at_zero_unchecked(Eigen::Ref<DenseRealVector> target) override;

         /// Writes the scaled diagonal curvature terms at `location` into `target`.
         void diag_preconditioner_unchecked(const HashVector& location, Eigen::Ref<DenseRealVector> target) override;

         /// Stores `location` and `direction` for later use by `lookup_on_line()`.
         void project_to_line_unchecked(const HashVector& location, const DenseRealVector& direction) override;

         /// Looks up the value of the objective on the line defined by the last call to project_to_line().
         real_t lookup_on_line(real_t a) override;

         /// Whether the last weight is interpreted as a bias and therefore left out of the regularization.
         [[nodiscard]] bool dont_regularize_bias() const { return m_LastWeightIsBias; }

         /// Returns the common scale factor for the entire regularizer.
         [[nodiscard]] real_t scale() const { return m_Scale; }

     private:
         bool m_LastWeightIsBias = false;    //!< If true, the last weight is excluded from regularization.
         real_t m_Scale = 1.0;               //!< Common scale factor; checked to be non-negative on construction.

         DenseRealVector m_LineStart;        //!< Copy of the location given to `project_to_line_unchecked()`.
         DenseRealVector m_LineDirection;    //!< Copy of the direction given to `project_to_line_unchecked()`.

         /// calls point_wise_value() of the implementing class
         [[nodiscard]] real_t point_wise_value_(real_t x) const {
             return static_cast<const CRTP*>(this)->point_wise_value(x);
         }

         /// calls point_wise_grad() of the implementing class
         [[nodiscard]] real_t point_wise_grad_(real_t x) const {
             return static_cast<const CRTP*>(this)->point_wise_grad(x);
         }

         /// calls point_wise_quad() of the implementing class
         [[nodiscard]] real_t point_wise_quad_(real_t x) const {
             return static_cast<const CRTP*>(this)->point_wise_quad(x);
         }

         /**
          * \brief Number of leading entries of `location` that take part in the regularization.
          * \return `location->size()` if all weights are regularized, and one less if the last weight
          * is a bias. For an empty vector with bias handling enabled, this is `-1`, so that loops of
          * the form `for (long i = 0; i < bound; ++i)` do not execute.
          */
         [[nodiscard]] long get_loop_bound(const HashVector& location) const {
             // Convert to a signed type *before* subtracting: mixing the index with an unsigned
             // literal would wrap around for an empty vector if the index type is narrower than `long`.
             const long num_weights = static_cast<long>(location->size());
             return dont_regularize_bias() ? num_weights - 1 : num_weights;
         }
     };


     template<class T>

     PointWiseRegularizer<T>::PointWiseRegularizer(real_t scale, bool ignore_bias) :

         m_LastWeightIsBias(ignore_bias), m_Scale(scale) {

         if(m_Scale < 0) {

             THROW_EXCEPTION(std::logic_error, "Scale must be non-negative");

         }

     }


     /**
      * \brief Evaluates the regularizer at `location`.
      * \details The pointwise values of all regularized weights are accumulated one after the other,
      * and the common scale factor is applied only once to the finished sum.
      * \return `scale * sum_i point_wise_value(location[i])`, where `i` runs over the regularized weights.
      */
     template<class Derived>
     [[nodiscard]] real_t PointWiseRegularizer<Derived>::value_unchecked(const HashVector& location) {
         const long end = get_loop_bound(location);

         real_t sum_of_terms = 0.0;
         long idx = 0;
         while (idx < end) {
             sum_of_terms += point_wise_value_(location->coeff(idx));
             ++idx;
         }

         // single rescaling at the very end
         return m_Scale * sum_of_terms;
     }


     /**
      * \brief Multiplies the curvature of the regularizer at `location` with `direction`.
      * \details Because every weight contributes independently, the Hessian / quadratic approximation
      * is a diagonal matrix. The matrix-vector product therefore reduces to an element-wise product
      * of the scaled `point_wise_quad` values with the entries of `direction`.
      * \param location Point at which the curvature is evaluated.
      * \param direction Vector the curvature is multiplied with.
      * \param target Receives the result. If the last weight is a bias, the entry directly after the
      * regularized weights is set to zero.
      */
     template<class Derived>
     void PointWiseRegularizer<Derived>::hessian_times_direction_unchecked(
             const HashVector& location,
             const DenseRealVector& direction,
             Eigen::Ref<DenseRealVector> target) {
         const long regularized_end = get_loop_bound(location);

         for (long idx = 0; idx < regularized_end; ++idx) {
             const real_t weight = location->coeff(idx);
             const real_t step = direction.coeff(idx);
             target.coeffRef(idx) = m_Scale * point_wise_quad_(weight) * step;
         }

         // The bias (if any) sits right behind the regularized weights and gets no contribution.
         if (dont_regularize_bias()) {
             target.coeffRef(regularized_end) = real_t{0};
         }
     }


     /**
      * \brief Computes the gradient of the regularizer at `location`.
      * \param location Point at which the gradient is evaluated.
      * \param target Receives `scale * point_wise_grad(location[i])` for each regularized weight.
      * If the last weight is a bias, the last entry of `target` is set to zero.
      */
     template<class Derived>
     void PointWiseRegularizer<Derived>::gradient_unchecked(const HashVector& location, Eigen::Ref<DenseRealVector> target) {
         const long regularized_end = get_loop_bound(location);

         // one independent derivative per regularized weight
         for (long idx = 0; idx < regularized_end; ++idx) {
             const real_t weight = location->coeff(idx);
             target.coeffRef(idx) = m_Scale * point_wise_grad_(weight);
         }

         // an unregularized bias does not contribute to the gradient
         if (dont_regularize_bias()) {
             const auto bias_index = target.size() - 1;
             target.coeffRef(bias_index) = real_t{0};
         }
     }


     /**
      * \brief Computes the gradient of the regularizer at the zero vector.
      * \details All weights are equal at the origin, so the pointwise gradient is evaluated a single
      * time and the scaled result is broadcast over the whole of `target`.
      * \param target Receives the gradient. If the last weight is a bias, the last entry is
      * overwritten with zero afterwards.
      */
     template<class Derived>
     void PointWiseRegularizer<Derived>::gradient_at_zero_unchecked(Eigen::Ref<DenseRealVector> target) {
         // evaluate once, fill everywhere
         target.setConstant(point_wise_grad_(real_t{0}) * m_Scale);

         // an unregularized bias does not contribute to the gradient
         if (dont_regularize_bias()) {
             const auto bias_index = target.size() - 1;
             target.coeffRef(bias_index) = real_t{0};
         }
     }


     /**
      * \brief Computes the diagonal of the curvature of the regularizer at `location`.
      * \details This mirrors `hessian_times_direction_unchecked`, except that the scaled
      * `point_wise_quad` values are stored directly instead of being multiplied with a direction.
      * \param location Point at which the curvature is evaluated.
      * \param target Receives the diagonal entries. If the last weight is a bias, the last entry of
      * `target` is set to zero.
      */
     template<class Derived>
     void PointWiseRegularizer<Derived>::diag_preconditioner_unchecked(
             const HashVector& location,
             Eigen::Ref<DenseRealVector> target) {
         const long regularized_end = get_loop_bound(location);

         for (long idx = 0; idx < regularized_end; ++idx) {
             const real_t weight = location->coeff(idx);
             target.coeffRef(idx) = m_Scale * point_wise_quad_(weight);
         }

         // an unregularized bias has no curvature contribution
         if (dont_regularize_bias()) {
             const auto bias_index = target.size() - 1;
             target.coeffRef(bias_index) = real_t{0};
         }
     }


     /**
      * \brief Prepares a line search along `location + a * direction`.
      * \details No computation happens here: both arguments are merely copied into member variables,
      * from which `lookup_on_line` reads them later.
      * \param location Starting point of the line.
      * \param direction Direction of the line.
      */
     template<class Derived>
     void PointWiseRegularizer<Derived>::project_to_line_unchecked(const HashVector& location, const DenseRealVector& direction) {
         // remember the line; evaluation is deferred to `lookup_on_line`
         m_LineDirection = direction;
         m_LineStart = location.get();
     }


     /**
      * \brief Looks up the value of the objective on the line defined by the last call to project_to_line().
      * \details This is the same computation as `value_unchecked`, only that the weights are the
      * interpolated positions `start[i] + a * direction[i]` of the stored line.
      * \param a Position along the stored line direction.
      * \return `scale * sum_i point_wise_value(start[i] + a * direction[i])`, where `i` runs over the
      * regularized weights, i.e. the last entry is skipped if it is a bias.
      */
     template<class T>
     real_t PointWiseRegularizer<T>::lookup_on_line(real_t a) {
         real_t result = 0.0;

         // Make sure we sum over the correct subset. The size is converted to a signed type *before*
         // subtracting: mixing the index with an unsigned literal would wrap around for an empty
         // vector if the index type is narrower than `long`.
         const long num_weights = static_cast<long>(m_LineStart.size());
         const long loop_bound = dont_regularize_bias() ? num_weights - 1 : num_weights;

         for (long i = 0; i < loop_bound; ++i) {
             result += point_wise_value_(m_LineStart.coeff(i) + a * m_LineDirection.coeff(i));
         }

         // single rescaling at the very end
         return m_Scale * result;
     }


 }


 #endif //DISMEC_POINTWISE_H

dismec::HashVector
An Eigen vector with versioning information, to implement simple caching of results.
Definition: hash_vector.h:43

dismec::HashVector::get
const DenseRealVector & get() const
Gets a constant reference to the data of this vector.
Definition: hash_vector.h:57

dismec::objective::Objective
Class that models an optimization objective.
Definition: objective.h:41

dismec::objective::PointWiseRegularizer
Base class for pointwise regularization functions.
Definition: pointwise.h:39

dismec::objective::PointWiseRegularizer::m_LastWeightIsBias
bool m_LastWeightIsBias
Definition: pointwise.h:72

dismec::objective::PointWiseRegularizer::gradient_at_zero_unchecked
void gradient_at_zero_unchecked(Eigen::Ref< DenseRealVector > target) override
Definition: pointwise.h:157

dismec::objective::PointWiseRegularizer::dont_regularize_bias
bool dont_regularize_bias() const
Definition: pointwise.h:66

dismec::objective::PointWiseRegularizer::hessian_times_direction_unchecked
void hessian_times_direction_unchecked(const HashVector &location, const DenseRealVector &direction, Eigen::Ref< DenseRealVector > target) override
Definition: pointwise.h:125

dismec::objective::PointWiseRegularizer::m_LineDirection
DenseRealVector m_LineDirection
Definition: pointwise.h:80

dismec::objective::PointWiseRegularizer::PointWiseRegularizer
PointWiseRegularizer(real_t scale=1, bool ignore_bias=false)
Definition: pointwise.h:103

dismec::objective::PointWiseRegularizer::point_wise_grad_
real_t point_wise_grad_(real_t x) const
calls point_wise_grad() of the implementing class
Definition: pointwise.h:88

dismec::objective::PointWiseRegularizer::value_unchecked
real_t value_unchecked(const HashVector &location) override
Definition: pointwise.h:112

dismec::objective::PointWiseRegularizer::get_loop_bound
long get_loop_bound(const HashVector &location) const
Definition: pointwise.h:97

dismec::objective::PointWiseRegularizer::diag_preconditioner_unchecked
void diag_preconditioner_unchecked(const HashVector &location, Eigen::Ref< DenseRealVector > target) override
Definition: pointwise.h:169

dismec::objective::PointWiseRegularizer::gradient_unchecked
void gradient_unchecked(const HashVector &location, Eigen::Ref< DenseRealVector > target) override
Definition: pointwise.h:143

dismec::objective::PointWiseRegularizer::point_wise_value_
real_t point_wise_value_(real_t x) const
calls point_wise_value() of the implementing class
Definition: pointwise.h:83

dismec::objective::PointWiseRegularizer::scale
real_t scale() const
Returns the common scale factor for the entire regularizer.
Definition: pointwise.h:69

dismec::objective::PointWiseRegularizer::m_LineStart
DenseRealVector m_LineStart
Definition: pointwise.h:77

dismec::objective::PointWiseRegularizer::lookup_on_line
real_t lookup_on_line(real_t a) override
Looks up the value of the objective on the line defined by the last call to project_to_line().
Definition: pointwise.h:190

dismec::objective::PointWiseRegularizer::project_to_line_unchecked
void project_to_line_unchecked(const HashVector &location, const DenseRealVector &direction) override
Definition: pointwise.h:183

dismec::objective::PointWiseRegularizer::m_Scale
real_t m_Scale
Definition: pointwise.h:73

dismec::objective::PointWiseRegularizer::num_variables
long num_variables() const noexcept final
The pointwise regularizer can act on arbitrarily sized vectors, so num_variables() == -1.
Definition: pointwise.h:47

dismec::objective::PointWiseRegularizer::point_wise_quad_
real_t point_wise_quad_(real_t x) const
calls point_wise_quad() of the implementing class
Definition: pointwise.h:93

hash_vector.h

dismec::objective
Definition: fwd.h:34

dismec::DenseRealVector
types::DenseVector< real_t > DenseRealVector
Any dense, real-valued vector.
Definition: matrix_types.h:40

dismec::real_t
float real_t
The default type for floating point values.
Definition: config.h:17

objective.h

throw_error.h

THROW_EXCEPTION
#define THROW_EXCEPTION(exception_type,...)
Definition: throw_error.h:16