Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Gaussian HMC - integration within cooling gaussians and complexity improvements #301

Closed
wants to merge 5 commits into from
Closed
Show file tree
Hide file tree
Changes from 4 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
113 changes: 113 additions & 0 deletions examples/volume_cooling_gaussians_hmc/CMakeLists.txt
Original file line number Diff line number Diff line change
@@ -0,0 +1,113 @@
# VolEsti (volume computation and sampling library)
# Copyright (c) 2012-2021 Vissarion Fisikopoulos
# Copyright (c) 2018-2021 Apostolos Chalkis
# Contributed and/or modified by Marios Papachristou, as part of Google Summer of Code 2020 program.
# Licensed under GNU LGPL.3, see LICENCE file

project( VolEsti )


CMAKE_MINIMUM_REQUIRED(VERSION 3.11)

set(CMAKE_ALLOW_LOOSE_LOOP_CONSTRUCTS true)

if(COMMAND cmake_policy)
cmake_policy(SET CMP0003 NEW)
endif(COMMAND cmake_policy)


option(DISABLE_NLP_ORACLES "Disable non-linear oracles (used in collocation)" ON)

if(DISABLE_NLP_ORACLES)
add_definitions(-DDISABLE_NLP_ORACLES)
else()
find_library(IFOPT NAMES libifopt_core.so PATHS /usr/local/lib)
find_library(IFOPT_IPOPT NAMES libifopt_ipopt.so PATHS /usr/local/lib)
find_library(GMP NAMES libgmp.so PATHS /usr/lib/x86_64-linux-gnu /usr/lib/i386-linux-gnu)
find_library(MPSOLVE NAMES libmps.so PATHS /usr/local/lib)
find_library(PTHREAD NAMES libpthread.so PATHS /usr/lib/x86_64-linux-gnu /usr/lib/i386-linux-gnu)
find_library(FFTW3 NAMES libfftw3.so.3 PATHS /usr/lib/x86_64-linux-gnu /usr/lib/i386-linux-gnu)

if (NOT IFOPT)

message(FATAL_ERROR "This program requires the ifopt library, and will not be compiled.")

elseif (NOT GMP)

message(FATAL_ERROR "This program requires the gmp library, and will not be compiled.")

elseif (NOT MPSOLVE)

message(FATAL_ERROR "This program requires the mpsolve library, and will not be compiled.")

elseif (NOT FFTW3)

message(FATAL_ERROR "This program requires the fftw3 library, and will not be compiled.")

else()
message(STATUS "Library ifopt found: ${IFOPT}")
message(STATUS "Library gmp found: ${GMP}")
message(STATUS "Library mpsolve found: ${MPSOLVE}")
message(STATUS "Library fftw3 found:" ${FFTW3})

endif(NOT IFOPT)

endif(DISABLE_NLP_ORACLES)

include("../../external/cmake-files/Eigen.cmake")
GetEigen()

include("../../external/cmake-files/Boost.cmake")
GetBoost()

include("../../external/cmake-files/LPSolve.cmake")
GetLPSolve()

# Find lpsolve library
find_library(LP_SOLVE NAMES liblpsolve55.so PATHS /usr/lib/lp_solve)

if (NOT LP_SOLVE)
message(FATAL_ERROR "This program requires the lp_solve library, and will not be compiled.")
else ()
message(STATUS "Library lp_solve found: ${LP_SOLVE}")

set(CMAKE_EXPORT_COMPILE_COMMANDS "ON")

include_directories (BEFORE ../../external)
vfisikop marked this conversation as resolved.
Show resolved Hide resolved
include_directories (BEFORE ../../external/minimum_ellipsoid)
include_directories (BEFORE ../../include/generators)
include_directories (BEFORE ../../include/volume)
include_directories (BEFORE ../../include)
include_directories (BEFORE ../../include/lp_oracles)
include_directories (BEFORE ../../include/nlp_oracles)
include_directories (BEFORE ../../include/convex_bodies)
include_directories (BEFORE ../../include/random_walks)
include_directories (BEFORE ../../include/annealing)
include_directories (BEFORE ../../include/ode_solvers)
include_directories (BEFORE ../../include/root_finders)
include_directories (BEFORE ../../include/samplers)
include_directories (BEFORE ../../include/misc)
include_directories (BEFORE ../../include/optimization)
include_directories (BEFORE ../../test)

# for Eigen
if (${CMAKE_VERSION} VERSION_LESS "3.12.0")
add_compile_options(-D "EIGEN_NO_DEBUG")
else ()
add_compile_definitions("EIGEN_NO_DEBUG")
endif ()


add_definitions(${CMAKE_CXX_FLAGS} "-std=c++11") # enable C++11 standard
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

this is not needed

add_definitions(${CMAKE_CXX_FLAGS} "-O3") # optimization of the compiler
#add_definitions(${CXX_COVERAGE_COMPILE_FLAGS} "-lgsl")
add_definitions(${CXX_COVERAGE_COMPILE_FLAGS} "-lm")
add_definitions(${CXX_COVERAGE_COMPILE_FLAGS} "-ldl")
add_definitions(${CXX_COVERAGE_COMPILE_FLAGS} "-DBOOST_NO_AUTO_PTR")
#add_definitions(${CXX_COVERAGE_COMPILE_FLAGS} "-lgslcblas")
#add_definitions( "-O3 -lgsl -lm -ldl -lgslcblas" )

add_executable (volume_cooling_gaussians_hmc volume_cooling_gaussians_hmc.cpp)
target_link_libraries(volume_cooling_gaussians_hmc ${LP_SOLVE} ${IFOPT} ${IFOPT_IPOPT} ${GMP} ${MPSOLVE} ${PTHREAD} ${FFTW3})

endif()
Original file line number Diff line number Diff line change
@@ -0,0 +1,59 @@
#include "Eigen/Eigen"
#include <vector>
#include "cartesian_geom/cartesian_kernel.h"
#include "hpolytope.h"
#include "known_polytope_generators.h"
#include "random_walks/random_walks.hpp"
#include "volume_sequence_of_balls.hpp"
#include "volume_cooling_gaussians.hpp"
#include "volume_cooling_balls.hpp"

#include <iostream>
#include <fstream>
#include "misc.h"

typedef double NT;
typedef Cartesian<NT> Kernel;
typedef typename Kernel::Point Point;
typedef BoostRandomNumberGenerator<boost::mt19937, NT, 3> RNGType;
typedef HPolytope<Point> HPOLYTOPE;

void calculateAndVerifyVolume(HPOLYTOPE& polytope, const std::string& description, NT expectedVolume, NT epsilon, NT L) {
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

We are not very consistent but we use lowercase and "_" for function names.

int walk_len = 200;
NT e = 0.1;

std::cout << "Calculating volume for " << description << ":\n";
NT volume = volume_cooling_gaussians<GaussianHamiltonianMonteCarloExactWalk, RNGType>(polytope, e, walk_len, L);

std::cout << "Estimated volume: " << volume << "\n";
std::cout << "Expected volume: " << expectedVolume << "\n";
NT error = std::abs(volume - expectedVolume);

if (error <= epsilon)
std::cout << "Result is within the acceptable error margin (" << epsilon << ").\n\n";
else
std::cout << "Error (" << error << ") is larger than acceptable margin (" << epsilon << ").\n\n";
}

int main() {
const NT epsilon = 0.1;

// 3-dimensional cube
HPOLYTOPE cube = generate_cube<HPOLYTOPE>(3, false);
calculateAndVerifyVolume(cube, "3-dimensional cube", 1.0, epsilon, 10);

// 3-dimensional cross polytope
HPOLYTOPE crossPolytope = generate_cross<HPOLYTOPE>(3, false);
calculateAndVerifyVolume(crossPolytope, "3-dimensional cross polytope", 4.0 / 6.0, epsilon, 10);

// 3-dimensional simplex
HPOLYTOPE simplex = generate_simplex<HPOLYTOPE>(3, false);
calculateAndVerifyVolume(simplex, "3-dimensional simplex", 1.0 / 6.0, epsilon, 4);

// birkhoff polytope dimension 3
HPOLYTOPE birkhoffPolytope = generate_birkhoff<HPOLYTOPE>(3);
calculateAndVerifyVolume(birkhoffPolytope, "Birkhoff polytope (dim 3)", -1, epsilon, 8); // Theoretical volume not easily available
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Note that the Birkhoff polytope B(3) is not 3-dimensional, but 4-dimensional. In general B(n) is (n-1)^2 dimensional, see https://en.wikipedia.org/wiki/Birkhoff_polytope
Also (theoretical) volumes for n<=10 are available here https://oeis.org/A037302 (could be useful for experiments).


return 0;
}

Original file line number Diff line number Diff line change
Expand Up @@ -224,22 +224,23 @@ private :
}
}

inline void update_position(Point &p, Point &v, NT const& T, NT const& omega)
{
NT C, Phi;
for (size_t i = 0; i < p.dimension(); i++)
{
C = std::sqrt(p[i] * p[i] + (v[i] * v[i]) / (omega * omega));
Phi = std::atan((-v[i]) / (p[i] * omega));
if (v[i] < 0.0 && Phi < 0.0) {
Phi += M_PI;
} else if (v[i] > 0.0 && Phi > 0.0) {
Phi -= M_PI;
}
p.set_coord(i, C * std::cos(omega * T + Phi));
v.set_coord(i, -C * omega * std::sin(omega * T + Phi));
}
inline void update_position(Point& p, Point& v, const NT& T, const NT& omega) {
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I think I prefer the constant reference of type T to be written as T const& is there any reason for rewriting as const T&?


NT next_p, next_v;

NT sinVal = std::sin(omega * T);
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

this is the trick, thanks, great!

NT cosVal = std::cos(omega * T);

NT factor1 = sinVal / omega;
NT factor2 = -omega * sinVal;

for (size_t i = 0; i < p.dimension(); i++) {
next_p = cosVal * p[i] + v[i] * factor1;
next_v = factor2 * p[i] + cosVal * v[i];

p.set_coord(i, next_p);
v.set_coord(i, next_v);
}
}

inline double get_max_distance(std::vector<Point> &pointset, Point const& q, double &rad)
Expand Down Expand Up @@ -271,5 +272,4 @@ private :
};


#endif // RANDOM_WALKS_GAUSSIAN_HMC_WALK_HPP

#endif // RANDOM_WALKS_GAUSSIAN_HMC_WALK_HPP
89 changes: 50 additions & 39 deletions include/volume/volume_cooling_gaussians.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -20,8 +20,7 @@

#include "cartesian_geom/cartesian_kernel.h"
#include "random_walks/gaussian_helpers.hpp"
#include "random_walks/gaussian_ball_walk.hpp"
#include "random_walks/gaussian_cdhr_walk.hpp"
#include "random_walks/random_walks.hpp"
#include "sampling/random_point_generators.hpp"
#include "volume/math_helpers.hpp"

Expand Down Expand Up @@ -177,10 +176,9 @@ NT get_next_gaussian(Polytope& P,
return last_a * std::pow(ratio, k);
}

// Compute the sequence of spherical gaussians
template
<
typename WalkType,
typename WalkTypePolicy,
typename RandomPointGenerator,
typename Polytope,
typename NT,
Expand All @@ -195,7 +193,9 @@ void compute_annealing_schedule(Polytope& P,
NT const& chebychev_radius,
NT const& error,
std::vector<NT>& a_vals,
RandomNumberGenerator& rng)
RandomNumberGenerator& rng,
typename std::conditional<std::is_same<WalkTypePolicy, GaussianHamiltonianMonteCarloExactWalk>::value,
typename GaussianHamiltonianMonteCarloExactWalk::parameters, void*>::type walk_params = nullptr)
{
typedef typename Polytope::PointType Point;
typedef typename Polytope::VT VT;
Expand All @@ -204,56 +204,53 @@ void compute_annealing_schedule(Polytope& P,
get_first_gaussian(P, frac, chebychev_radius, error, a_vals);

#ifdef VOLESTI_DEBUG
std::cout<<"first gaussian computed\n"<<std::endl;
std::cout << "first gaussian computed\n" << std::endl;
#endif

NT a_stop = 0.0;
const NT tol = 0.001;
unsigned int it = 0;
unsigned int n = P.dimension();
const unsigned int totalSteps = ((int)150/((1.0 - frac) * error))+1;

if (a_vals[0]<a_stop) a_vals[0] = a_stop;
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Why are you removing this check? If the computed (first) gaussian has negative variance then we set it to zero. @TolisChal is this check actually needed?


#ifdef VOLESTI_DEBUG
std::cout<<"Computing the sequence of gaussians..\n"<<std::endl;
#endif
const unsigned int totalSteps = static_cast<unsigned int>(150 / ((1.0 - frac) * error)) + 1;

Point p(n);

while (true)
{
// Compute the next gaussian
NT next_a = get_next_gaussian<RandomPointGenerator>
(P, p, a_vals[it], N, ratio, C, walk_length, rng);
(P, p, a_vals[it], N, ratio, C, walk_length, rng);

#ifdef VOLESTI_DEBUG
std::cout << "Processing a_vals[" << it << "] = " << a_vals[it] << ", next_a = " << next_a << std::endl;
#endif

NT curr_fn = 0;
NT curr_its = 0;
auto steps = totalSteps;

WalkType walk(P, p, a_vals[it], rng);
//TODO: test update delta here?
if constexpr (std::is_same<WalkTypePolicy, GaussianHamiltonianMonteCarloExactWalk>::value) {
GaussianHamiltonianMonteCarloExactWalk::Walk<Polytope, RandomNumberGenerator> walk(P, p, a_vals[it], rng, walk_params);

update_delta<WalkType>
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

why are you removing update_delta?

::apply(walk, 4.0 * chebychev_radius
/ std::sqrt(std::max(NT(1.0), a_vals[it]) * NT(n)));
for (unsigned int j = 0; j < totalSteps; ++j) {
walk.template apply(P, p, a_vals[it], walk_length, rng);
curr_its++;
curr_fn += eval_exp(p, next_a) / eval_exp(p, a_vals[it]);
}
} else {
WalkTypePolicy walk(P, p, a_vals[it], rng);

// Compute some ratios to decide if this is the last gaussian
for (unsigned int j = 0; j < steps; j++)
{
walk.template apply(P, p, a_vals[it], walk_length, rng);
curr_its += 1.0;
curr_fn += eval_exp(p, next_a) / eval_exp(p, a_vals[it]);
for (unsigned int j = 0; j < totalSteps; ++j) {
walk.template apply(P, p, a_vals[it], walk_length, rng);
curr_its++;
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

this not an integer, although I do not know the reason (@TolisChal ?)

Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Yes, that could be an integer

curr_fn += eval_exp(p, next_a) / eval_exp(p, a_vals[it]);
}
}

// Remove the last gaussian.
// Set the last a_i equal to zero
if (next_a>0 && curr_fn/curr_its>(1.0+tol))
{
// pick the last gaussian
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

This is the opposite of the last comment, why? It seems that the code indeed remove the last Gaussian (found by that ratio tolerance test) by setting its variance equals to zero.

Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I don't see any reason to delete this check. @vgnecula could you please comment on that?

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Hmm, I don't know why I modified the comment, as the code seems to do the exact same thing. It probably remained like that from when I was trying to check a bug. Sorry!

if (next_a > 0 && curr_fn / curr_its > (1.0 + tol)) {
a_vals.push_back(next_a);
it++;
} else if (next_a <= 0)
{
} else if (next_a <= 0) {
a_vals.push_back(a_stop);
it++;
break;
Expand All @@ -264,6 +261,8 @@ void compute_annealing_schedule(Polytope& P,
}
}


Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Are those lines needed?


template <typename NT>
struct gaussian_annealing_parameters
{
Expand Down Expand Up @@ -292,7 +291,8 @@ template
double volume_cooling_gaussians(Polytope& Pin,
RandomNumberGenerator& rng,
double const& error = 0.1,
unsigned int const& walk_length = 1)
unsigned int const& walk_length = 1,
double L = -1)
{
typedef typename Polytope::PointType Point;
typedef typename Point::FT NT;
Expand Down Expand Up @@ -335,11 +335,22 @@ double volume_cooling_gaussians(Polytope& Pin,
NT C = parameters.C;
unsigned int N = parameters.N;

compute_annealing_schedule
<
WalkType,
RandomPointGenerator
>(P, ratio, C, parameters.frac, N, walk_length, radius, error, a_vals, rng);
// Construct the necesary parameters if this is the case
// Construct the necessary parameters if this is the case
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

duplicate comment

if constexpr (std::is_same<WalkTypePolicy, GaussianHamiltonianMonteCarloExactWalk>::value) {
if (L > 0) {
typename GaussianHamiltonianMonteCarloExactWalk::parameters walk_params(L, true, 0, false);
compute_annealing_schedule<GaussianHamiltonianMonteCarloExactWalk, RandomPointGenerator>(
P, ratio, C, parameters.frac, N, walk_length, radius, error, a_vals, rng, walk_params);
} else {
compute_annealing_schedule<WalkType, RandomPointGenerator>(
P, ratio, C, parameters.frac, N, walk_length, radius, error, a_vals, rng);
}
} else {
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

duplicate code?

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

actually, not really. It is just bad indexation. As there is a run time and compile time check (with the L, and the gaussian type policy). If there is a gaussian type walk, I want the walk to check if L>0 or not.

compute_annealing_schedule<WalkType, RandomPointGenerator>(
P, ratio, C, parameters.frac, N, walk_length, radius, error, a_vals, rng);
}


#ifdef VOLESTI_DEBUG
std::cout<<"All the variances of schedule_annealing computed in = "
Expand Down Expand Up @@ -487,4 +498,4 @@ double volume_cooling_gaussians(Polytope &Pin,
return volume_cooling_gaussians<WalkTypePolicy>(Pin, rng, error, walk_length);
}

#endif // VOLUME_COOLING_GAUSSIANS_HPP
#endif // VOLUME_COOLING_GAUSSIANS_HPP
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

please keep the empty ending line