time-series-regression.py

from __future__ import print_function, division
import multiprocessing
import os
import sys
import gc
import numpy as np
import random
import time
import operator
import math
import matplotlib as mpl
from data import Dataset
import os.path as osp
import shutil
import pandas as pd
mpl.use('agg')
import matplotlib.mlab as mlab
import matplotlib.pyplot as plt
from matplotlib.patches import Polygon
from matplotlib.collections import PatchCollection
from scipy.stats import multivariate_normal
from scipy.stats import norm
import io

class Network:

    def __init__(self, Topo, Train, Test, learn_rate):
        self.Top = Topo  # NN topology [input, hidden, output]
        self.TrainData = Train
        self.TestData = Test
        self.lrate = learn_rate

        self.W1 = np.random.randn(self.Top[0], self.Top[1]) / np.sqrt(self.Top[0])
        self.B1 = np.random.randn(1, self.Top[1]) / np.sqrt(self.Top[1])  # bias first layer
        self.W2 = np.random.randn(self.Top[1], self.Top[2]) / np.sqrt(self.Top[1])
        self.B2 = np.random.randn(1, self.Top[2]) / np.sqrt(self.Top[1])  # bias second layer

        self.hidout = np.zeros((1, self.Top[1]))  # output of first hidden layer
        self.out = np.zeros((1, self.Top[2]))  # output last layer

    def sigmoid(self, x):
        return 1 / (1 + np.exp(-x))

    def sampleEr(self, actualout):
        error = np.subtract(self.out, actualout)
        sqerror = np.sum(np.square(error)) / self.Top[2]
        return sqerror

    def ForwardPass(self, X):
        z1 = X.dot(self.W1) - self.B1
        self.hidout = self.sigmoid(z1)  # output of first hidden layer
        z2 = self.hidout.dot(self.W2) - self.B2
        self.out = self.sigmoid(z2)  # output second hidden layer

    def BackwardPass(self, Input, desired):
        out_delta = (desired - self.out) * (self.out * (1 - self.out))
        hid_delta = out_delta.dot(self.W2.T) * (self.hidout * (1 - self.hidout))

        # self.W2 += (self.hidout.T.dot(out_delta) * self.lrate)
        # self.B2 += (-1 * self.lrate * out_delta)
        # self.W1 += (Input.T.dot(hid_delta) * self.lrate)
        # self.B1 += (-1 * self.lrate * hid_delta)

        layer = 1  # hidden to output
        for x in range(0, self.Top[layer]):
            for y in range(0, self.Top[layer + 1]):
                self.W2[x, y] += self.lrate * out_delta[y] * self.hidout[x]
        for y in range(0, self.Top[layer + 1]):
            self.B2[y] += -1 * self.lrate * out_delta[y]

        layer = 0  # Input to Hidden
        for x in range(0, self.Top[layer]):
            for y in range(0, self.Top[layer + 1]):
                self.W1[x, y] += self.lrate * hid_delta[y] * Input[x]
        for y in range(0, self.Top[layer + 1]):
            self.B1[y] += -1 * self.lrate * hid_delta[y]

    def decode(self, w):
        w_layer1size = self.Top[0] * self.Top[1]
        w_layer2size = self.Top[1] * self.Top[2]

        w_layer1 = w[0:w_layer1size]
        self.W1 = np.reshape(w_layer1, (self.Top[0], self.Top[1]))

        w_layer2 = w[w_layer1size:w_layer1size + w_layer2size]
        self.W2 = np.reshape(w_layer2, (self.Top[1], self.Top[2]))
        self.B1 = w[w_layer1size + w_layer2size:w_layer1size + w_layer2size + self.Top[1]]
        self.B2 = w[w_layer1size + w_layer2size + self.Top[1]:w_layer1size + w_layer2size + self.Top[1] + self.Top[2]]

    def encode(self):
        w1 = self.W1.ravel()
        w2 = self.W2.ravel()
        w = np.concatenate([w1, w2, self.B1, self.B2])
        return w

    def langevin_gradient(self, data, w, depth):  # BP with SGD (Stocastic BP)

        self.decode(w)  # method to decode w into W1, W2, B1, B2.
        size = data.shape[0]

        Input = np.zeros((1, self.Top[0]))  # temp hold input
        Desired = np.zeros((1, self.Top[2]))
        fx = np.zeros(size)

        for i in range(0, depth):
            for i in range(0, size):
                pat = i
                Input = data[pat, 0:self.Top[0]]
                Desired = data[pat, self.Top[0]: self.Top[0] + self.Top[-1]]
                self.ForwardPass(Input)
                self.BackwardPass(Input, Desired)

        w_updated = self.encode()

        return w_updated

    def evaluate_proposal(self, data, w):  # BP with SGD (Stocastic BP)

        self.decode(w)  # method to decode w into W1, W2, B1, B2.
        size = data.shape[0]

        Input = np.zeros((1, self.Top[0]))  # temp hold input
        Desired = np.zeros((1, self.Top[2]))
        fx = np.zeros((size, self.Top[2]))

        for i in range(0, size):  # to see what fx is produced by your current weight update
            Input = data[i, 0:self.Top[0]]
            self.ForwardPass(Input)
            fx[i] = self.out

        return fx

class ptReplica(multiprocessing.Process):

    def __init__(self, use_langevin_gradients, learn_rate, w, minlim_param, maxlim_param, samples, traindata, testdata,
                 topology, burn_in, temperature, swap_interval, langevin_prob, path, parameter_queue, main_process,
                 event):
        # MULTIPROCESSING VARIABLES
        multiprocessing.Process.__init__(self)
        self.processID = temperature
        self.parameter_queue = parameter_queue
        self.signal_main = main_process
        self.event = event

        self.temperature = temperature

        self.adapttemp = temperature
        self.swap_interval = swap_interval
        self.path = path
        self.burn_in = burn_in
        # FNN CHAIN VARIABLES (MCMC)
        self.samples = samples
        self.topology = topology
        self.traindata = traindata
        self.testdata = testdata
        self.w = w

        self.minY = np.zeros((1, 1))
        self.maxY = np.zeros((1, 1))

        self.minlim_param = minlim_param
        self.maxlim_param = maxlim_param

        self.use_langevin_gradients = use_langevin_gradients

        self.sgd_depth = 1  # always should be 1

        self.learn_rate = learn_rate

        self.l_prob = langevin_prob  # can be evaluated for diff problems - if data too large keep this low value since the gradients cost comp time

        self.w_size = 0

    def rmse(self, pred, actual):
        return np.sqrt((np.square(pred - actual)).mean())

    def rmse_per_output(self, pred, actual):
        individual_rmse = np.zeros(self.topology[2])
        for i in range(0, self.topology[2]):
            individual_rmse[i] = np.sqrt(np.square(pred[:, i] - actual[:, i]).mean())
        return individual_rmse

    def mae(self, pred, actual):
        return np.abs(pred - actual).mean()

    def mape(self, pred, actual):
        return 100 * np.abs((pred - actual) / (actual+0.000001)).mean()

    '''def likelihood_func(self, fnn, data, w): # multinomial lhood in case of classification problem
        y = data[:, self.topology[0]]
        fx  = fnn.evaluate_proposal(data,w)
        rmse = self.rmse(fx,y)
        z = np.zeros((data.shape[0],self.topology[2]))
        lhood = 0
        for i in range(data.shape[0]):
            for j in range(self.topology[2]):
                if j == y[i]:
                    z[i,j] = 1
                lhood += z[i,j]*np.log(prob[i,j])
  

        return [lhood/self.temperature, fx, rmse]'''

    def likelihood_func(self, fnn, data, w, tau_sq):
        y = data[:, self.topology[0]: self.topology[0] + self.topology[-1]]
        fx = fnn.evaluate_proposal(data, w)
        #rmse = self.rmse(fx, y) 
        indi_rmse = self.rmse_per_output(fx, y)
        rmse = np.mean(indi_rmse)

        mae = self.mae(fx, y)
        mape = self.mape(fx, y)
 
        n = (y.shape[0] * y.shape[1]) # number of samples x number of outputs (prediction horizon)
        
        p1 = - (n/2) * np.log(2 * math.pi * tau_sq) 
        p2 =  (1/2*tau_sq) 
        
        log_lhood =  p1 - (p2 *  np.sum(np.square(y- fx)) )

        return [ log_lhood / self.adapttemp, fx, rmse, indi_rmse, mae, mape]

    '''def prior_likelihood(self, sigma_squared, nu_1, nu_2, w):
        h = self.topology[1]  # number hidden neurons
        d = self.topology[0]  # number input neurons
        part1 = -1 * ((d * h + h + self.topology[2]+h*self.topology[2]) / 2) * np.log(sigma_squared)
        part2 = 1 / (2 * sigma_squared) * (sum(np.square(w)))
        log_loss = part1 - part2
        return log_loss'''

    def prior_likelihood(self, sigma_squared, nu_1, nu_2, w, tausq):
        h = self.topology[1]  # number hidden neurons
        d = self.topology[0]  # number input neurons
        part1 = -1 * ((d * h + h + 2) / 2) * np.log(sigma_squared)
        part2 = 1 / (2 * sigma_squared) * (sum(np.square(w)))
        log_loss = part1 - part2 - (1 + nu_1) * np.log(tausq) - (nu_2 / tausq)
        return log_loss

    def run(self):
        # INITIALISING FOR FNN
        testsize = self.testdata.shape[0]
        trainsize = self.traindata.shape[0]
        samples = self.samples
        x_test = np.linspace(0, 1, num=testsize)
        x_train = np.linspace(0, 1, num=trainsize)
        netw = self.topology
        y_test = self.testdata[:, netw[0]: netw[0] + netw[-1]]
        y_train = self.traindata[:, netw[0]: netw[0] + netw[-1]]

        batch_save = 10  # batch to append to file

        w_size = (netw[0] * netw[1]) + (netw[1] * netw[2]) + netw[1] + netw[2]  # num of weights and bias
        self.w_size = w_size
        pos_w = np.ones((samples, w_size))  # Posterior for all weights
        # pos_w = np.ones((samples, w_size)) #Posterior for all weights
        lhood_list = np.zeros((samples, 1))
        surrogate_list = np.zeros((samples, 1))
        # fxtrain_samples = np.ones((batch_save, trainsize)) #Output of regression FNN for training samples
        # fxtest_samples = np.ones((batch_save, testsize)) #Output of regression FNN for testing samples
        fxtrain_samples = np.ones((samples, trainsize, netw[2]))
        fxtest_samples = np.ones((samples, testsize, netw[2]))
        rmse_train = np.zeros(samples)
        indi_rmse_train = np.zeros((samples, netw[2]))
        mae_train = np.zeros(samples)
        mape_train = np.zeros(samples)

        rmse_test = np.zeros(samples)
        indi_rmse_test = np.zeros((samples, netw[2]))
        mae_test = np.zeros(samples)
        mape_test = np.zeros(samples)

        acc_train = np.zeros(samples)
        acc_test = np.zeros(samples)
        learn_rate = self.learn_rate

        # Random Initialisation of weights
        w = self.w
        eta = 0  # Junk variable
        # print(w,self.temperature)
        w_proposal = np.random.randn(w_size)
        # Randomwalk Steps
        step_w = 0.025 # 0.025 used in paper - this is the standard deviation of the Gausian random-walk proposal distribution for weights and biases

        step_eta = 0.2 # for tau_sq (single value) random walk proposal distribution  that captures the noise in predictions
        # Declare FNN
        fnn = Network(self.topology, self.traindata, self.testdata, learn_rate)

        print(self.topology, ' topo')
        # Evaluate Proposals
        pred_train = fnn.evaluate_proposal(self.traindata, w)  #
        pred_test = fnn.evaluate_proposal(self.testdata, w)  #
        # Check Variance of Proposal

        eta = np.log(np.var(pred_train - y_train))
        tau_pro = np.exp(eta)

        sigma_squared = 25
        nu_1 = 0
        nu_2 = 0
        sigma_diagmat = np.zeros((w_size, w_size))  # for Equation 9 in Ref [Chandra_ICONIP2017]
        np.fill_diagonal(sigma_diagmat, step_w)

        delta_likelihood = 0.5  # an arbitrary position
        prior_current = self.prior_likelihood(sigma_squared, nu_1, nu_2, w, tau_pro)  # takes care of the gradients

        [likelihood, pred_train, rmsetrain, indi_rmsetrain, maetrain, mapetrain] = self.likelihood_func(fnn, self.traindata, w, tau_pro)
        [_, pred_test, rmsetest, indi_rmsetest, maetest, mapetest] = self.likelihood_func(fnn, self.testdata, w, tau_pro)

        plt.plot(x_train, y_train)
        plt.plot(x_train, pred_train)
        plt.title('plot of data vs initial fx')
        file_name = self.path + '/predictions/begin_chain_' + str(self.temperature) + '.png'
        plt.savefig(file_name)

        plt.plot(x_train, y_train)

        trainacc = 0
        testacc = 0

        prop_list = np.zeros((samples, w_proposal.size))
        likeh_list = np.zeros((samples, 2))  # one for posterior of likelihood and the other for all proposed likelihood
        likeh_list[0, :] = [-100, -100]  # to avoid prob in calc of 5th and 95th percentile later
        surg_likeh_list = np.zeros((samples, 2))
        accept_list = np.zeros(samples)

        num_accepted = 0

        langevin_count = 0

        pt_samples = samples * 0.6
        # this means that PT in canonical form with adaptive temp will work till pt  samples are reached

        init_count = 0

        self.event.clear()

        for i in range(samples - 1):
            # Begin sampling

            timer1 = time.time()

            if i < pt_samples:
                self.adapttemp = self.temperature  # * ratio  #

            if i == pt_samples and init_count == 0:  # move to MCMC canonical
                self.adapttemp = 1
                [likelihood, pred_train, rmsetrain, indi_rmsetrain, maetrain, mapetrain] = self.likelihood_func(fnn, self.traindata, w,
                                                                                                tau_pro)
                [_, pred_test, rmsetest, indi_rmsetest, maetest, mapetest] = self.likelihood_func(fnn, self.testdata, w, tau_pro)
                init_count = 1

            lx = np.random.uniform(0, 1, 1)

            if (self.use_langevin_gradients is True) and (lx < self.l_prob):
                w_gd = fnn.langevin_gradient(self.traindata, w.copy(), self.sgd_depth)  # Eq 8
                w_proposal = np.random.normal(w_gd, step_w, w_size)  # Eq 7
                w_prop_gd = fnn.langevin_gradient(self.traindata, w_proposal.copy(), self.sgd_depth)
                # first = np.log(multivariate_normal.pdf(w , w_prop_gd , sigma_diagmat))
                # second = np.log(multivariate_normal.pdf(w_proposal , w_gd , sigma_diagmat)) # this gives numerical instability - hence we give a simple implementation next that takes out log

                wc_delta = (w - w_prop_gd)
                wp_delta = (w_proposal - w_gd)

                sigma_sq = (step_w * step_w ) #this is the variance (originally this was a bug where  sigma_sq = step_w)

                first = -0.5 * np.sum(wc_delta * wc_delta) / sigma_sq  # this is wc_delta.T  *  wc_delta /sigma_sq
                second = -0.5 * np.sum(wp_delta * wp_delta) / sigma_sq

                scaling_factor = 0.25 # this is to ensure that high quality samples are accepted

                diff_prop = first - second 
                diff_prop = diff_prop * scaling_factor  / self.adapttemp

                diff_prop = diff_prop * scaling_factor  / self.adapttemp
                langevin_count = langevin_count + 1
            else:
                diff_prop = 0
                w_proposal = np.random.normal(w, step_w, w_size)

            eta_pro = eta + np.random.normal(0, step_eta, 1)
            tau_pro = math.exp(eta_pro)

            [likelihood_proposal, pred_train, rmsetrain, indi_rmsetrain, maetrain, mapetrain] \
                = self.likelihood_func(fnn, self.traindata, w_proposal,
                                       tau_pro)

            [_, pred_test, rmsetest, indi_rmsetest, maetest, mapetest] \
                = self.likelihood_func(fnn, self.testdata, w_proposal, tau_pro)

            prior_prop = self.prior_likelihood(sigma_squared, nu_1, nu_2, w_proposal,
                                               tau_pro)  # takes care of the gradients
            diff_prior = prior_prop - prior_current
            diff_likelihood = likelihood_proposal - likelihood

            surg_likeh_list[i + 1, 0] = likelihood_proposal * self.adapttemp
            # surg_likeh_list[i+1,1] = np.nan

            try:
                mh_prob = min(1, math.exp(diff_likelihood + diff_prior + diff_prop))
            except OverflowError as e:
                mh_prob = 1

            accept_list[i + 1] = num_accepted

            if (i % batch_save + 1) == 0:  # just for saving posterior to file - work on this later
                x = 0

            u = random.uniform(0, 1)

            prop_list[i + 1] = w_proposal
            likeh_list[i + 1, 0] = likelihood_proposal

            if u < mh_prob:
                num_accepted = num_accepted + 1
                likelihood = likelihood_proposal
                prior_current = prior_prop
                w = w_proposal

                eta = eta_pro

                acc_train[i + 1] = 0
                acc_test[i + 1] = 0

                print (i, langevin_count, num_accepted, self.adapttemp, diff_prop ,  likelihood, rmsetrain, rmsetest  , 'accepted')

                pos_w[i + 1] = w_proposal

                fxtrain_samples[i + 1] = pred_train
                fxtest_samples[i + 1] = pred_test
                rmse_train[i + 1] = rmsetrain
                rmse_test[i + 1] = rmsetest
                indi_rmse_train[i + 1] = indi_rmsetrain
                indi_rmse_test[i + 1] = indi_rmsetest
                mae_train[i + 1] = maetrain
                mae_test[i + 1] = maetest
                mape_train[i + 1] = mapetrain
                mape_test[i + 1] = mapetest
                # x = x + 1

            else:
                pos_w[i + 1] = pos_w[i]
                fxtrain_samples[i + 1] = fxtrain_samples[i,]
                fxtest_samples[i + 1] = fxtest_samples[i,]
                rmse_train[i + 1] = rmse_train[i]
                rmse_test[i + 1] = rmse_test[i]
                indi_rmse_train[i + 1] = indi_rmse_train[i]
                indi_rmse_test[i + 1] = indi_rmse_test[i]
                acc_train[i + 1] = acc_train[i]
                acc_test[i + 1] = acc_test[i]
                mae_train[i + 1] = mae_train[i]
                mae_test[i + 1] = mae_test[i]
                mape_train[i + 1] = mape_train[i]
                mape_test[i + 1] = mape_test[i]

            if i % self.swap_interval == 0 and i != 0:
                #print(i)
                # print('\nTemperature: {} Swapping weights: {}'.format(self.temperature, w[:2]))
                param = np.concatenate([w, np.asarray([eta]).reshape(1), np.asarray([likelihood * self.temperature]),
                                        np.asarray([self.temperature])])
                self.parameter_queue.put(param)
                self.signal_main.set()
                self.event.clear()
                self.event.wait()
                result = self.parameter_queue.get()
                w = result[0:self.w_size]
                eta = result[self.w_size]
                # likelihood1 = result[self.w_size+1]/self.temperature

        param = np.concatenate(
            [w, np.asarray([eta]).reshape(1), np.asarray([likelihood]), np.asarray([self.adapttemp]), np.asarray([i])])

        self.parameter_queue.put(param)

        print((num_accepted * 100 / (samples * 1.0)), '% was accepted')
        accept_ratio = num_accepted / (samples * 1.0) * 100

        print((langevin_count * 100 / (samples * 1.0)), '% was Lsnngrevin ')
        langevin_ratio = langevin_count / (samples * 1.0) * 100

        file_name = self.path + '/posterior/pos_w/' + 'chain_' + str(self.temperature) + '.txt'
        np.savetxt(file_name, pos_w)

        file_name = self.path + '/predictions/fxtrain_samples_chain_' + str(self.temperature) + '.npy'
        np.save(file_name, fxtrain_samples)
        file_name = self.path + '/predictions/fxtest_samples_chain_' + str(self.temperature) + '.npy'
        np.save(file_name, fxtest_samples)
        file_name = self.path + '/predictions/rmse_test_chain_' + str(self.temperature) + '.txt'
        np.savetxt(file_name, rmse_test, fmt='%1.8f')
        file_name = self.path + '/predictions/rmse_train_chain_' + str(self.temperature) + '.txt'
        np.savetxt(file_name, rmse_train, fmt='%1.8f')

        file_name = self.path + '/predictions/indi_rmse_train_chain_' + str(self.temperature) + '.txt'
        np.savetxt(file_name, indi_rmse_train, fmt='%1.8f')
        file_name = self.path + '/predictions/indi_rmse_test_chain_' + str(self.temperature) + '.txt'
        np.savetxt(file_name, indi_rmse_test, fmt='%1.8f')

        file_name = self.path + '/predictions/mae_test_chain_' + str(self.temperature) + '.txt'
        np.savetxt(file_name, mae_test, fmt='%1.8f')
        file_name = self.path + '/predictions/mae_train_chain_' + str(self.temperature) + '.txt'
        np.savetxt(file_name, mae_train, fmt='%1.8f')
        file_name = self.path + '/predictions/mape_test_chain_' + str(self.temperature) + '.txt'
        np.savetxt(file_name, mape_test, fmt='%1.8f')
        file_name = self.path + '/predictions/mape_train_chain_' + str(self.temperature) + '.txt'
        np.savetxt(file_name, mape_train, fmt='%1.8f')

        file_name = self.path + '/predictions/acc_test_chain_' + str(self.temperature) + '.txt'
        np.savetxt(file_name, acc_test, fmt='%1.2f')
        file_name = self.path + '/predictions/acc_train_chain_' + str(self.temperature) + '.txt'
        np.savetxt(file_name, acc_train, fmt='%1.2f')

        file_name = self.path + '/posterior/pos_likelihood/chain_' + str(self.temperature) + '.txt'
        np.savetxt(file_name, likeh_list, fmt='%1.4f')

        file_name = self.path + '/posterior/accept_list/chain_' + str(self.temperature) + '_accept.txt'
        np.savetxt(file_name, [accept_ratio], fmt='%1.4f')

        file_name = self.path + '/posterior/accept_list/chain_' + str(self.temperature) + '.txt'
        np.savetxt(file_name, accept_list, fmt='%1.4f')

        self.signal_main.set()


class ParallelTempering:
    def __init__(self, use_langevin_gradients, learn_rate, traindata, testdata, topology, num_chains, maxtemp,
                 NumSample, swap_interval, langevin_prob, path):
        # FNN Chain variables
        self.traindata = traindata
        self.testdata = testdata
        self.topology = topology
        self.num_param = (topology[0] * topology[1]) + (topology[1] * topology[2]) + topology[1] + topology[2]
        # Parallel Tempering variables
        self.swap_interval = swap_interval
        self.path = path
        self.maxtemp = maxtemp

        self.langevin_prob = langevin_prob
        self.num_swap = 0
        self.total_swap_proposals = 0
        self.num_chains = num_chains
        self.chains = []
        self.temperatures = []
        self.NumSamples = int(NumSample / self.num_chains)
        self.sub_sample_size = max(1, int(0.05 * self.NumSamples))
        # create queues for transfer of parameters between process chain
        self.parameter_queue = [multiprocessing.Queue() for i in range(num_chains)]
        self.chain_queue = multiprocessing.JoinableQueue()
        self.wait_chain = [multiprocessing.Event() for i in range(self.num_chains)]
        self.event = [multiprocessing.Event() for i in range(self.num_chains)]

        self.all_param = None
        self.geometric = True  # True (geometric)  False (Linear)

        self.minlim_param = 0.0
        self.maxlim_param = 0.0
        self.minY = np.zeros((1, 1))
        self.maxY = np.ones((1, 1))

        self.model_signature = 0.0

        self.learn_rate = learn_rate

        self.use_langevin_gradients = use_langevin_gradients

    def default_beta_ladder(self, ndim, ntemps,
                            Tmax):   

        if type(ndim) != int or ndim < 1:
            raise ValueError('Invalid number of dimensions specified.')
        if ntemps is None and Tmax is None:
            raise ValueError('Must specify one of ``ntemps`` and ``Tmax``.')
        if Tmax is not None and Tmax <= 1:
            raise ValueError('``Tmax`` must be greater than 1.')
        if ntemps is not None and (type(ntemps) != int or ntemps < 1):
            raise ValueError('Invalid number of temperatures specified.')
 

        maxtemp = Tmax
        numchain = ntemps
        b = []
        b.append(maxtemp)
        last = maxtemp
        for i in range(maxtemp):
            last = last * (numchain ** (-1 / (numchain - 1)))
            b.append(last)
        tstep = np.array(b)

        if ndim > tstep.shape[0]:
            # An approximation to the temperature step at large
            # dimension
            tstep = 1.0 + 2.0 * np.sqrt(np.log(4.0)) / np.sqrt(ndim)
        else:
            tstep = tstep[ndim - 1]

        appendInf = False
        if Tmax == np.inf:
            appendInf = True
            Tmax = None
            ntemps = ntemps - 1

        if ntemps is not None:
            if Tmax is None:
                # Determine Tmax from ntemps.
                Tmax = tstep ** (ntemps - 1)
        else:
            if Tmax is None:
                raise ValueError('Must specify at least one of ``ntemps'' and '
                                 'finite ``Tmax``.')

            # Determine ntemps from Tmax.
            ntemps = int(np.log(Tmax) / np.log(tstep) + 2)

        betas = np.logspace(0, -np.log10(Tmax), ntemps)
        if appendInf:
            # Use a geometric spacing, but replace the top-most temperature with
            # infinity.
            betas = np.concatenate((betas, [0]))

        return betas

    def assign_temperatures(self):
        # #Linear Spacing
        # temp = 2
        # for i in range(0,self.num_chains):
        #     self.temperatures.append(temp)
        #     temp += 2.5 #(self.maxtemp/self.num_chains)
        #     print (self.temperatures[i])
        # Geometric Spacing

        if self.geometric == True:
            betas = self.default_beta_ladder(2, ntemps=self.num_chains, Tmax=self.maxtemp)
            for i in range(0, self.num_chains):
                self.temperatures.append(np.inf if betas[i] is 0 else 1.0 / betas[i])
                print(self.temperatures[i])
        else:

            tmpr_rate = (self.maxtemp / self.num_chains)
            temp = 1
            for i in range(0, self.num_chains):
                self.temperatures.append(temp)
                temp += tmpr_rate
                print(self.temperatures[i])

    def initialize_chains(self, burn_in):
        self.burn_in = burn_in
        self.assign_temperatures()
        self.minlim_param = np.repeat([-100], self.num_param)  # priors for nn weights
        self.maxlim_param = np.repeat([100], self.num_param)

        for i in range(0, self.num_chains):
            w = np.random.randn(self.num_param)
            self.chains.append(
                ptReplica(self.use_langevin_gradients, self.learn_rate, w, self.minlim_param, self.maxlim_param,
                          self.NumSamples, self.traindata, self.testdata, self.topology, self.burn_in,
                          self.temperatures[i], self.swap_interval, self.langevin_prob, self.path,
                          self.parameter_queue[i], self.wait_chain[i], self.event[i]))

    def surr_procedure(self, queue):

        if queue.empty() is False:
            return queue.get()
        else:
            return

    def swap_procedure(self, parameter_queue_1, parameter_queue_2):
        # if parameter_queue_2.empty() is False and parameter_queue_1.empty() is False:
        param1 = parameter_queue_1.get()
        param2 = parameter_queue_2.get()
        w1 = param1[0:self.num_param]
        eta1 = param1[self.num_param]
        lhood1 = param1[self.num_param + 1]
        T1 = param1[self.num_param + 2]
        w2 = param2[0:self.num_param]
        eta2 = param2[self.num_param]
        lhood2 = param2[self.num_param + 1]
        T2 = param2[self.num_param + 2]
        # print('yo')
        # SWAPPING PROBABILITIES
        try:
            swap_proposal = min(1, 0.5 * np.exp(min(709, lhood2 - lhood1)))
        except OverflowError:
            swap_proposal = 1
        u = np.random.uniform(0, 1)
        swapped = False
        if u < swap_proposal:
            self.total_swap_proposals += 1
            self.num_swap += 1
            param_temp = param1
            param1 = param2
            param2 = param_temp
            swapped = True
        else:
            swapped = False
            self.total_swap_proposals += 1

        return param1, param2, swapped

    def run_chains(self):
        # only adjacent chains can be swapped therefore, the number of proposals is ONE less num_chains
        swap_proposal = np.ones(self.num_chains - 1)
        # create parameter holders for paramaters that will be swapped
        replica_param = np.zeros((self.num_chains, self.num_param))
        lhood = np.zeros(self.num_chains)
        # Define the starting and ending of MCMC Chains
        start = 0
        end = self.NumSamples - 1
        number_exchange = np.zeros(self.num_chains)
        filen = open(self.path + '/num_exchange.txt', 'a')
        # RUN MCMC CHAINS
        for l in range(0, self.num_chains):
            self.chains[l].start_chain = start
            self.chains[l].end = end
        for j in range(0, self.num_chains):
            self.wait_chain[j].clear()
            self.event[j].clear()
            self.chains[j].start()
        # SWAP PROCEDURE

        swaps_appected_main = 0
        total_swaps_main = 0

        for i in range(int(self.NumSamples / self.swap_interval)):
            count = 0
            for index in range(self.num_chains):
                if not self.chains[index].is_alive():
                    count += 1
                    #print(str(self.chains[index].temperature) + " Dead")
                    self.wait_chain[index].set()
            if count == self.num_chains:
                break
            #print("Waiting")
            timeout_count = 0
            for index in range(0, self.num_chains):
                #print("Waiting for chain: {}".format(index + 1))
                flag = self.wait_chain[index].wait()
                if flag:
                    #print("Signal from chain: {}".format(index + 1))
                    timeout_count += 1

            if timeout_count != self.num_chains:
                #print("Skipping the swap!")
                continue
            #print("Event occured")
            for index in range(0, self.num_chains - 1):
                param_1, param_2, swapped = self.swap_procedure(self.parameter_queue[index],
                                                                self.parameter_queue[index + 1])
                self.parameter_queue[index].put(param_1)
                self.parameter_queue[index + 1].put(param_2)
                if index == 0:
                    if swapped:
                        swaps_appected_main += 1
                    total_swaps_main += 1

            for index in range(self.num_chains):
                self.event[index].set()
                self.wait_chain[index].clear()

        print("Joining processes")

        # JOIN THEM TO MAIN PROCESS
        for index in range(0, self.num_chains):
            self.chains[index].join()
        self.chain_queue.join()

        pos_w, fx_train, fx_test, rmse_train, rmse_test, indi_rmse_train, indi_rmse_test, mae_train, mae_test, mape_train, mape_test, \
        acc_train, acc_test, likelihood_vec, accept_vec, accept , fx_test_all = self.show_results()

        print("NUMBER OF SWAPS =", self.num_swap)
        swap_perc = self.num_swap * 100 / self.total_swap_proposals
        return pos_w, fx_train, fx_test, rmse_train, rmse_test, indi_rmse_train, indi_rmse_test, mae_train, mae_test, mape_train, \
               mape_test, acc_train, acc_test, likelihood_vec, swap_perc, accept_vec, accept, fx_test_all

    def show_results(self):

        burnin = int(self.NumSamples * self.burn_in)

        likelihood_rep = np.zeros((self.num_chains, self.NumSamples - 1,
                                   2))
        # index 1 for likelihood posterior and index 0 for Likelihood proposals.
        # Note all likilihood proposals plotted only
        accept_percent = np.zeros((self.num_chains, 1))
        accept_list = np.zeros((self.num_chains, self.NumSamples))

        pos_w = np.zeros((self.num_chains, self.NumSamples - burnin, self.num_param))

        fx_train_all = np.zeros((self.NumSamples - burnin, self.traindata.shape[0], self.topology[-1]))
        # rmse_train = np.zeros((self.num_chains, self.NumSamples - burnin))
        # mae_train = np.zeros((self.num_chains, self.NumSamples - burnin))
        # mape_train = np.zeros((self.num_chains, self.NumSamples - burnin))
        rmse_train = np.zeros((self.num_chains, self.NumSamples))
        indi_rmse_train = np.zeros((self.num_chains, self.NumSamples, self.topology[2]))
        mae_train = np.zeros((self.num_chains, self.NumSamples))
        mape_train = np.zeros((self.num_chains, self.NumSamples))

        acc_train = np.zeros((self.num_chains, self.NumSamples - burnin))
        fx_test_all = np.zeros((self.NumSamples - burnin, self.testdata.shape[0], self.topology[-1]))
        # rmse_test = np.zeros((self.num_chains, self.NumSamples - burnin))
        # mae_test = np.zeros((self.num_chains, self.NumSamples - burnin))
        # mape_test = np.zeros((self.num_chains, self.NumSamples - burnin))
        rmse_test = np.zeros((self.num_chains, self.NumSamples))
        indi_rmse_test = np.zeros((self.num_chains, self.NumSamples, self.topology[2]))
        mae_test = np.zeros((self.num_chains, self.NumSamples))
        mape_test = np.zeros((self.num_chains, self.NumSamples))

        acc_test = np.zeros((self.num_chains, self.NumSamples - burnin))
        # train_pred = np.zeros((self.traindata.shape[0], self.topology[-1]))
        # test_pred = np.zeros((self.testdata.shape[0], self.topology[-1]))

        for i in range(self.num_chains):
            file_name = self.path + '/posterior/pos_w/' + 'chain_' + str(self.temperatures[i]) + '.txt'
            dat = np.loadtxt(file_name)
            pos_w[i, :, :] = dat[burnin:, :]

            file_name = self.path + '/posterior/pos_likelihood/' + 'chain_' + str(self.temperatures[i]) + '.txt'
            dat = np.loadtxt(file_name)
            likelihood_rep[i, :] = dat[1:]

            file_name = self.path + '/posterior/accept_list/' + 'chain_' + str(self.temperatures[i]) + '.txt'
            dat = np.loadtxt(file_name)
            accept_list[i, :] = dat

            file_name = self.path + '/predictions/fxtrain_samples_chain_' + str(self.temperatures[i]) + '.npy'
            dat = np.load(file_name)
            fx_train_all += dat[burnin:]

            file_name = self.path + '/predictions/fxtest_samples_chain_' + str(self.temperatures[i]) + '.npy'
            dat = np.load(file_name)
            # fx_test_all[i,:,:] = dat[burnin:,:]
            fx_test_all += dat[burnin:]

            file_name = self.path + '/predictions/rmse_test_chain_' + str(self.temperatures[i]) + '.txt'
            dat = np.loadtxt(file_name)
            # rmse_test[i, :] = dat[burnin:]
            rmse_test[i, :] = dat

            file_name = self.path + '/predictions/rmse_train_chain_' + str(self.temperatures[i]) + '.txt'
            dat = np.loadtxt(file_name)
            rmse_train[i, :] = dat
            # rmse_train[i, :] = dat[burnin:]

            file_name = self.path + '/predictions/indi_rmse_test_chain_' + str(self.temperatures[i]) + '.txt'
            dat = np.loadtxt(file_name)
            # rmse_test[i, :] = dat[burnin:]
            indi_rmse_test[i, :] = dat.reshape((dat.shape[0], self.topology[2]))

            file_name = self.path + '/predictions/indi_rmse_train_chain_' + str(self.temperatures[i]) + '.txt'
            dat = np.loadtxt(file_name)
            # rmse_test[i, :] = dat[burnin:]
            indi_rmse_train[i, :] = dat.reshape((dat.shape[0], self.topology[2]))

            file_name = self.path + '/predictions/mae_test_chain_' + str(self.temperatures[i]) + '.txt'
            dat = np.loadtxt(file_name)
            mae_test[i, :] = dat

            file_name = self.path + '/predictions/mae_train_chain_' + str(self.temperatures[i]) + '.txt'
            dat = np.loadtxt(file_name)
            mae_train[i, :] = dat

            file_name = self.path + '/predictions/mape_test_chain_' + str(self.temperatures[i]) + '.txt'
            dat = np.loadtxt(file_name)
            mape_test[i, :] = dat

            file_name = self.path + '/predictions/mape_train_chain_' + str(self.temperatures[i]) + '.txt'
            dat = np.loadtxt(file_name)
            mape_train[i, :] = dat

            file_name = self.path + '/predictions/acc_test_chain_' + str(self.temperatures[i]) + '.txt'
            dat = np.loadtxt(file_name)
            acc_test[i, :] = dat[burnin:]

            file_name = self.path + '/predictions/acc_train_chain_' + str(self.temperatures[i]) + '.txt'
            dat = np.loadtxt(file_name)
            acc_train[i, :] = dat[burnin:]

        posterior = pos_w.transpose(2, 0, 1).reshape(self.num_param, -1)
        #
        # fx_train = fx_test_all.mean()  # need to comment this if need to save memory
        # fx_test = fx_test_all.transpose(2, 0, 1).reshape(self.testdata.shape[0], -1)
        fx_train_all /= self.num_chains
        fx_test_all /= self.num_chains
        fx_train = fx_train_all.mean(axis=0)
        fx_test = fx_test_all.mean(axis=0)
        # fx_test = fxtest_samples.reshape(self.num_chains*(self.NumSamples - burnin), self.testdata.shape[0]) # konarks version

        likelihood_vec = likelihood_rep.transpose(2, 0, 1).reshape(2, -1)

        # rmse_train = rmse_train.reshape(self.num_chains * (self.NumSamples - burnin), 1)
        # mae_train = mae_train.reshape(self.num_chains * (self.NumSamples - burnin), 1)
        # mape_train = mape_train.reshape(self.num_chains * (self.NumSamples - burnin), 1)
        # acc_train = acc_train.reshape(self.num_chains * (self.NumSamples - burnin), 1)
        # rmse_test = rmse_test.reshape(self.num_chains * (self.NumSamples - burnin), 1)
        # mae_test = rmse_test.reshape(self.num_chains * (self.NumSamples - burnin), 1)
        # mape_test = rmse_test.reshape(self.num_chains * (self.NumSamples - burnin), 1)
        # acc_test = acc_test.reshape(self.num_chains * (self.NumSamples - burnin), 1)

        rmse_train = rmse_train.mean(axis=0)
        indi_rmse_train = indi_rmse_train.mean(axis=0)
        mae_train = mae_train.mean(axis=0)
        mape_train = mape_train.mean(axis=0)
        acc_train = acc_train.mean(axis=0)
        rmse_test = rmse_test.mean(axis=0)
        indi_rmse_test = indi_rmse_test.mean(axis=0)
        mae_test = mae_test.mean(axis=0)
        mape_test = mape_test.mean(axis=0)
        acc_test = acc_test.mean(axis=0)

        accept_vec = accept_list

        print(accept_vec)

        accept = np.sum(accept_percent) / self.num_chains

        # np.savetxt(self.path + '/pos_param.txt', posterior.T)  # tcoment to save space

        np.savetxt(self.path + '/likelihood.txt', likelihood_vec.T, fmt='%1.5f')

        np.savetxt(self.path + '/accept_list.txt', accept_list, fmt='%1.2f')

        np.savetxt(self.path + '/acceptpercent.txt', [accept], fmt='%1.2f')

        np.savetxt(self.path + '/rmse_train.txt', rmse_train, fmt='%1.5f')
        np.savetxt(self.path + '/rmse_test.txt', rmse_test, fmt='%1.5f')
        np.savetxt(self.path + '/indi_rmse_train.txt', indi_rmse_train, fmt='%1.5f')
        np.savetxt(self.path + '/indi_rmse_test.txt', indi_rmse_test, fmt='%1.5f')
        np.savetxt(self.path + '/mae_train.txt', mae_train, fmt='%1.5f')
        np.savetxt(self.path + '/mae_test.txt', mae_test, fmt='%1.5f')
        np.savetxt(self.path + '/mape_train.txt', mape_train, fmt='%1.5f')
        np.savetxt(self.path + '/mape_test.txt', mape_test, fmt='%1.5f')
        return posterior, fx_train, fx_test, rmse_train, rmse_test, indi_rmse_train, indi_rmse_test, \
               mae_train, mae_test, mape_train, mape_test, acc_train, acc_test, likelihood_vec.T, \
               accept_vec, accept, fx_test_all

    def make_directory(self, directory):
        if not os.path.exists(directory):
            os.makedirs(directory)


def main():


    name = 'MMM8'


    #for d in os.listdir('./datasets/raw'):
    #   if osp.isfile(osp.join('datasets/raw', d)):
    #       name = osp.splitext(d)[0]

        

        #dataset = Dataset(name, 0.8, 5, 1, 5, 2, overwrite=False)

    


    #traindata = np.asarray(dataset.train)


    #testdata = np.asarray(dataset.test)

    
    raw_data = pd.read_csv('./datasets/raw/MMM.csv')['Close']
    raw_min = raw_data.min()
    raw_max = raw_data.max()
    data = raw_data.apply(lambda x: (x - raw_data.min()) / (raw_data.max() - raw_data.min()))
 
    #print(raw_data)
    #print(data) 

    traindata = np.genfromtxt('./datasets/MMM8_train.txt', delimiter = ' ') # scaled between 0,1 for sigmoid fuunction in output layer
    testdata = np.genfromtxt('./datasets/MMM8_test.txt', delimiter = ' ')

    print(traindata.shape)

    hidden = 10 # 5 used in paper
    ip = 5
    output = 5

    NumSample = 10000 # 100000 is used in the paper but 10000 gives similar results.

    topology = [ip, hidden, output]

    netw = topology

    y_test = testdata[:, netw[0]: netw[0] + netw[-1]]
    y_train = traindata[:, netw[0]: netw[0] + netw[-1]]

    maxtemp = 2 #  5 is used in the paper 
    #swap_ratio = 0.01  #
    num_chains = 8  # 10 used in paper
    swap_interval = 5 # int(swap_ratio * NumSample / num_chains)  #how ofen you swap neighbours. note if swap is more than Num_samples, its off
    burn_in = 0.5  #

    learn_rate = 0.05 # 0.1 used in paper  # in case langevin gradients are used. Can select other values, we found small value is ok.

    use_langevin_gradients = True  # False leaves it as Random-walk proposals. Note that Langevin gradients will take a bit more time computationally
    if output == 1:
        problemfolder = 'one_step_problemfolder/'
        problemfolder_db = 'one_step_results/'  # save main results
    else:
        problemfolder = 'problemfolder/'
        problemfolder_db = 'results/'

    filename = ""
    path = problemfolder + name
    if not os.path.exists(path):
        os.makedirs(path)
    else:
        shutil.rmtree(path)
        os.makedirs(path)

    path_db = problemfolder_db + name
    if not os.path.exists(path_db):
        os.makedirs(path_db)
    else:
        shutil.rmtree(path_db)
        os.makedirs(path_db)
    timer = time.time()

    langevin_prob = 0.5

    pt = ParallelTempering(use_langevin_gradients, learn_rate, traindata, testdata, topology, num_chains, maxtemp,
                            NumSample, swap_interval, langevin_prob, path)

    directories = [path + '/predictions/', path + '/posterior', path + '/results', path + '/surrogate',
                    path + '/surrogate/learnsurrogate_data', path + '/posterior/pos_w',
                    path + '/posterior/pos_likelihood', path + '/posterior/surg_likelihood',
                    path + '/posterior/accept_list']

    for d in directories:
        pt.make_directory(filename + d)

    pt.initialize_chains(burn_in)

    pos_w, fx_train, fx_test, rmse_train, rmse_test, indi_rmse_train, indi_rmse_test, mae_train, mae_test, mape_train, \
        mape_test, acc_train, acc_test, likelihood_rep, swap_perc, \
        accept_vec, accept, fx_test_all = pt.run_chains()

    list_end = accept_vec.shape[1]
    accept_ratio = accept_vec[:, list_end - 1:list_end] / list_end
    accept_per = np.mean(accept_ratio) * 100

    print(accept_per, ' accept_per')

    timer2 = time.time()

    timetotal = (timer2 - timer) / 60
    print(timetotal, 'min taken')
 

    final_metrics = []
    for metric in [rmse_train, rmse_test, mae_train, mae_test, mape_train, mape_test]:
        final_metrics.append(np.mean(metric))
        final_metrics.append(np.std(metric))
        final_metrics.append(np.amin(metric))
        # rmse_tr = np.mean(rmse_train[:])
        # rmsetr_std = np.std(rmse_train[:])
        # rmsetr_max = np.amin(rmse_train[:])
        #
        # rmse_tes = np.mean(rmse_test[:])
        # rmsetest_std = np.std(rmse_test[:])
        # rmsetes_max = np.amin(rmse_test[:])

    print( final_metrics, '  final_metrics')

    outres = open(path + '/result.txt', "a+")
    outres_db = open(path_db + '/result.txt', "a+")

    resultingfile = open(path + '/master_result_file.txt', 'a+')
    resultingfile_db = open(path_db + '/master_result_file.txt', 'a+')

    xv = name

    allres = np.asarray(
        [NumSample, maxtemp, swap_interval, langevin_prob, learn_rate, swap_perc, accept_per, timetotal] + final_metrics)

    np.savetxt(outres_db, allres, fmt='%1.4f', newline=' ')
    np.savetxt(resultingfile_db, allres, fmt='%1.4f', newline=' ')
    np.savetxt(resultingfile_db, [xv], fmt="%s", newline=' \n')

    np.savetxt(outres, allres, fmt='%1.4f', newline=' ')
    np.savetxt(resultingfile, allres, fmt='%1.4f', newline=' ')
    np.savetxt(resultingfile, [xv], fmt="%s", newline=' \n')

    np.savetxt(path_db + '/ptmcmc_pred_test_nor.txt', fx_test, fmt='%1.6f')

    n = len(y_test)
    indi_mae=sum(np.abs(y_test- fx_test)) / n
    indi_mape= sum(np.abs((y_test- fx_test) / (y_test + 1e-6))) / n * 100
    indi_rmse_cal=rmse = np.sqrt(sum(np.square(y_test- fx_test)) / n)
    np.savetxt(path_db + '/ptmcmc_indi_mae.txt', indi_mae, fmt='%1.6f')
    np.savetxt(path_db + '/ptmcmc_indi_mape.txt', indi_mape, fmt='%1.6f')
    np.savetxt(path_db + '/ptmcmc_indi_rmse.txt', indi_rmse_cal, fmt='%1.6f')


    fx_test = fx_test * (raw_max -raw_min)+ raw_min
    y_test = y_test * (raw_max -raw_min)+ raw_min
    np.savetxt(path_db + '/ptmcmc_test_y.txt', y_test, fmt='%1.6f')
    np.savetxt(path_db + '/ptmcmc_pred_test.txt', fx_test, fmt='%1.6f')

    x = np.linspace(0, rmse_train.shape[0], num=rmse_train.shape[0])

    # plt.plot(x, rmse_train, '.',   label='Test')
    # plt.plot(x, rmse_test,  '.', label='Train')
    # plt.legend(loc='upper right')
    #
    # plt.xlabel('Samples', fontsize=12)
    # plt.ylabel('RMSE', fontsize=12)
    #
    # plt.savefig(path+'/rmse_samples.png')
    # plt.clf()

    plt.plot(x, rmse_test.flatten(), label='Test')
    plt.plot(x, rmse_train.flatten(), label='Train')
    plt.legend(loc='upper right')

    plt.xlabel('Samples', fontsize=12)
    plt.ylabel('RMSE', fontsize=12)
    plt.title('{} ptmcmc rmse'.format(name))
    plt.savefig(path_db + '/rmse_samples.png')
    plt.clf()

    # plt.plot(x, rmse_test.flatten(), label='Test')
    # plt.plot(x, rmse_train.flatten(), label='Train')
    # plt.legend(loc='upper right')
    #
    # plt.xlabel('Samples', fontsize=12)
    # plt.ylabel('RMSE', fontsize=12)
    #
    # plt.savefig(path + '/rmse_samples.png')
    # plt.clf()
    fx_test_all = fx_test_all * (raw_max - raw_min) + raw_min
    fx_low = np.percentile(fx_test_all,5,axis=0)
    fx_high = np.percentile(fx_test_all,95,axis=0)
    print(np.shape(fx_high))
    x = np.linspace(1, testdata.shape[0], num=testdata.shape[0])
    if output != 1:
        for i in [0, 1, 4]:

            plt.plot(x, fx_test[:, i], label='Prediction')
            plt.plot(x, y_test[:, i], label='Actual')
            plt.plot(x, fx_low[:, i], label='Uncertainty',color='blue', linestyle='--',alpha=0.25)
            plt.plot(x, fx_high[:, i],color='blue',linestyle='--',alpha=0.25)
            plt.fill_between(x, fx_low[:, i], fx_high[:, i], facecolor='grey', alpha=0.2)
            plt.legend(loc='upper right')
            plt.xlabel('Time (days)')
            plt.ylabel('Closing Price (AUD)')
            #plt.title('{} ptmcmc five_steps_ahead_{}'.format(name, i + 1))
            plt.savefig(path_db + '/pred_test_{}.png'.format(i + 1))
            plt.clf()
    else:
        plt.plot(x, fx_test, label='Prediction')
        plt.plot(x, y_test, label='Actual')
        plt.legend(loc='upper right')
        plt.xlabel('Time (Day)')
        plt.ylabel('Closing Price (USD)')
        #plt.title('{} ptmcmc one_step_ahead'.format(name))
        plt.savefig(path_db + '/pred_test.png')
        plt.clf()

    likelihood = likelihood_rep[:, 0]  # just plot proposed likelihood
    likelihood = np.asarray(np.split(likelihood, num_chains))

    # Plots
    plt.plot(likelihood.T)

    plt.xlabel('Samples', fontsize=12)
    plt.ylabel(' Log-Likelihood', fontsize=12)

    plt.savefig(path + '/likelihood.pdf')
    plt.clf()

    plt.plot(likelihood.T)

    plt.xlabel('Samples', fontsize=12)
    plt.ylabel(' Log-Likelihood', fontsize=12)

    plt.savefig(path_db + '/likelihood.pdf')
    plt.clf()

    plt.plot(accept_vec.T)
    plt.xlabel('Samples', fontsize=12)
    plt.ylabel(' Number accepted proposals', fontsize=12)

    plt.savefig(path_db + '/accept.png')

    plt.clf()

    # mpl_fig = plt.figure()
    # ax = mpl_fig.add_subplot(111)

    # ax.boxplot(pos_w)

    # ax.set_xlabel('[W1] [B1] [W2] [B2]')
    # ax.set_ylabel('Posterior')

    # plt.legend(loc='upper right')

    # plt.title("Boxplot of Posterior W (weights and biases)")
    # plt.savefig(path+'/w_pos.png')
    # plt.savefig(path+'/w_pos.svg', format='svg', dpi=600)

    # plt.clf()
    # dir()
    gc.collect()
    outres.close()
    resultingfile.close()
    resultingfile_db.close()
    outres_db.close()

if __name__ == "__main__":
    main()