"""
This module contains the VegasFlow class and all its auxiliary functions
The main interfaces of this class are the class `VegasFlow` and the
`vegas_wrapper`
"""
import json
import numpy as np
import tensorflow as tf
from vegasflow.configflow import (
DTYPE,
DTYPEINT,
fone,
fzero,
float_me,
ione,
int_me,
BINS_MAX,
ALPHA,
)
from vegasflow.monte_carlo import MonteCarloFlow, wrapper, sampler
from vegasflow.utils import consume_array_into_indices
import logging
logger = logging.getLogger(__name__)
FBINS = float_me(BINS_MAX)
@tf.function(
input_signature=[
tf.TensorSpec(shape=[None, None], dtype=DTYPE),
tf.TensorSpec(shape=[None, BINS_MAX + 1], dtype=DTYPE),
]
)
def importance_sampling_digest(xn, divisions):
"""Importance sampling algorithm:
receives a random array (number of dimensions, number of dim)
containing information about from which bins in the
grid (n_dims, BINS_MAX+1) the random points have to be sampled
This algorithm is shared between the simplest form of Vegas
(VegasFlow: only importance sampling)
and Vegas+ (VegasFlowPlus: importance and stratified sampling)
and so it has been lifted to its own function
Parameters:
----------
xn: float tensor (n_dim, n_events)
which bins to sample from
divisions: float tensor (n_dims, BINS_MAX+1)
grid of divisions for the importance sampling algorithm
Returns
-------
ind_i: integer tensor (n_events, n_dim)
index in the divisions grid from which the points should be sampled
x: float tensor (n_events, n_dim)
random values sampled in the divisions grid
xdelta: float tensor (n_events,)
weight of the random points
"""
ind_i = int_me(xn)
# Get the value of the left and right sides of the bins
ind_f = ind_i + ione
x_ini = tf.gather(divisions, ind_i, batch_dims=1)
x_fin = tf.gather(divisions, ind_f, batch_dims=1)
# Compute the width of the bins
xdelta = x_fin - x_ini
# Take the decimal part of bin (i.e., how deep within the bin)
aux_rand = xn - tf.math.floor(xn)
x = x_ini + xdelta * aux_rand
# Compute the weight of the points
weights = tf.reduce_prod(xdelta * FBINS, axis=0)
# Tranpose the output to be what the external functions expect
x = tf.transpose(x)
ind_i = tf.transpose(ind_i)
return ind_i, x, weights
# Auxiliary functions for Vegas
@tf.function(
input_signature=[
tf.TensorSpec(shape=[None, None], dtype=DTYPE),
tf.TensorSpec(shape=[None, BINS_MAX + 1], dtype=DTYPE),
]
)
def _generate_random_array(rnds, divisions):
"""
Generates the Vegas random array for any number of events
Parameters
----------
rnds: array shaped (None, n_dim)
Random numbers used as an input for Vegas
divisions: array shaped (n_dim, BINS_MAX+1)
vegas grid
Returns
-------
x: array (None, n_dim)
Vegas random output
w: array (None,)
Weight of each set of (n_dim) random numbers
div_index: array (None, n_dim)
division index in which each (n_dim) set of random numbers fall
"""
# Get the boundaries of the random numbers
# reg_i = fzero
# reg_f = fone
# Get the index of the division we are interested in
xn = FBINS * (fone - tf.transpose(rnds))
# Compute the random number between 0 and 1
# and the index of the bin where it has been sampled from
ind_xn, x, weights = importance_sampling_digest(xn, divisions)
# Compute the random number between the limits
# commented, for now only from 0 to 1
# x = reg_i + rand_x * (reg_f - reg_i)
return x, weights, ind_xn
@tf.function(
input_signature=[
tf.TensorSpec(shape=[BINS_MAX], dtype=DTYPE),
tf.TensorSpec(shape=[BINS_MAX + 1], dtype=DTYPE),
]
)
def refine_grid_per_dimension(t_res_sq, subdivisions):
"""
Modifies the boundaries for the vegas grid for a given dimension
Parameters
----------
`t_res_sq`: tensor
array of results squared per bin
`subdivision`: tensor
current boundaries for the grid
Returns
-------
`new_divisions`: tensor
array with the new boundaries of the grid
"""
# Define some constants
paddings = int_me([[1, 1]])
tmp_meaner = tf.fill([BINS_MAX - 2], float_me(3.0))
meaner = tf.pad(tmp_meaner, paddings, constant_values=2.0)
# Pad the vector of results
res_padded = tf.pad(t_res_sq, paddings)
# First we need to smear out the array of results squared
smeared_tensor_tmp = res_padded[1:-1] + res_padded[2:] + res_padded[:-2]
smeared_tensor = tf.maximum(smeared_tensor_tmp / meaner, float_me(1e-30))
# Now we refine the grid according to
# journal of comp phys, 27, 192-203 (1978) G.P. Lepage
sum_t = tf.reduce_sum(smeared_tensor)
log_t = tf.math.log(smeared_tensor)
aux_t = (1.0 - smeared_tensor / sum_t) / (tf.math.log(sum_t) - log_t)
wei_t = tf.pow(aux_t, ALPHA)
ave_t = tf.reduce_sum(wei_t) / BINS_MAX
###### Auxiliary functions for the while loop
@tf.function
def while_check(bin_weight, *args):
"""Checks whether the bin has enough weight
to beat the average"""
return bin_weight < ave_t
@tf.function(
input_signature=[
tf.TensorSpec(shape=[], dtype=DTYPE),
tf.TensorSpec(shape=[], dtype=DTYPEINT),
tf.TensorSpec(shape=[], dtype=DTYPE),
tf.TensorSpec(shape=[], dtype=DTYPE),
]
)
def while_body(bin_weight, n_bin, cur, prev):
"""Fills the bin weight until it surpassed the avg
once it's done, returns the limits of the last bin"""
n_bin += 1
bin_weight += wei_t[n_bin]
prev = cur
cur = subdivisions[n_bin + 1]
return bin_weight, n_bin, cur, prev
###########################
# And now resize all bins
new_bins = [fzero]
# Auxiliary variables
bin_weight = fzero
n_bin = -1
cur = fzero
prev = fzero
for _ in range(BINS_MAX - 1):
bin_weight, n_bin, cur, prev = tf.while_loop(
while_check,
while_body,
(bin_weight, n_bin, cur, prev),
parallel_iterations=1,
)
bin_weight -= ave_t
delta = (cur - prev) * bin_weight / wei_t[n_bin]
new_bins.append(cur - delta)
new_bins.append(fone)
new_divisions = tf.stack(new_bins)
return new_divisions
####### VegasFlow
class VegasFlow(MonteCarloFlow):
    """
    Implementation of the importance sampling algorithm from Vegas.

    The integration domain is the unit hypercube; the adaptive grid holds
    ``grid_bins`` boundaries per dimension and, while ``train`` is active,
    is refined after every iteration.

    Parameters
    ----------
    n_dim: int
        number of dimensions to be integrated
    n_events: int
        number of events per iteration
    train: bool
        whether to train the grid
    main_dimension: int
        in case of vectorial output, main dimension in which to train
    """

    def __init__(self, n_dim, n_events, train=True, main_dimension=0, **kwargs):
        super().__init__(n_dim, n_events, **kwargs)
        # If training is True, the grid will be changed after every iteration
        # otherwise it will be frozen
        self.train = train
        # Initialize grid: grid_bins equispaced boundaries in [0, 1],
        # replicated for every dimension into a (n_dim, grid_bins) variable
        self.grid_bins = BINS_MAX + 1
        subdivision_np = np.linspace(0, 1, self.grid_bins)
        divisions_np = subdivision_np.repeat(n_dim).reshape(-1, n_dim).T
        self.divisions = tf.Variable(divisions_np, dtype=DTYPE)
        # For vectorial integrands, output index used to train the grid
        self._main_dimension = main_dimension

    def _can_run_vectorial(self, expected_shape):
        """Whether vectorial integrands can be run.

        Only implemented for the main class at the moment, not for children.

        Raises
        ------
        ValueError
            if the configured main dimension falls outside the output shape
        """
        if self._main_dimension >= expected_shape[-1]:
            raise ValueError(
                f"The main dimension index ({self._main_dimension}) is greater than "
                f"the dimensionality of the output ({expected_shape[-1]}). "
                "Remember that arrays in python are 0-indexed!"
            )
        return self.__class__.__name__ == "VegasFlow"

    def make_differentiable(self):
        """Freeze the grid if the function is to be called within a graph"""
        if self.train:
            logger.warning("Freezing the grid")
            self.freeze_grid()
        return super().make_differentiable()

    def freeze_grid(self):
        """Stops the grid from refining any more"""
        self.train = False
        self._recompile()

    def unfreeze_grid(self):
        """Enable the refining of the grid"""
        self.train = True
        self._recompile()

    def save_grid(self, file_name):
        """Save the `divisions` array in a json file

        Parameters
        ----------
        `file_name`: str
            Filename in which to save the checkpoint
        """
        div_np = self.divisions.numpy()
        # Store the integrand name (when known) so a later `load_grid`
        # can warn if the grid is reused with a different integrand
        if self._integrand:
            int_name = self._integrand.__name__
        else:
            int_name = ""
        json_dict = {
            "dimensions": self.n_dim,
            "ALPHA": ALPHA,
            "BINS": self.grid_bins,
            "integrand": int_name,
            "grid": div_np.tolist(),
        }
        with open(file_name, "w") as f:
            # explicit integer indent (previously `indent=True`, which
            # only worked through bool->int coercion)
            json.dump(json_dict, f, indent=2)

    def load_grid(self, file_name=None, numpy_grid=None):
        """Load the `divisions` array from a json file
        or from a numpy_array

        Parameters
        ----------
        `file_name`: str
            Filename in which the grid json is stored
        `numpy_grid`: np.array
            Numpy array to substitute divisions with

        Raises
        ------
        ValueError
            if both (or neither) of `file_name` and `numpy_grid` are given,
            or if the grid dimensions/bins do not match the current settings
        """
        if file_name is not None and numpy_grid is not None:
            raise ValueError(
                "Received both a numpy grid and a file_name to load the grid from. "
                "Ambiguous call to `load_grid`"
            )
        # If it received a file, loads up the grid
        if file_name:
            with open(file_name, "r") as f:
                json_dict = json.load(f)
            # First check the parameters of the grid are unchanged
            grid_dim = json_dict.get("dimensions")
            grid_bins = json_dict.get("BINS")
            # Check that the integrand is the same one
            if self._integrand:
                integrand_name = self._integrand.__name__
                integrand_grid = json_dict.get("integrand")
                if integrand_name != integrand_grid:
                    logger.warning(
                        "The grid was written for the integrand: %s "
                        "which is different from %s",
                        integrand_grid,
                        integrand_name,
                    )
            # Now that everything is clear, let's load up the grid
            numpy_grid = np.array(json_dict["grid"])
        elif numpy_grid is not None:
            grid_dim = numpy_grid.shape[0]
            grid_bins = numpy_grid.shape[1]
        else:
            raise ValueError("load_grid was called but no grid was provided!")
        # Check that the grid has the right dimensions
        if grid_dim is not None and self.n_dim != grid_dim:
            raise ValueError(
                f"Received a {grid_dim}-dimensional grid while VegasFlow "
                f"was instantiated with {self.n_dim} dimensions"
            )
        if grid_bins is not None and self.grid_bins != grid_bins:
            raise ValueError(
                f"The received grid contains {grid_bins} bins while the "
                f"current setting is of {self.grid_bins} bins"
            )
        if file_name:
            logger.info(" > SUCCESS: Loaded grid from %s", file_name)
        self.divisions.assign(numpy_grid)

    def refine_grid(self, arr_res2):
        """Receives an array with the values of the integral squared per
        bin per dimension (`arr_res2.shape = (n_dim, BINS_MAX)`)
        and reshapes the `divisions` attribute accordingly

        Parameters
        ----------
        `arr_res2`: result of the integrand squared per dimension and grid bin

        Function not compiled
        """
        # Each dimension's boundaries are refined independently
        for j in range(self.n_dim):
            new_divisions = refine_grid_per_dimension(arr_res2[j, :], self.divisions[j, :])
            self.divisions[j, :].assign(new_divisions)

    def _digest_random_generation(self, rnds):
        """Generates ``n_events`` random numbers sampled in the
        adapted Vegas Grid

        Returns the points, their importance-sampling weights and the
        grid-bin index each point was drawn from.
        """
        x, w, ind = _generate_random_array(rnds, self.divisions)
        return x, w, ind

    def _importance_sampling_array_filling(self, results2, indices):
        """Receives an array of results squared for every event
        and an array of indices describing in which bin each result fall.
        Fills an array with the total result in each bin to be used by
        the importance sampling algorithm

        Returns an empty list when training is disabled (the result is
        only consumed by `refine_grid`).
        """
        if not self.train:
            return []
        arr_res2 = []
        # If the training is active, save the result of the integral sq
        # accumulated per (dimension, bin)
        for j in range(self.n_dim):
            arr_res2.append(
                consume_array_into_indices(
                    results2, indices[:, j : j + 1], int_me(self.grid_bins - 1)
                )
            )
        return tf.reshape(arr_res2, (self.n_dim, -1))

    def _run_event(self, integrand, ncalls=None):
        """Runs one step of Vegas.

        Parameters
        ----------
        `integrand`: function to integrate
        `ncalls`: how many events to run in this step

        Returns
        -------
        `res`: sum of the result of the integrand for all events
        `res2`: sum of the result squared of the integrand for all events
        `arr_res2`: result of the integrand squared per dimension and grid bin
        """
        n_events = self.n_events if ncalls is None else ncalls
        # Generate all random numbers for this iteration
        x, xjac, ind = self._generate_random_array(n_events)
        # Now compute the integrand
        int_result = integrand(x, weight=xjac)
        if self._vectorial:
            # Broadcast the per-event weight over all output dimensions
            xjac = tf.reshape(xjac, (-1, 1))
        tmp = xjac * int_result
        tmp2 = tf.square(tmp)
        # Compute the final result for this step
        res = tf.reduce_sum(tmp, axis=0)
        res2 = tf.reduce_sum(tmp2, axis=0)
        # If this is a vectorial integrand, make sure that only the main dimension
        # is used for the grid training
        if self._vectorial:
            tmp2 = tmp2[:, self._main_dimension]
        arr_res2 = self._importance_sampling_array_filling(tmp2, ind)
        return res, res2, arr_res2

    def _iteration_content(self):
        """Steps to follow per iteration

        Returns
        -------
        `res`: integral estimate of this iteration
        `sigma`: monte carlo error of this iteration
        """
        # Compute the result
        res, res2, arr_res2 = self.run_event()
        # Compute the error (variance of the mean estimator, clamped at 0)
        err_tmp2 = (self.n_events * res2 - tf.square(res)) / (self.n_events - fone)
        sigma = tf.sqrt(tf.maximum(err_tmp2, fzero))
        # If training is active, act post integration
        if self.train:
            self.refine_grid(arr_res2)
        return res, sigma

    def _run_iteration(self):
        """Runs one iteration of the Vegas integrator"""
        return self._iteration_content()
def vegas_wrapper(integrand, n_dim, n_iter, total_n_events, **kwargs):
"""Convenience wrapper
Parameters
----------
`integrand`: tf.function
`n_dim`: number of dimensions
`n_iter`: number of iterations
`n_events`: number of events per iteration
Returns
-------
`final_result`: integral value
`sigma`: monte carlo error
"""
return wrapper(VegasFlow, integrand, n_dim, n_iter, total_n_events, **kwargs)
def vegas_sampler(*args, **kwargs):
"""Convenience wrapper for sampling random numbers
Parameters
----------
`integrand`: tf.function
`n_dim`: number of dimensions
`n_events`: number of events per iteration
`training_steps`: number of training_iterations
Returns
-------
`sampler`: a reference to the generate_random_array method of the integrator class
"""
return sampler(VegasFlow, *args, **kwargs)