include/dcsam/DCFactor.h

/**
 * @file DCFactor.h
 * @brief Custom discrete-continuous factor
 * @author Kevin Doherty, kdoherty@mit.edu
 * Copyright 2021 The Ambitious Folks of the MRG
 */

#pragma once

#include <gtsam/discrete/DiscreteFactor.h>
#include <gtsam/discrete/DiscreteKey.h>
#include <gtsam/nonlinear/NonlinearFactor.h>
#include <gtsam/nonlinear/Symbol.h>
#include <math.h>

#include <algorithm>
#include <limits>
#include <string>
#include <vector>

#include "DCSAM_types.h"

namespace dcsam {

/**
 * @brief Abstract class implementing a discrete-continuous factor.
 *
 * keys_ member variable stores keys for *continuous* variables.
 * discreteKeys_ contains the keys (plus cardinalities) for *discrete*
 * variables.
 */
class DCFactor : public gtsam::Factor {
 protected:
  // Set of DiscreteKeys for this factor.
  gtsam::DiscreteKeys discreteKeys_;

 public:
  using Base = gtsam::Factor;

  DCFactor() = default;

  /**
   * Base constructor for a DCFactor from a set of discrete keys and continuous
   * keys
   *
   * @param continuousKeys - the keys for *continuous* variables
   * @param discreteKeys - the keys for *discrete* variables
   */
  DCFactor(const gtsam::KeyVector& continuousKeys,
           const gtsam::DiscreteKeys& discreteKeys)
      : Base(continuousKeys), discreteKeys_(discreteKeys) {}

  // NOTE unsure if needed?
  explicit DCFactor(const gtsam::DiscreteKeys& discreteKeys)
      : discreteKeys_(discreteKeys) {}

  DCFactor& operator=(const DCFactor& rhs) {
    Base::operator=(rhs);
    discreteKeys_ = rhs.discreteKeys_;
    return *this;
  }

  virtual ~DCFactor() = default;

  /**
   * Return the error for the DCFactor given an assignment to the variables
   * referenced by the discrete keys and the continuous keys (`keys_`).
   *
   * This will be specific to the model being implemented, so it is a pure
   * virtual function and must be overridden.
   *
   * NOTE: Depending on the application, it may be important that the error
   * function is *normalized*, i.e. it corresponds to a proper negative
   * log-likelihood, rather than the negative log-likelihood with normalization
   * constants discarded.
   *
   * @param continuousVals - the values assigned to the continuous variables,
   * must contain keys in keys_ member variable
   * @param discreteVals - likewise, the values assigned to discrete variables,
   * must contain keys in discreteKeys_
   * @return error (usually the negative log-likelihood) for the measurement
   * model as a double.
   */
  virtual double error(
      const gtsam::Values& continuousVals,
      const gtsam::DiscreteFactor::Values& discreteVals) const = 0;

  /**
   * Linearize the error function with respect to the continuous
   * variables (given in `keys_`) at the point specified by `continuousVals`.
   * Since this Jacobian can be dependent on the assignment to discrete
   * variables as well, they are required as a parameter.
   *
   * This will be specific to the model being implemented, so it is a pure
   * virtual function and must be overridden.
   *
   * @param continuousVals - Assignment to the continuous variables in `keys_`
   * @param discreteVals - Likewise, assignment to the discrete variables in
   * `discreteKeys__`.
   */
  virtual boost::shared_ptr<gtsam::GaussianFactor> linearize(
      const gtsam::Values& continuousVals,
      const DiscreteValues& discreteVals) const = 0;

  /**
   * Returns true when the DCFactor is equal to `other`
   *
   * This will be specific to the model being implemented, so it is a pure
   * virtual function and must be overridden.
   *
   * @param other - the DCFactor for which to test equality.
   * @param tol = 1e-9 - numerical tolerance for any floating point comparisons.
   */
  virtual bool equals(const DCFactor& other, double tol = 1e-9) const = 0;

  /**
   * Returns the number of rows in the Jacobian with respect to the continuous
   * variables for this factor. Internally this is used in the conversion to a
   * gtsam::NonlinearFactor
   *
   * TODO(kevin): not sure if needed???
   *
   * This will be specific to the model being implemented, so it is a pure
   * virtual function and must be overridden
   *
   * @return the dimension (number of rows) in the Jacobian of the `error`
   * function with respect to continuous variables for
   */
  virtual size_t dim() const = 0;

  /*
   * Return the discrete keys for this factor.
   */
  gtsam::DiscreteKeys discreteKeys() const { return discreteKeys_; }

  /**
   * Converts the DCFactor to a gtsam::DecisionTreeFactor. Internally, this will
   * be used to generate a gtsam::DiscreteFactor type, which itself requires a
   * conversion function to gtsam::DecisionTreeFactor for inference using GTSAM.
   *
   * Performing this conversion can be problem specific, so we allow for the
   * option to override, but try to implement a sensible default: we assume the
   * error function can be called setting each discrete key's variable
   * individually, and the overall DCFactor can itself be factored as a product
   * of unary gtsam::DecisionTreeFactors.
   *
   * Alternative implementations might consider something like the
   * gtsam::AllDiff approach here:
   * https://github.com/borglab/gtsam/blob/43e8f1e5aeaf11890262722c1e5e04a11dbf9d75/gtsam_unstable/discrete/AllDiff.cpp#L43
   *
   * @param continuousVals - an assignment to the continuous variables
   * @param discreteVals -
   * @return a gtsam::DecisionTreeFactor implementing this DCFactor.
   */
  virtual gtsam::DecisionTreeFactor toDecisionTreeFactor(
      const gtsam::Values& continuousVals,
      const DiscreteValues& discreteVals) const {
    gtsam::DecisionTreeFactor converted;
    for (const gtsam::DiscreteKey& dkey : discreteKeys_) {
      std::vector<double> probs = evalProbs(dkey, continuousVals);
      // Cardinality of gtsam::DiscreteKey is located at `second`
      assert(probs.size() == dkey.second);
      gtsam::DecisionTreeFactor unary(dkey, probs);
      converted = converted * unary;
    }
    return converted;
  }

  /**
   * Calculate a normalizing constant for this DCFactor. Most implementations
   * will be able to use the helper function
   * nonlinearFactorLogNormalizingConstant provided below for most of the
   * calculation.
   * TODO(Kurran) is this the cleanest way to do this? Seems necessary for the
   * DCMaxMixtureFactor implementations etc...
   */
  virtual double logNormalizingConstant(const gtsam::Values& values) const {
    throw std::logic_error(
        "Normalizing constant not implemented."
        "One or more of the factors in use requires access to the normalization"
        "constant for a child class of DCFactor, but`logNormalizingConstant` "
        "has not been overridden.");
  }

  /**
   * Default for computing the _negative_ normalizing constant for the
   * measurement likelihood (since we are minimizing the _negative_
   * log-likelihood), to be used as a utility for computing the
   * DCFactorLogNormalizingConstant.
   */
  template <typename NonlinearFactorType>
  double nonlinearFactorLogNormalizingConstant(
      const NonlinearFactorType& factor, const gtsam::Values& values) const {
    // Information matrix (inverse covariance matrix) for the factor.
    gtsam::Matrix infoMat;

    // NOTE: This is sloppy, is there a cleaner way?
    boost::shared_ptr<NonlinearFactorType> fPtr =
        boost::make_shared<NonlinearFactorType>(factor);
    boost::shared_ptr<NonlinearFactorType> factorPtr(fPtr);

    // If this is a NoiseModelFactor, we'll use its noiseModel to
    // otherwise noiseModelFactor will be nullptr
    boost::shared_ptr<gtsam::NoiseModelFactor> noiseModelFactor =
        boost::dynamic_pointer_cast<gtsam::NoiseModelFactor>(factorPtr);
    if (noiseModelFactor) {
      // If dynamic cast to NoiseModelFactor succeeded, see if the noise model
      // is Gaussian
      gtsam::noiseModel::Base::shared_ptr noiseModel =
          noiseModelFactor->noiseModel();

      boost::shared_ptr<gtsam::noiseModel::Gaussian> gaussianNoiseModel =
          boost::dynamic_pointer_cast<gtsam::noiseModel::Gaussian>(noiseModel);
      if (gaussianNoiseModel) {
        // If the noise model is Gaussian, retrieve the information matrix
        infoMat = gaussianNoiseModel->information();
      } else {
        // If the factor is not a Gaussian factor, we'll linearize it to get
        // something with a normalized noise model
        // TODO(kevin): does this make sense to do? I think maybe not in
        // general? Should we just yell at the user?
        boost::shared_ptr<gtsam::GaussianFactor> gaussianFactor =
            factor.linearize(values);
        infoMat = gaussianFactor->information();
      }
    }

    // Compute the (negative) log of the normalizing constant
    return -(factor.dim() * log(2.0 * M_PI) / 2.0) -
           (log(infoMat.determinant()) / 2.0);
  }

  /**
   * Obtain the likelihood function for a single discrete variable conditioned
   * on continuous values. Since the `error` function typically represents the
   * negative log-likelihood, we compute `exp(-error)`.
   *
   * NOTE: Depending on the application, it may be important that the error
   * function is *normalized*, i.e. it corresponds to a proper negative
   * log-likelihood, rather than the negative log-likelihood with normalization
   * constants discarded.
   *
   * For this, we assume that the `error` function can be called with only a
   * single discrete value set, though this may be dependent on the particular
   * implementation behavior desired. At present, this is only used internally
   * to specify the default behavior for `toDecisionTreeFactor`.
   *
   * @param dk - the discrete key to evaluate the likelihood for
   * @param continuousVals - an assignment to the continuous valued variables
   * @return a vector of length == cardinality of dk specifying the probability
   * of each possible assignment to dk.
   */
  std::vector<double> evalProbs(const gtsam::DiscreteKey& dk,
                                const gtsam::Values& continuousVals) const {
    /*
     * Normalizing a set of log probabilities in a numerically stable way is
     * tricky. To avoid overflow/underflow issues, we compute the largest
     * (finite) log probability and subtract it from each log probability before
     * normalizing. This comes from the observation that if:
     *    p_i = exp(L_i) / ( sum_j exp(L_j) ),
     * Then,
     *    p_i = exp(Z) exp(L_i - Z) / (exp(Z) sum_j exp(L_j - Z)),
     *        = exp(L_i - Z) / ( sum_j exp(L_j - Z) )
     *
     * Setting Z = max_j L_j, we can avoid numerical issues that arise when all
     * of the (unnormalized) log probabilities are either very large or very
     * small.
     */
    std::vector<double> logProbs;
    double maxLogProb = -std::numeric_limits<double>::infinity();
    for (size_t i = 0; i < dk.second; i++) {
      DiscreteValues testDiscreteVals;
      testDiscreteVals[dk.first] = i;
      // Recall: `error` returns -log(prob), so we compute exp(-error) to
      // recover probability
      double logProb = -error(continuousVals, testDiscreteVals);
      logProbs.push_back(logProb);
      if ((logProb != std::numeric_limits<double>::infinity()) &&
          logProb > maxLogProb) {
        maxLogProb = logProb;
      }
    }

    // After computing the max = "Z" of the log probabilities L_i, we compute
    // the log of the normalizing constant, log S, where S = sum_j exp(L_j - Z).
    double total = 0.0;
    for (size_t i = 0; i < dk.second; i++) {
      double probPrime = exp(logProbs[i] - maxLogProb);
      total += probPrime;
    }
    double logTotal = log(total);

    // Now we compute the (normalized) probability (for each i):
    // p_i = exp(L_i - Z - log S)
    double checkNormalization = 0.0;
    std::vector<double> probs;
    for (size_t i = 0; i < dk.second; i++) {
      double prob = exp(logProbs[i] - maxLogProb - logTotal);
      probs.push_back(prob);
      checkNormalization += prob;
    }

    // Numerical tolerance for floating point comparisons
    double tol = 1e-9;

    if (!gtsam::fpEqual(checkNormalization, 1.0, tol)) {
      std::string errMsg =
          std::string(
              "DCFactor::evalProbs failed to normalize probabilities. ") +
          std::string("Expected value 1.0. Got value: ") +
          std::to_string(checkNormalization) +
          std::string(
              "\n This could have resulted from numerical overflow/underflow.");
      throw std::logic_error(errMsg);
    }

    return probs;
  }

  /**
   * Take the product of this DCFactor (as a gtsam::DecisionTreeFactor)
   * conditioned on an assignment to the continous variables, `continuousVals`
   * with another gtsam::DecisionTreeFactor `f`. Used internally by GTSAM to
   * solve discrete factor graphs.
   *
   * @param f - the gtsam::DecisionTreeFactor to be multiplied by this DCFactor
   * @param continuousVals - an assignment to the continuous variables
   * (specified by keys_).
   * @return a gtsam::DecisionTreeFactor representing the product of this factor
   * with `f`.
   */
  gtsam::DecisionTreeFactor conditionalTimes(
      const gtsam::DecisionTreeFactor& f, const gtsam::Values& continuousVals,
      const DiscreteValues& discreteVals) const {
    return toDecisionTreeFactor(continuousVals, discreteVals) * f;
  }
};
}  // namespace dcsam