autodiff gaussian width parameter #4782
shogun/kernel/GaussianKernel.cpp
@@ -6,12 +6,15 @@
  * Tonmoy Saikia, Sergey Lisitsyn, Matt Aasted, Sanuj Sharma
  */

+#include <Eigen/Core>
+#include <unsupported/Eigen/AutoDiff>
 #include <shogun/lib/common.h>
 #include <shogun/kernel/GaussianKernel.h>
 #include <shogun/features/DotFeatures.h>
 #include <shogun/distance/EuclideanDistance.h>
 #include <shogun/mathematics/Math.h>

 using namespace shogun;

 CGaussianKernel::CGaussianKernel() : CShiftInvariantKernel()
@@ -88,21 +91,42 @@ void CGaussianKernel::set_width(float64_t w)
     m_log_width = std::log(w / 2.0) / 2.0;
 }

+auto CGaussianKernel::kernel_function(int32_t idx_a, int32_t idx_b) const
+{
+    // this could be written as Eigen::Matrix<float64_t, n_differentiable_params, 1>;
+    using EigenScalar = Eigen::Matrix<float64_t, 1, 1>;
+    Eigen::AutoDiffScalar<EigenScalar> eigen_log_width(m_log_width);
+    // resize(n_differentiable_params)
+    eigen_log_width.derivatives().resize(1);
+    // this could be written as
+    // eigen_log_width.derivatives() = EigenScalar::Unit(1,i);
+    // where i is the idx of the adjoint
+    eigen_log_width.derivatives() = EigenScalar::Unit(1,0);
+    auto el = CShiftInvariantKernel::distance(idx_a, idx_b);
+    return exp(-el / (exp(eigen_log_width * 2.0) * 2.0));
+}
+
 SGMatrix<float64_t> CGaussianKernel::get_parameter_gradient(const TParameter* param, index_t index)
 {
     using std::exp;

     require(lhs, "Left hand side features must be set!");
-    require(rhs, "Rightt hand side features must be set!");
+    require(rhs, "Right hand side features must be set!");

     if (!strcmp(param->m_name, "log_width"))
     {
         SGMatrix<float64_t> derivative=SGMatrix<float64_t>(num_lhs, num_rhs);

         for (int k=0; k<num_rhs; k++)
         {
             #pragma omp parallel for
             for (int j=0; j<num_lhs; j++)
             {
-                float64_t element=distance(j, k);
-                derivative(j, k) = std::exp(-element) * element * 2.0;
+                // this could be written as Eigen::Matrix<float64_t, n_differentiable_params, 1>;
+                using EigenScalar = Eigen::Matrix<float64_t, 1, 1>;
+                Eigen::AutoDiffScalar<EigenScalar> kernel = kernel_function(j, k);
+                // 0 is the index of the width parameter
+                derivative(j, k) = kernel.derivatives()(0);
             }
         }
         return derivative;

Review comment (on the new derivative(j, k) line): this seems pretty automatable to me (at least say for scalar valued kernels with scalar parameters)
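A standalone sketch of the mechanism used above, assuming only Eigen with its unsupported AutoDiff module (the numeric test values are arbitrary and purely illustrative). It mirrors kernel_function() outside of shogun and checks the automatic derivative against the closed-form gradient the previous loop computed, exp(-d) * d * 2, which holds when d is the squared distance already divided by the kernel width (that is how compute() used distance() before this change).

```cpp
#include <Eigen/Core>
#include <unsupported/Eigen/AutoDiff>

#include <cmath>
#include <iostream>

int main()
{
    // One differentiable parameter, so the derivative vector is 1x1.
    using EigenScalar = Eigen::Matrix<double, 1, 1>;

    const double sq_dist = 1.7;    // ||x - y||^2, an arbitrary test value
    const double log_width = 0.3;  // plays the role of m_log_width

    // Seed the adjoint: d(log_width)/d(log_width) = 1 at index 0.
    Eigen::AutoDiffScalar<EigenScalar> eigen_log_width(log_width);
    eigen_log_width.derivatives() = EigenScalar::Unit(1, 0);

    // Same expression as kernel_function(): k = exp(-||x - y||^2 / w) with w = 2 * exp(2 * log_width).
    Eigen::AutoDiffScalar<EigenScalar> k =
        exp(-sq_dist / (exp(eigen_log_width * 2.0) * 2.0));

    // Closed-form gradient used by the previous implementation:
    // dk/d(log_width) = exp(-d) * d * 2 with d = ||x - y||^2 / w.
    const double w = 2.0 * std::exp(2.0 * log_width);
    const double d = sq_dist / w;
    const double analytic = std::exp(-d) * d * 2.0;

    std::cout << "value:    " << k.value() << "\n"
              << "autodiff: " << k.derivatives()(0) << "\n"
              << "analytic: " << analytic << "\n";  // autodiff and analytic should agree
    return 0;
}
```

Seeding derivatives() with Unit(1, 0) before evaluating is what makes the single entry of k.derivatives() the partial derivative with respect to log_width.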
@@ -116,9 +140,11 @@ SGMatrix<float64_t> CGaussianKernel::get_parameter_gradient(const TParameter* pa

 float64_t CGaussianKernel::compute(int32_t idx_a, int32_t idx_b)
 {
-    float64_t result=distance(idx_a, idx_b);
-    return std::exp(-result);
-}
+    // this could be written as Eigen::Matrix<float64_t, n_differentiable_params, 1>;
+    using EigenScalar = Eigen::Matrix<float64_t, 1, 1>;
+    Eigen::AutoDiffScalar<EigenScalar> kernel = kernel_function(idx_a, idx_b);
+    return kernel.value();
+}

 void CGaussianKernel::load_serializable_post() noexcept(false)
 {
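The comments repeated above ("this could be written as Eigen::Matrix<float64_t, n_differentiable_params, 1>") hint at how the pattern scales to several hyperparameters: widen the derivative vector and seed each parameter with its own unit adjoint. Below is a hedged sketch under that assumption; the second log_scale parameter and the combined kernel expression are invented for illustration and are not part of this PR.

```cpp
#include <Eigen/Core>
#include <unsupported/Eigen/AutoDiff>

#include <iostream>

int main()
{
    constexpr int n_differentiable_params = 2;
    using EigenScalar = Eigen::Matrix<double, n_differentiable_params, 1>;
    using ADScalar = Eigen::AutoDiffScalar<EigenScalar>;

    const double sq_dist = 1.7;  // ||x - y||^2, an arbitrary test value

    // Each hyperparameter gets its own adjoint index via Unit(n, i).
    ADScalar log_width(0.3);
    ADScalar log_scale(-0.2);
    log_width.derivatives() = EigenScalar::Unit(n_differentiable_params, 0);
    log_scale.derivatives() = EigenScalar::Unit(n_differentiable_params, 1);

    // Invented two-parameter kernel:
    // k = exp(2 * log_scale) * exp(-||x - y||^2 / (2 * exp(2 * log_width)))
    ADScalar amplitude = exp(log_scale * 2.0);
    ADScalar gauss = exp(-sq_dist / (exp(log_width * 2.0) * 2.0));
    ADScalar k = amplitude * gauss;

    // One evaluation yields the value and both partial derivatives.
    std::cout << "k               = " << k.value() << "\n"
              << "dk/d(log_width) = " << k.derivatives()(0) << "\n"
              << "dk/d(log_scale) = " << k.derivatives()(1) << "\n";
    return 0;
}
```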
shogun/kernel/GaussianKernel.h

@@ -123,6 +123,15 @@ class CGaussianKernel: public CShiftInvariantKernel
         return std::exp(m_log_width * 2.0) * 2.0;
     }

+#ifndef SWIG
+    /**
+     * Returns a lazily evaluated Eigen expression template
+     * that tracks the gradient of differentiable hyperparameters
+     *
+     * @return expression template of kernel function
+     */
+    auto kernel_function(int32_t idx_a, int32_t idx_b) const;
+#endif
     /** return derivative with respect to specified parameter
      *
      * @param param the parameter

Review comment (on the "lazily evaluated" wording): If it is already evaluated, then it won't be lazily evaluated (at least not from the point of view of deferring evaluation until after this method has been executed). What about dropping the "lazily evaluated" part, or refactoring it to "to be lazily evaluated" if you really want to keep that part?

Reply: yes, good point, i'll change that
Review comment: So I guess a next step could be to start thinking about getting rid of this explicit code, and rather automatically offering this derivative through registering something in the ctors.

Reply: I think for that we should maybe have a base class for classes that have parameters we can take the derivative w.r.t. This class registers the gradient parameters in some vector, and then we can get the index from there. Basically, when we do watch_param(...) this would add the variable to such a vector if it has the GRADIENT flag.
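A purely hypothetical sketch of the registration idea discussed above; none of these names (HasGradientParams, ParamFlag, this watch_param signature) are shogun APIs. It only illustrates how parameters registered with a GRADIENT flag could provide both n_differentiable_params and the adjoint index that kernel_function() currently hard-codes as 0.

```cpp
#include <cstddef>
#include <stdexcept>
#include <string>
#include <vector>

// Flag marking a registered parameter as differentiable.
enum class ParamFlag { NONE, GRADIENT };

class HasGradientParams
{
public:
    // A watch_param(...)-style registration hook, called from a kernel's ctor.
    void watch_param(const std::string& name, double* value, ParamFlag flag)
    {
        if (flag == ParamFlag::GRADIENT)
            m_gradient_params.push_back({name, value});
    }

    // Size of the derivative vector handed to the autodiff scalar
    // (what the comments above call n_differentiable_params).
    std::size_t n_differentiable_params() const
    {
        return m_gradient_params.size();
    }

    // Adjoint index of a parameter, i.e. which entry of derivatives() to seed and read.
    std::size_t gradient_index(const std::string& name) const
    {
        for (std::size_t i = 0; i < m_gradient_params.size(); ++i)
            if (m_gradient_params[i].name == name)
                return i;
        throw std::invalid_argument("unknown gradient parameter: " + name);
    }

private:
    struct Entry
    {
        std::string name;
        double* value;
    };
    std::vector<Entry> m_gradient_params;
};

int main()
{
    double log_width = 0.3;
    HasGradientParams kernel;
    kernel.watch_param("log_width", &log_width, ParamFlag::GRADIENT);
    // A kernel_function() built on top of this could size its derivative vector with
    // n_differentiable_params() and seed Unit(n, gradient_index("log_width")).
    return 0;
}
```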