src/Eigen2Support/LeastSquares.h

// This file is part of Eigen, a lightweight C++ template library
// for linear algebra.
//
// Copyright (C) 2006-2009 Benoit Jacob <jacob.benoit.1@gmail.com>
//
// This Source Code Form is subject to the terms of the Mozilla
// Public License v. 2.0. If a copy of the MPL was not distributed
// with this file, You can obtain one at http://mozilla.org/MPL/2.0/.
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath#ifndef EIGEN2_LEASTSQUARES_H
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath#define EIGEN2_LEASTSQUARES_H
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamathnamespace Eigen {
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath/** \ingroup LeastSquares_Module
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  *
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * \leastsquares_module
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  *
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * For a set of points, this function tries to express
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * one of the coords as a linear (affine) function of the other coords.
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  *
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * This is best explained by an example. This function works in full
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * generality, for points in a space of arbitrary dimension, and also over
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * the complex numbers, but for this example we will work in dimension 3
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * over the real numbers (doubles).
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  *
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * So let us work with the following set of 5 points given by their
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * \f$(x,y,z)\f$ coordinates:
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * @code
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath    Vector3d points[5];
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath    points[0] = Vector3d( 3.02, 6.89, -4.32 );
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath    points[1] = Vector3d( 2.01, 5.39, -3.79 );
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath    points[2] = Vector3d( 2.41, 6.01, -4.01 );
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath    points[3] = Vector3d( 2.09, 5.55, -3.86 );
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath    points[4] = Vector3d( 2.58, 6.32, -4.10 );
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * @endcode
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * Suppose that we want to express the second coordinate (\f$y\f$) as a linear
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * expression in \f$x\f$ and \f$z\f$, that is,
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * \f[ y=ax+bz+c \f]
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * for some constants \f$a,b,c\f$. Thus, we want to find the best possible
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * constants \f$a,b,c\f$ so that the plane of equation \f$y=ax+bz+c\f$ fits
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * best the five above points. To do that, call this function as follows:
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * @code
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath    Vector3d coeffs; // will store the coefficients a, b, c
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath    linearRegression(
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath      5,
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath      &points,
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath      &coeffs,
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath      1 // the coord to express as a function of
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath        // the other ones. 0 means x, 1 means y, 2 means z.
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath    );
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * @endcode
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * Now the vector \a coeffs is approximately
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * \f$( 0.495 ,  -1.927 ,  -2.906 )\f$.
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * Thus, we get \f$a=0.495, b = -1.927, c = -2.906\f$. Let us check for
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * instance how near points[0] is from the plane of equation \f$y=ax+bz+c\f$.
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * Looking at the coords of points[0], we see that:
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * \f[ax+bz+c = 0.495 * 3.02 + (-1.927) * (-4.32) + (-2.906) = 6.91.\f]
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * On the other hand, we have \f$y=6.89\f$. We see that the values
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * \f$6.91\f$ and \f$6.89\f$
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * are near, so points[0] is very near the plane of equation \f$y=ax+bz+c\f$.
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  *
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * Let's now describe precisely the parameters:
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * @param numPoints the number of points
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * @param points the array of pointers to the points on which to perform the linear regression
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * @param result pointer to the vector in which to store the result.
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath                  This vector must be of the same type and size as the
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath                  data points. The meaning of its coords is as follows.
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath                  For brevity, let \f$n=Size\f$,
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath                  \f$r_i=result[i]\f$,
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath                  and \f$f=funcOfOthers\f$. Denote by
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath                  \f$x_0,\ldots,x_{n-1}\f$
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath                  the n coordinates in the n-dimensional space.
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath                  Then the resulting equation is:
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath                  \f[ x_f = r_0 x_0 + \cdots + r_{f-1}x_{f-1}
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath                   + r_{f+1}x_{f+1} + \cdots + r_{n-1}x_{n-1} + r_n. \f]
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * @param funcOfOthers Determines which coord to express as a function of the
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath                        others. Coords are numbered starting from 0, so that a
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath                        value of 0 means \f$x\f$, 1 means \f$y\f$,
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath                        2 means \f$z\f$, ...
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  *
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * \sa fitHyperplane()
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  */
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamathtemplate<typename VectorType>
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamathvoid linearRegression(int numPoints,
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath                      VectorType **points,
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath                      VectorType *result,
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath                      int funcOfOthers )
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath{
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  typedef typename VectorType::Scalar Scalar;
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  typedef Hyperplane<Scalar, VectorType::SizeAtCompileTime> HyperplaneType;
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  const int size = points[0]->size();
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  result->resize(size);
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  HyperplaneType h(size);
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  fitHyperplane(numPoints, points, &h);
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  for(int i = 0; i < funcOfOthers; i++)
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath    result->coeffRef(i) = - h.coeffs()[i] / h.coeffs()[funcOfOthers];
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  for(int i = funcOfOthers; i < size; i++)
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath    result->coeffRef(i) = - h.coeffs()[i+1] / h.coeffs()[funcOfOthers];
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath}
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath/** \ingroup LeastSquares_Module
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  *
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * \leastsquares_module
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  *
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * This function is quite similar to linearRegression(), so we refer to the
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * documentation of this function and only list here the differences.
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  *
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * The main difference from linearRegression() is that this function doesn't
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * take a \a funcOfOthers argument. Instead, it finds a general equation
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * of the form
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * \f[ r_0 x_0 + \cdots + r_{n-1}x_{n-1} + r_n = 0, \f]
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * where \f$n=Size\f$, \f$r_i=retCoefficients[i]\f$, and we denote by
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * \f$x_0,\ldots,x_{n-1}\f$ the n coordinates in the n-dimensional space.
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  *
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * Thus, the vector \a retCoefficients has size \f$n+1\f$, which is another
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * difference from linearRegression().
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  *
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * In practice, this function performs an hyper-plane fit in a total least square sense
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * via the following steps:
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  *  1 - center the data to the mean
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  *  2 - compute the covariance matrix
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  *  3 - pick the eigenvector corresponding to the smallest eigenvalue of the covariance matrix
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * The ratio of the smallest eigenvalue and the second one gives us a hint about the relevance
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * of the solution. This value is optionally returned in \a soundness.
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  *
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  * \sa linearRegression()
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  */
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamathtemplate<typename VectorType, typename HyperplaneType>
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamathvoid fitHyperplane(int numPoints,
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath                   VectorType **points,
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath                   HyperplaneType *result,
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath                   typename NumTraits<typename VectorType::Scalar>::Real* soundness = 0)
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath{
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  typedef typename VectorType::Scalar Scalar;
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  typedef Matrix<Scalar,VectorType::SizeAtCompileTime,VectorType::SizeAtCompileTime> CovMatrixType;
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  EIGEN_STATIC_ASSERT_VECTOR_ONLY(VectorType)
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  ei_assert(numPoints >= 1);
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  int size = points[0]->size();
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  ei_assert(size+1 == result->coeffs().size());
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  // compute the mean of the data
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  VectorType mean = VectorType::Zero(size);
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  for(int i = 0; i < numPoints; ++i)
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath    mean += *(points[i]);
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  mean /= numPoints;
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  // compute the covariance matrix
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  CovMatrixType covMat = CovMatrixType::Zero(size, size);
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  VectorType remean = VectorType::Zero(size);
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  for(int i = 0; i < numPoints; ++i)
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  {
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath    VectorType diff = (*(points[i]) - mean).conjugate();
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath    covMat += diff * diff.adjoint();
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  }
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  // now we just have to pick the eigen vector with smallest eigen value
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  SelfAdjointEigenSolver<CovMatrixType> eig(covMat);
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  result->normal() = eig.eigenvectors().col(0);
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  if (soundness)
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath    *soundness = eig.eigenvalues().coeff(0)/eig.eigenvalues().coeff(1);
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  // let's compute the constant coefficient such that the
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  // plane pass trough the mean point:
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath  result->offset() = - (result->normal().cwise()* mean).sum();
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath}
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath} // end namespace Eigen
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath
c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath#endif // EIGEN2_LEASTSQUARES_H