gradient descent (with fixed nr. of iterations, choosing optimal step size)

parent 299fcf1e04
commit 726858145a
@@ -363,7 +363,7 @@ void GaussianFactor::addGradientContribution(const VectorConfig& x, VectorConfig
   // calculate the value of the factor
   Vector e = -b_;
   string j; Matrix Aj;
-  FOREACH_PAIR(j, Aj, As_) e += Vector(Aj * x[j]);
+  FOREACH_PAIR(j, Aj, As_) e += Aj * x[j];
 
   // transpose
   Vector et = trans(e);
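Note on the hunk above: the visible body of addGradientContribution assembles the error e = A*x - b for this factor, and the change simply drops a redundant Vector() conversion around Aj * x[j]. For reference, a standalone sketch of the per-block formula such a routine accumulates, with illustrative types only (not the GTSAM API; the real code may additionally weight by the sigmas):

// Sketch: the gradient of 0.5*|A*x - b|^2 with respect to block x_j is Aj^T * e,
// where e = sum_j Aj*x_j - b is exactly the error computed in the hunk above.
#include <vector>

typedef std::vector<double> Vec;
typedef std::vector<Vec> Mat;   // Mat[i] is row i of the block Aj

// Accumulate one factor's contribution g_j += Aj^T * e into the gradient block gj.
void addBlockGradient(const Mat& Aj, const Vec& e, Vec& gj) {
  for (size_t i = 0; i < Aj.size(); ++i)      // rows of this factor
    for (size_t k = 0; k < gj.size(); ++k)    // columns of block j
      gj[k] += Aj[i][k] * e[i];
}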
@@ -376,6 +376,24 @@ void GaussianFactor::addGradientContribution(const VectorConfig& x, VectorConfig
   }
 }
 
+/* ************************************************************************* */
+// Creates a factor on step-size, given initial estimate and direction d, e.g.
+// Factor |A1*x+A2*y-b|/sigma -> |A1*(x0+alpha*dx)+A2*(y0+alpha*dy)-b|/sigma
+//     -> |(A1*dx+A2*dy)*alpha-(b-A1*x0-A2*y0)|/sigma
+/* ************************************************************************* */
+GaussianFactor::shared_ptr GaussianFactor::alphaFactor(const VectorConfig& x,
+    const VectorConfig& d) const {
+  size_t m = b_.size();
+  Vector A = zero(m); Vector b = b_;
+  string j; Matrix Aj;
+  FOREACH_PAIR(j, Aj, As_) {
+    A += Aj * d[j];
+    b -= Aj * x[j];
+  }
+  shared_ptr factor(new GaussianFactor("alpha", Matrix_(A), b, sigmas_));
+  return factor;
+}
+
 /* ************************************************************************* */
 namespace gtsam {
 
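The comment block above compresses the key algebra: substituting x = x0 + alpha*d into a factor turns it into a one-variable factor |A*alpha - b|/sigma with A = sum_j Aj*d_j and b = b_ - sum_j Aj*x_j, which is what the loop builds. For a single scalar unknown that weighted least-squares problem has a closed form, and eliminating the variable "alpha" later recovers it; a standalone sketch under that reading (illustrative only, not GTSAM code):

// alpha* = argmin_alpha sum_i (A_i*alpha - b_i)^2 / sigma_i^2
//        = (A^T W b) / (A^T W A),  with W = diag(1/sigma_i^2)
#include <vector>

double optimalAlpha(const std::vector<double>& A,        // stacked rows of A
                    const std::vector<double>& b,        // stacked right-hand sides
                    const std::vector<double>& sigmas) { // per-row standard deviations
  double num = 0.0, den = 0.0;
  for (size_t i = 0; i < A.size(); ++i) {
    double w = 1.0 / (sigmas[i] * sigmas[i]);
    num += A[i] * w * b[i];
    den += A[i] * w * A[i];
  }
  return num / den;  // assumes den > 0, i.e. the direction actually changes the error
}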
@@ -58,6 +58,13 @@ public:
     As_.insert(make_pair(key1, A1));
   }
 
+  /** Construct unary factor with vector of sigmas */
+  GaussianFactor(const std::string& key1, const Matrix& A1,
+      const Vector& b, const Vector& sigmas) :
+    b_(b), sigmas_(sigmas) {
+    As_.insert(make_pair(key1, A1));
+  }
+
   /** Construct binary factor */
   GaussianFactor(const std::string& key1, const Matrix& A1,
       const std::string& key2, const Matrix& A2,
@@ -207,6 +214,20 @@ public:
   boost::tuple<std::list<int>, std::list<int>, std::list<double> >
     sparse(const Ordering& ordering, const Dimensions& variables) const;
 
+  /**
+   * Add gradient contribution to gradient config g
+   * @param x: config at which to evaluate gradient
+   * @param g: I/O parameter, evolving gradient
+   */
+  void addGradientContribution(const VectorConfig& x, VectorConfig& g) const;
+
+  /**
+   * Create a GaussianFactor on one variable 'alpha' (step size), in direction d
+   * @param x: starting point for search
+   * @param d: search direction
+   */
+  shared_ptr alphaFactor(const VectorConfig& x, const VectorConfig& d) const;
+
   /* ************************************************************************* */
   // MUTABLE functions. FD: on the path to being eradicated
   /* ************************************************************************* */
@@ -243,13 +264,6 @@ public:
    */
   void append_factor(GaussianFactor::shared_ptr f, size_t m, size_t pos);
 
-  /**
-   * Add gradient contribution to gradient config g
-   * @param x: confif at which to evaluate gradient
-   * @param g: I/O parameter, evolving gradient
-   */
-  void addGradientContribution(const VectorConfig& x, VectorConfig& g) const;
-
 }; // GaussianFactor
 
 /* ************************************************************************* */
@@ -209,3 +209,33 @@ VectorConfig GaussianFactorGraph::gradient(const VectorConfig& x) const {
 }
 
 /* ************************************************************************* */
+VectorConfig GaussianFactorGraph::optimalUpdate(const VectorConfig& x,
+    const VectorConfig& d) const {
+
+  // create a new graph on step-size
+  GaussianFactorGraph alphaGraph;
+  BOOST_FOREACH(sharedFactor factor, factors_) {
+    sharedFactor alphaFactor = factor->alphaFactor(x, d);
+    alphaGraph.push_back(alphaFactor);
+  }
+
+  // solve it for optimal step-size alpha
+  GaussianConditional::shared_ptr gc = alphaGraph.eliminateOne("alpha");
+  double alpha = gc->get_d()(0);
+
+  // return updated estimate by stepping in direction d
+  return x.exmap(d.scale(alpha));
+}
+
+/* ************************************************************************* */
+VectorConfig GaussianFactorGraph::gradientDescent(const VectorConfig& x0) const {
+  VectorConfig x = x0;
+  int K = 10 * x.size();
+  for (int k = 0; k < K; k++) {
+    VectorConfig g = gradient(x);
+    x = optimalUpdate(x, g);
+  }
+  return x;
+}
+
+/* ************************************************************************* */
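gradientDescent above is steepest descent with an exact line search on the linear least-squares objective: the direction is the gradient, and optimalUpdate picks the minimizing step by eliminating the single-variable alpha graph. A self-contained numerical sketch of the same scheme on a tiny dense 2x2 system, using no GTSAM types (illustrative only):

#include <cstdio>
#include <vector>

typedef std::vector<double> Vec;

int main() {
  // Minimize 0.5*|A*x - b|^2 for a fixed 2x2 A; the exact solution is (0.5, 0.5).
  double A[2][2] = {{2.0, 0.0}, {1.0, 3.0}};
  Vec b(2), x(2, 0.0);
  b[0] = 1.0; b[1] = 2.0;

  for (int k = 0; k < 50; ++k) {
    // residual e = A*x - b and gradient g = A^T * e
    Vec e(2), g(2, 0.0), Ad(2, 0.0);
    for (int i = 0; i < 2; ++i) e[i] = A[i][0] * x[0] + A[i][1] * x[1] - b[i];
    for (int j = 0; j < 2; ++j) g[j] = A[0][j] * e[0] + A[1][j] * e[1];

    // exact line search along d = g: alpha = -(A*d)^T e / |A*d|^2
    for (int i = 0; i < 2; ++i) Ad[i] = A[i][0] * g[0] + A[i][1] * g[1];
    double num = Ad[0] * e[0] + Ad[1] * e[1];
    double den = Ad[0] * Ad[0] + Ad[1] * Ad[1];
    if (den == 0.0) break;                     // zero gradient: already at the minimum
    double alpha = -num / den;

    for (int j = 0; j < 2; ++j) x[j] += alpha * g[j];
  }
  std::printf("x = (%g, %g)\n", x[0], x[1]);   // approaches (0.5, 0.5)
  return 0;
}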
@@ -162,8 +162,24 @@ namespace gtsam {
 
   /**
    * Calculate Gradient of 0.5*|Ax-b| for a given config
+   * @param x: VectorConfig specifying where to calculate gradient
+   * @return gradient, as a VectorConfig as well
    */
   VectorConfig gradient(const VectorConfig& x) const;
+
+  /**
+   * Take an optimal step in direction d by calculating optimal step-size
+   * @param x: starting point for search
+   * @param d: search direction
+   */
+  VectorConfig optimalUpdate(const VectorConfig& x0, const VectorConfig& d) const;
+
+  /**
+   * Find solution using gradient descent
+   * @param x0: VectorConfig specifying initial estimate
+   * @return solution
+   */
+  VectorConfig gradientDescent(const VectorConfig& x0) const;
 };
 
 }
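For orientation, the new graph-level calls are meant to be driven much as in the test added below; a hedged usage sketch, where the include path and the warm-start flow are assumptions and only gradient(), optimalUpdate() and gradientDescent() come from this change:

#include "GaussianFactorGraph.h"   // assumed include path

using namespace gtsam;

VectorConfig solveByGradientDescent(const GaussianFactorGraph& fg, const VectorConfig& x0) {
  // one explicit iteration, for illustration: direction = gradient, step via optimalUpdate
  VectorConfig g  = fg.gradient(x0);
  VectorConfig x1 = fg.optimalUpdate(x0, g);

  // the built-in loop repeats the same update for 10 * (number of variables) iterations
  return fg.gradientDescent(x1);
}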
@@ -565,6 +565,22 @@ TEST( GaussianFactorGraph, gradient )
   CHECK(assert_equal(zero,actual2));
 }
 
+/* ************************************************************************* */
+TEST( GaussianFactorGraph, gradientDescent )
+{
+  // Expected solution
+  Ordering ord;
+  ord += "x2","l1","x1";
+  GaussianFactorGraph fg = createGaussianFactorGraph();
+  VectorConfig expected = fg.optimize(ord); // destructive
+
+  // Do gradient descent
+  GaussianFactorGraph fg2 = createGaussianFactorGraph();
+  VectorConfig zero = createZeroDelta();
+  VectorConfig actual = fg2.gradientDescent(zero);
+  CHECK(assert_equal(expected,actual,1e-2));
+}
+
 /* ************************************************************************* */
 // Tests ported from ConstrainedGaussianFactorGraph
 /* ************************************************************************* */