Context Navigation

source: src/FunctionApproximation/FunctionApproximation.cpp@ 90e540

Visit:

ForceAnnealing_with_BondGraph_continued

Last change on this file since 90e540 was 6d7c73, checked in by Frederik Heber <frederik.heber@…>, 8 years ago
FIX: unnecessary output iterator present in FunctionApproximation::evaluate().
Property mode set to `100644`
File size: 14.0 KB

Rev	Line
[66cfc7]	1	/*
	2	* Project: MoleCuilder
	3	* Description: creates and alters molecular systems
	4	* Copyright (C) 2012 University of Bonn. All rights reserved.
	5	* Please see the COPYING file or "Copyright notice" in builder.cpp for details.
	6	*
	7	*
	8	* This file is part of MoleCuilder.
	9	*
	10	* MoleCuilder is free software: you can redistribute it and/or modify
	11	* it under the terms of the GNU General Public License as published by
	12	* the Free Software Foundation, either version 2 of the License, or
	13	* (at your option) any later version.
	14	*
	15	* MoleCuilder is distributed in the hope that it will be useful,
	16	* but WITHOUT ANY WARRANTY; without even the implied warranty of
	17	* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
	18	* GNU General Public License for more details.
	19	*
	20	* You should have received a copy of the GNU General Public License
	21	* along with MoleCuilder. If not, see <http://www.gnu.org/licenses/>.
	22	*/
	23
	24	/*
	25	* FunctionApproximation.cpp
	26	*
	27	* Created on: 02.10.2012
	28	* Author: heber
	29	*/
	30
	31	// include config.h
	32	#ifdef HAVE_CONFIG_H
	33	#include <config.h>
	34	#endif
	35
[9eb71b3]	36	//#include "CodePatterns/MemDebug.hpp"
[66cfc7]	37
	38	#include "FunctionApproximation.hpp"
	39
	40	#include <algorithm>
	41	#include <boost/bind.hpp>
	42	#include <boost/function.hpp>
	43	#include <iostream>
	44	#include <iterator>
	45	#include <numeric>
	46	#include <sstream>
	47
	48	#include <levmar.h>
	49
	50	#include "CodePatterns/Assert.hpp"
	51	#include "CodePatterns/Log.hpp"
	52
	53	#include "FunctionApproximation/FunctionModel.hpp"
[69ab84]	54	#include "FunctionApproximation/TrainingData.hpp"
	55
	56	FunctionApproximation::FunctionApproximation(
	57	const TrainingData &_data,
[b8f2ea]	58	FunctionModel &_model,
[b40690]	59	const double _precision,
	60	const unsigned int _maxiterations) :
[69ab84]	61	input_dimension(_data.getTrainingInputs().size()),
	62	output_dimension(_data.getTrainingOutputs().size()),
[b8f2ea]	63	precision(_precision),
[b40690]	64	maxiterations(_maxiterations),
[69ab84]	65	input_data(_data.getTrainingInputs()),
	66	output_data(_data.getTrainingOutputs()),
	67	model(_model)
	68	{}
[66cfc7]	69
[e1fe7e]	70	void FunctionApproximation::setTrainingData(const filtered_inputs_t &input, const outputs_t &output)
[66cfc7]	71	{
	72	ASSERT( input.size() == output.size(),
	73	"FunctionApproximation::setTrainingData() - the number of input and output tuples differ: "+toString(input.size())+"!="
	74	+toString(output.size())+".");
	75	if (input.size() != 0) {
	76	ASSERT( input[0].size() == input_dimension,
	77	"FunctionApproximation::setTrainingData() - the dimension of the input tuples and input dimension differ: "+toString(input[0].size())+"!="
	78	+toString(input_dimension)+".");
	79	input_data = input;
	80	ASSERT( output[0].size() == output_dimension,
	81	"FunctionApproximation::setTrainingData() - the dimension of the output tuples and output dimension differ: "+toString(output[0].size())+"!="
	82	+toString(output_dimension)+".");
	83	output_data = output;
	84	} else {
	85	ELOG(2, "Given vectors of training data are empty, clearing internal vectors accordingly.");
	86	input_data.clear();
	87	output_data.clear();
	88	}
	89	}
	90
	91	void FunctionApproximation::setModelFunction(FunctionModel &_model)
	92	{
	93	model= _model;
	94	}
	95
	96	/** Callback to circumvent boost::bind, boost::function and function pointer problem.
	97	*
	98	* See here (second answer!) to the nature of the problem:
	99	* http://stackoverflow.com/questions/282372/demote-boostfunction-to-a-plain-function-pointer
	100	*
	101	* We cannot use a boost::bind bounded boost::function as a function pointer.
	102	* boost::function::target() will just return NULL because the signature does not
	103	* match. We have to use a C-style callback function and our luck is that
	104	* the levmar signature provides for a void* additional data pointer which we
	105	* can cast back to our FunctionApproximation class, as we need access to the
	106	* data contained, e.g. the FunctionModel reference FunctionApproximation::model.
	107	*
	108	*/
	109	void FunctionApproximation::LevMarCallback(double p, double x, int m, int n, void *data)
	110	{
	111	FunctionApproximation approximator = static_cast<FunctionApproximation >(data);
	112	ASSERT( approximator != NULL,
	113	"LevMarCallback() - received data does not represent a FunctionApproximation object.");
	114	boost::function<void(double,double,int,int,void*)> function =
	115	boost::bind(&FunctionApproximation::evaluate, approximator, _1, _2, _3, _4, _5);
	116	function(p,x,m,n,data);
	117	}
	118
[5b5724]	119	void FunctionApproximation::LevMarDerivativeCallback(double p, double x, int m, int n, void *data)
	120	{
	121	FunctionApproximation approximator = static_cast<FunctionApproximation >(data);
	122	ASSERT( approximator != NULL,
	123	"LevMarDerivativeCallback() - received data does not represent a FunctionApproximation object.");
	124	boost::function<void(double,double,int,int,void*)> function =
	125	boost::bind(&FunctionApproximation::evaluateDerivative, approximator, _1, _2, _3, _4, _5);
	126	function(p,x,m,n,data);
	127	}
	128
[63b9f7]	129	void FunctionApproximation::prepareParameters(double *&p, int &m) const
[66cfc7]	130	{
	131	m = model.getParameterDimension();
	132	const FunctionModel::parameters_t params = model.getParameters();
[c62f96]	133	{
	134	p = new double[m];
	135	size_t index = 0;
[6d7c73]	136	// cannot use std::copy here because of additional dereference
[c62f96]	137	for(FunctionModel::parameters_t::const_iterator paramiter = params.begin();
	138	paramiter != params.end();
	139	++paramiter, ++index) {
	140	p[index] = *paramiter;
	141	}
	142	}
[63b9f7]	143	}
	144
	145	void FunctionApproximation::prepareOutput(double *&x, int &n) const
	146	{
	147	n = output_data.size();
[c62f96]	148	{
	149	x = new double[n];
	150	size_t index = 0;
[6d7c73]	151	// cannot use std::copy here because of additional dereference
[c62f96]	152	for(outputs_t::const_iterator outiter = output_data.begin();
	153	outiter != output_data.end();
	154	++outiter, ++index) {
	155	x[index] = (*outiter)[0];
	156	}
[66cfc7]	157	}
[63b9f7]	158	}
	159
	160	void FunctionApproximation::operator()(const enum JacobianMode mode)
	161	{
	162	// let levmar optimize
	163	register int i, j;
	164	int ret;
	165	double *p;
	166	double *x;
	167	int m, n;
	168	double opts[LM_OPTS_SZ], info[LM_INFO_SZ];
	169
[b8f2ea]	170	// minim. options [\tau, \epsilon1, \epsilon2, \epsilon3]. Respectively the scale factor for initial \mu,
	171	// * stopping thresholds for \|\|J^T e\|\|_inf, \|\|Dp\|\|_2 and \|\|e\|\|_2.
	172	opts[0]=LM_INIT_MU; opts[1]=1e-15; opts[2]=1e-15; opts[3]=precision;
[63b9f7]	173	opts[4]= LM_DIFF_DELTA; // relevant only if the Jacobian is approximated using finite differences; specifies forward differencing
	174	//opts[4]=-LM_DIFF_DELTA; // specifies central differencing to approximate Jacobian; more accurate but more expensive to compute!
	175
	176	prepareParameters(p,m);
	177	prepareOutput(x,n);
[66cfc7]	178
	179	{
	180	double work, covar;
	181	work=(double )malloc((LM_DIF_WORKSZ(m, n)+mm)*sizeof(double));
	182	if(!work){
	183	ELOG(0, "FunctionApproximation::operator() - memory allocation request failed.");
	184	return;
	185	}
	186	covar=work+LM_DIF_WORKSZ(m, n);
	187
	188	// give this pointer as additional data to construct function pointer in
	189	// LevMarCallback and call
[d03292]	190	if (model.isBoxConstraint()) {
	191	FunctionModel::parameters_t lowerbound = model.getLowerBoxConstraints();
	192	FunctionModel::parameters_t upperbound = model.getUpperBoxConstraints();
	193	double *lb = new double[m];
	194	double *ub = new double[m];
[a2a2f7]	195	for (size_t i=0;i<(size_t)m;++i) {
[d03292]	196	lb[i] = lowerbound[i];
	197	ub[i] = upperbound[i];
	198	}
	199	if (mode == FiniteDifferences) {
	200	ret=dlevmar_bc_dif(
	201	&FunctionApproximation::LevMarCallback,
[b40690]	202	p, x, m, n, lb, ub, NULL, 100, opts, info, work, covar, this); // no Jacobian, caller allocates work memory, covariance estimated
[d03292]	203	} else if (mode == ParameterDerivative) {
	204	ret=dlevmar_bc_der(
	205	&FunctionApproximation::LevMarCallback,
	206	&FunctionApproximation::LevMarDerivativeCallback,
[b40690]	207	p, x, m, n, lb, ub, NULL, 100, opts, info, work, covar, this); // no Jacobian, caller allocates work memory, covariance estimated
[d03292]	208	} else {
	209	ASSERT(0, "FunctionApproximation::operator() - Unknown jacobian method chosen.");
	210	}
	211	delete[] lb;
	212	delete[] ub;
[76e63d]	213	} else {
	214	ASSERT(0, "FunctionApproximation::operator() - Unknown jacobian method chosen.");
[d03292]	215	if (mode == FiniteDifferences) {
	216	ret=dlevmar_dif(
	217	&FunctionApproximation::LevMarCallback,
	218	p, x, m, n, 1000, opts, info, work, covar, this); // no Jacobian, caller allocates work memory, covariance estimated
	219	} else if (mode == ParameterDerivative) {
	220	ret=dlevmar_der(
	221	&FunctionApproximation::LevMarCallback,
	222	&FunctionApproximation::LevMarDerivativeCallback,
	223	p, x, m, n, 1000, opts, info, work, covar, this); // no Jacobian, caller allocates work memory, covariance estimated
	224	} else {
	225	ASSERT(0, "FunctionApproximation::operator() - Unknown jacobian method chosen.");
	226	}
[76e63d]	227	}
[66cfc7]	228
	229	{
	230	std::stringstream covar_msg;
	231	covar_msg << "Covariance of the fit:\n";
	232	for(i=0; i<m; ++i){
	233	for(j=0; j<m; ++j)
	234	covar_msg << covar[i*m+j] << " ";
	235	covar_msg << std::endl;
	236	}
	237	covar_msg << std::endl;
	238	LOG(1, "INFO: " << covar_msg.str());
	239	}
	240
	241	free(work);
	242	}
	243
	244	{
	245	std::stringstream result_msg;
	246	result_msg << "Levenberg-Marquardt returned " << ret << " in " << info[5] << " iter, reason " << info[6] << "\nSolution: ";
	247	for(i=0; i<m; ++i)
	248	result_msg << p[i] << " ";
	249	result_msg << "\n\nMinimization info:\n";
	250	std::vector<std::string> infonames(LM_INFO_SZ);
	251	infonames[0] = std::string("\|\|e\|\|_2 at initial p");
	252	infonames[1] = std::string("\|\|e\|\|_2");
	253	infonames[2] = std::string("\|\|J^T e\|\|_inf");
	254	infonames[3] = std::string("\|\|Dp\|\|_2");
	255	infonames[4] = std::string("mu/max[J^T J]_ii");
	256	infonames[5] = std::string("# iterations");
	257	infonames[6] = std::string("reason for termination");
	258	infonames[7] = std::string(" # function evaluations");
	259	infonames[8] = std::string(" # Jacobian evaluations");
	260	infonames[9] = std::string(" # linear systems solved");
	261	for(i=0; i<LM_INFO_SZ; ++i)
	262	result_msg << infonames[i] << ": " << info[i] << " ";
	263	result_msg << std::endl;
	264	LOG(1, "INFO: " << result_msg.str());
	265	}
	266
[c62f96]	267	delete[] p;
	268	delete[] x;
[66cfc7]	269	}
	270
[371c8b]	271	bool FunctionApproximation::checkParameterDerivatives()
	272	{
	273	double *p;
	274	int m;
	275	const FunctionModel::parameters_t backupparams = model.getParameters();
	276	prepareParameters(p,m);
	277	int n = output_data.size();
	278	double *err = new double[n];
	279	dlevmar_chkjac(
	280	&FunctionApproximation::LevMarCallback,
	281	&FunctionApproximation::LevMarDerivativeCallback,
	282	p, m, n, this, err);
	283	int i;
	284	for(i=0; i<n; ++i)
	285	LOG(1, "INFO: gradient " << i << ", err " << err[i] << ".");
	286	bool status = true;
	287	for(i=0; i<n; ++i)
	288	status &= err[i] > 0.5;
	289
	290	if (!status) {
	291	int faulty;
	292	ELOG(0, "At least one of the parameter derivatives are incorrect.");
	293	for (faulty=1; faulty<=m; ++faulty) {
	294	LOG(1, "INFO: Trying with only the first " << faulty << " parameters...");
	295	model.setParameters(backupparams);
	296	dlevmar_chkjac(
	297	&FunctionApproximation::LevMarCallback,
	298	&FunctionApproximation::LevMarDerivativeCallback,
	299	p, faulty, n, this, err);
	300	bool status = true;
	301	for(i=0; i<n; ++i)
	302	status &= err[i] > 0.5;
	303	for(i=0; i<n; ++i)
	304	LOG(1, "INFO: gradient(" << faulty << ") " << i << ", err " << err[i] << ".");
	305	if (!status)
	306	break;
	307	}
	308	ELOG(0, "The faulty parameter derivative is with respect to the " << faulty << " parameter.");
	309	} else
	310	LOG(1, "INFO: parameter derivatives are ok.");
	311
	312	delete[] err;
	313	delete[] p;
	314	model.setParameters(backupparams);
	315
	316	return status;
	317	}
	318
/** Returns the squared difference of two values.
 *
 * \param res1 first value
 * \param res2 second value
 * \return (res1-res2)^2
 */
double SquaredDifference(const double res1, const double res2)
{
  const double difference = res1 - res2;
  return difference * difference;
}
	323
[5b5724]	324	void FunctionApproximation::prepareModel(double *p, int m)
[66cfc7]	325	{
[371c8b]	326	// ASSERT( (size_t)m == model.getParameterDimension(),
	327	// "FunctionApproximation::prepareModel() - LevMar expects "+toString(m)
	328	// +" parameters but the model function expects "+toString(model.getParameterDimension())+".");
[66cfc7]	329	FunctionModel::parameters_t params(m, 0.);
	330	std::copy(p, p+m, params.begin());
	331	model.setParameters(params);
[5b5724]	332	}
	333
	334	void FunctionApproximation::evaluate(double p, double x, int m, int n, void *data)
	335	{
	336	// first set parameters
	337	prepareModel(p,m);
[66cfc7]	338
	339	// then evaluate
[5b5724]	340	ASSERT( (size_t)n == output_data.size(),
	341	"FunctionApproximation::evaluate() - LevMar expects "+toString(n)
	342	+" outputs but we provide "+toString(output_data.size())+".");
[c62f96]	343	if (!output_data.empty()) {
[e1fe7e]	344	filtered_inputs_t::const_iterator initer = input_data.begin();
[6d7c73]	345	// outputs_t::const_iterator outiter = output_data.begin();
[66cfc7]	346	size_t index = 0;
[6d7c73]	347	for (; initer != input_data.end(); ++initer /* , ++outiter */) {
[66cfc7]	348	// result may be a vector, calculate L2 norm
	349	const FunctionModel::results_t functionvalue =
	350	model(*initer);
[5b5724]	351	x[index++] = functionvalue[0];
	352	// std::vector<double> differences(functionvalue.size(), 0.);
	353	// std::transform(
	354	// functionvalue.begin(), functionvalue.end(), outiter->begin(),
	355	// differences.begin(),
	356	// &SquaredDifference);
	357	// x[index] = std::accumulate(differences.begin(), differences.end(), 0.);
	358	}
	359	}
	360	}
	361
	362	void FunctionApproximation::evaluateDerivative(double p, double jac, int m, int n, void *data)
	363	{
	364	// first set parameters
	365	prepareModel(p,m);
	366
	367	// then evaluate
	368	ASSERT( (size_t)n == output_data.size(),
	369	"FunctionApproximation::evaluateDerivative() - LevMar expects "+toString(n)
	370	+" outputs but we provide "+toString(output_data.size())+".");
	371	if (!output_data.empty()) {
[e1fe7e]	372	filtered_inputs_t::const_iterator initer = input_data.begin();
[6d7c73]	373	// outputs_t::const_iterator outiter = output_data.begin();
[5b5724]	374	size_t index = 0;
[6d7c73]	375	for (; initer != input_data.end(); ++initer /, ++outiter /) {
[5b5724]	376	// result may be a vector, calculate L2 norm
	377	for (int paramindex = 0; paramindex < m; ++paramindex) {
	378	const FunctionModel::results_t functionvalue =
	379	model.parameter_derivative(*initer, paramindex);
	380	jac[index++] = functionvalue[0];
	381	}
	382	// std::vector<double> differences(functionvalue.size(), 0.);
	383	// std::transform(
	384	// functionvalue.begin(), functionvalue.end(), outiter->begin(),
	385	// differences.begin(),
	386	// &SquaredDifference);
	387	// x[index] = std::accumulate(differences.begin(), differences.end(), 0.);
[66cfc7]	388	}
	389	}
	390	}

Note: See TracBrowser for help on using the repository browser.

Download in other formats: