source: src/LevMartester.cpp@ d76ce74

Action_Thermostats Add_AtomRandomPerturbation Add_FitFragmentPartialChargesAction Add_RotateAroundBondAction Add_SelectAtomByNameAction Added_ParseSaveFragmentResults AddingActions_SaveParseParticleParameters Adding_Graph_to_ChangeBondActions Adding_MD_integration_tests Adding_ParticleName_to_Atom Adding_StructOpt_integration_tests AtomFragments Automaking_mpqc_open AutomationFragmentation_failures Candidate_v1.5.4 Candidate_v1.6.0 Candidate_v1.6.1 Candidate_v1.7.0 ChangeBugEmailaddress ChangingTestPorts ChemicalSpaceEvaluator CombiningParticlePotentialParsing Combining_Subpackages Debian_Package_split Debian_package_split_molecuildergui_only Disabling_MemDebug Docu_Python_wait EmpiricalPotential_contain_HomologyGraph EmpiricalPotential_contain_HomologyGraph_documentation Enable_parallel_make_install Enhance_userguide Enhanced_StructuralOptimization Enhanced_StructuralOptimization_continued Example_ManyWaysToTranslateAtom Exclude_Hydrogens_annealWithBondGraph FitPartialCharges_GlobalError Fix_BoundInBox_CenterInBox_MoleculeActions Fix_ChargeSampling_PBC Fix_ChronosMutex Fix_FitPartialCharges Fix_FitPotential_needs_atomicnumbers Fix_ForceAnnealing Fix_IndependentFragmentGrids Fix_ParseParticles Fix_ParseParticles_split_forward_backward_Actions Fix_PopActions Fix_QtFragmentList_sorted_selection Fix_Restrictedkeyset_FragmentMolecule Fix_StatusMsg Fix_StepWorldTime_single_argument Fix_Verbose_Codepatterns Fix_fitting_potentials Fixes ForceAnnealing_goodresults ForceAnnealing_oldresults ForceAnnealing_tocheck ForceAnnealing_with_BondGraph ForceAnnealing_with_BondGraph_continued ForceAnnealing_with_BondGraph_continued_betteresults ForceAnnealing_with_BondGraph_contraction-expansion FragmentAction_writes_AtomFragments FragmentMolecule_checks_bonddegrees GeometryObjects Gui_Fixes Gui_displays_atomic_force_velocity ImplicitCharges IndependentFragmentGrids IndependentFragmentGrids_IndividualZeroInstances IndependentFragmentGrids_IntegrationTest 
IndependentFragmentGrids_Sole_NN_Calculation JobMarket_RobustOnKillsSegFaults JobMarket_StableWorkerPool JobMarket_unresolvable_hostname_fix MoreRobust_FragmentAutomation ODR_violation_mpqc_open PartialCharges_OrthogonalSummation PdbParser_setsAtomName PythonUI_with_named_parameters QtGui_reactivate_TimeChanged_changes Recreated_GuiChecks Rewrite_FitPartialCharges RotateToPrincipalAxisSystem_UndoRedo SaturateAtoms_findBestMatching SaturateAtoms_singleDegree StoppableMakroAction Subpackage_CodePatterns Subpackage_JobMarket Subpackage_LinearAlgebra Subpackage_levmar Subpackage_mpqc_open Subpackage_vmg Switchable_LogView ThirdParty_MPQC_rebuilt_buildsystem TrajectoryDependenant_MaxOrder TremoloParser_IncreasedPrecision TremoloParser_MultipleTimesteps TremoloParser_setsAtomName Ubuntu_1604_changes stable
Last change on this file since d76ce74 was 05f437, checked in by Frederik Heber <heber@…>, 13 years ago

LevMartester now contains three generalized fits to Angle, Morse, and Saturation potential.

  • Property mode set to 100644
File size: 13.6 KB
Line 
1/*
2 * Project: MoleCuilder
3 * Description: creates and alters molecular systems
4 * Copyright (C) 2012 University of Bonn. All rights reserved.
5 * Please see the COPYING file or "Copyright notice" in builder.cpp for details.
6 *
7 *
8 * This file is part of MoleCuilder.
9 *
10 * MoleCuilder is free software: you can redistribute it and/or modify
11 * it under the terms of the GNU General Public License as published by
12 * the Free Software Foundation, either version 2 of the License, or
13 * (at your option) any later version.
14 *
15 * MoleCuilder is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 * GNU General Public License for more details.
19 *
20 * You should have received a copy of the GNU General Public License
21 * along with MoleCuilder. If not, see <http://www.gnu.org/licenses/>.
22 */
23
24/*
25 * LevMartester.cpp
26 *
27 * Created on: Sep 27, 2012
28 * Author: heber
29 */
30
31
32// include config.h
33#ifdef HAVE_CONFIG_H
34#include <config.h>
35#endif
36
37#include <boost/archive/text_iarchive.hpp>
38
39#include "CodePatterns/MemDebug.hpp"
40
41#include <boost/assign.hpp>
42#include <boost/assign/list_of.hpp>
43#include <boost/bind.hpp>
44#include <boost/filesystem.hpp>
45#include <boost/function.hpp>
46#include <boost/program_options.hpp>
47
#include <cstdlib>
#include <ctime>
#include <exception>
#include <fstream>
#include <iostream>
#include <iterator>
#include <list>
#include <map>
#include <utility>
#include <vector>
55
56#include <levmar.h>
57
58#include "CodePatterns/Assert.hpp"
59#include "CodePatterns/Log.hpp"
60
61#include "LinearAlgebra/Vector.hpp"
62
63#include "Fragmentation/Homology/HomologyContainer.hpp"
64#include "Fragmentation/SetValues/Fragment.hpp"
65#include "FunctionApproximation/Extractors.hpp"
66#include "FunctionApproximation/FunctionApproximation.hpp"
67#include "FunctionApproximation/FunctionModel.hpp"
68#include "FunctionApproximation/TrainingData.hpp"
69#include "FunctionApproximation/writeDistanceEnergyTable.hpp"
70#include "Helpers/defs.hpp"
71#include "Potentials/Specifics/PairPotential_Morse.hpp"
72#include "Potentials/Specifics/PairPotential_Angle.hpp"
73#include "Potentials/Specifics/SaturationPotential.hpp"
74#include "types.hpp"
75
76namespace po = boost::program_options;
77
78using namespace boost::assign;
79
80HomologyGraph getFirstGraphwithTimesSpecificElement(
81 const HomologyContainer &homologies,
82 const size_t _number,
83 const size_t _times)
84{
85 for (HomologyContainer::container_t::const_iterator iter =
86 homologies.begin(); iter != homologies.end(); ++iter) {
87 if (iter->first.hasTimesAtomicNumber(_number,_times))
88 return iter->first;
89 }
90 return HomologyGraph();
91}
92
93/** This function returns the elements of the sum over index "k" for an
94 * argument containing indices "i" and "j"
95 * @param inputs vector of all configuration (containing each a vector of all arguments)
96 * @param arg argument containing indices "i" and "j"
97 * @param cutoff cutoff criterion for sum over k
98 * @return vector of argument pairs (a vector) of ik and jk for at least all k
99 * within distance of \a cutoff to i
100 */
101std::vector<FunctionModel::arguments_t>
102getTripleFromArgument(const FunctionApproximation::inputs_t &inputs, const argument_t &arg, const double cutoff)
103{
104 typedef std::list<argument_t> arg_list_t;
105 typedef std::map<size_t, arg_list_t > k_args_map_t;
106 k_args_map_t tempresult;
107 ASSERT( inputs.size() > arg.globalid,
108 "getTripleFromArgument() - globalid "+toString(arg.globalid)
109 +" is greater than all inputs "+toString(inputs.size())+".");
110 const FunctionModel::arguments_t &listofargs = inputs[arg.globalid];
111 for (FunctionModel::arguments_t::const_iterator argiter = listofargs.begin();
112 argiter != listofargs.end();
113 ++argiter) {
114 // first index must be either i or j but second index not
115 if (((argiter->indices.first == arg.indices.first)
116 || (argiter->indices.first == arg.indices.second))
117 && ((argiter->indices.second != arg.indices.first)
118 && (argiter->indices.second != arg.indices.second))) {
119 // we need arguments ik and jk
120 std::pair< k_args_map_t::iterator, bool> inserter =
121 tempresult.insert( std::make_pair( argiter->indices.second, arg_list_t(1,*argiter)));
122 if (!inserter.second) {
123 // is present one ik or jk, if ik insert jk at back
124 if (inserter.first->second.begin()->indices.first == arg.indices.first)
125 inserter.first->second.push_back(*argiter);
126 else // if jk, insert ik at front
127 inserter.first->second.push_front(*argiter);
128 }
129 }
130// // or second index must be either i or j but first index not
131// else if (((argiter->indices.first != arg.indices.first)
132// && (argiter->indices.first != arg.indices.second))
133// && ((argiter->indices.second == arg.indices.first)
134// || (argiter->indices.second == arg.indices.second))) {
135// // we need arguments ki and kj
136// std::pair< k_args_map_t::iterator, bool> inserter =
137// tempresult.insert( std::make_pair( argiter->indices.first, arg_list_t(1,*argiter)));
138// if (!inserter.second) {
139// // is present one ki or kj, if ki insert kj at back
140// if (inserter.first->second.begin()->indices.second == arg.indices.first)
141// inserter.first->second.push_back(*argiter);
142// else // if kj, insert ki at front
143// inserter.first->second.push_front(*argiter);
144// }
145// }
146 }
147 // check that i,j are NOT contained
148 ASSERT( tempresult.count(arg.indices.first) == 0,
149 "getTripleFromArgument() - first index of argument present in k_args_map?");
150 ASSERT( tempresult.count(arg.indices.second) == 0,
151 "getTripleFromArgument() - first index of argument present in k_args_map?");
152
153 // convert
154 std::vector<FunctionModel::arguments_t> result;
155 for (k_args_map_t::const_iterator iter = tempresult.begin();
156 iter != tempresult.end();
157 ++iter) {
158 ASSERT( iter->second.size() == 2,
159 "getTripleFromArgument() - for index "+toString(iter->first)+" we did not find both ik and jk.");
160 result.push_back( FunctionModel::arguments_t(iter->second.begin(), iter->second.end()) );
161 }
162 return result;
163}
164
165int main(int argc, char **argv)
166{
167 std::cout << "Hello to the World from LevMar!" << std::endl;
168
169 // load homology file
170 po::options_description desc("Allowed options");
171 desc.add_options()
172 ("help", "produce help message")
173 ("homology-file", po::value< boost::filesystem::path >(), "homology file to parse")
174 ;
175
176 po::variables_map vm;
177 po::store(po::parse_command_line(argc, argv, desc), vm);
178 po::notify(vm);
179
180 if (vm.count("help")) {
181 std::cout << desc << "\n";
182 return 1;
183 }
184
185 boost::filesystem::path homology_file;
186 if (vm.count("homology-file")) {
187 homology_file = vm["homology-file"].as<boost::filesystem::path>();
188 LOG(1, "INFO: Parsing " << homology_file.string() << ".");
189 } else {
190 LOG(0, "homology-file level was not set.");
191 }
192 HomologyContainer homologies;
193 if (boost::filesystem::exists(homology_file)) {
194 std::ifstream returnstream(homology_file.string().c_str());
195 if (returnstream.good()) {
196 boost::archive::text_iarchive ia(returnstream);
197 ia >> homologies;
198 } else {
199 ELOG(2, "Failed to parse from " << homology_file.string() << ".");
200 }
201 returnstream.close();
202 } else {
203 ELOG(0, homology_file << " does not exist.");
204 }
205
206 // first we try to look into the HomologyContainer
207 LOG(1, "INFO: Listing all present homologies ...");
208 for (HomologyContainer::container_t::const_iterator iter =
209 homologies.begin(); iter != homologies.end(); ++iter) {
210 LOG(1, "INFO: graph " << iter->first << " has Fragment "
211 << iter->second.first << " and associated energy " << iter->second.second << ".");
212 }
213
214 /******************** Angle TRAINING ********************/
215 FunctionModel::parameters_t angleparams(PairPotential_Angle::MAXPARAMS, 0.);
216 {
217 // then we ought to pick the right HomologyGraph ...
218 const HomologyGraph graph = getFirstGraphwithTimesSpecificElement(homologies,8,1);
219 if (graph != HomologyGraph()) {
220 LOG(1, "First representative graph containing three saturated carbons is " << graph << ".");
221
222 // Afterwards we go through all of this type and gather the distance and the energy value
223 PairPotential_Angle::ParticleTypes_t types =
224 boost::assign::list_of<PairPotential_Angle::ParticleType_t>
225 (8)(1)(1)
226 ;
227 PairPotential_Angle angle(types);
228 Fragment::charges_t h2o;
229 h2o += 8,1,1;
230 TrainingData AngleData(angle.getFragmentSpecificExtractor(h2o));
231 AngleData(homologies.getHomologousGraphs(graph));
232 LOG(1, "INFO: I gathered the following training data: " << AngleData);
233 // NOTICE that distance are in bohrradi as they come from MPQC!
234
235 // now perform the function approximation by optimizing the model function
236 FunctionModel &model = angle;
237 FunctionApproximation approximator(AngleData, model);
238 if (model.isBoxConstraint() && approximator.checkParameterDerivatives()) {
239 // we set parameters here because we want to test with default ones
240 srand((unsigned)time(0)); // seed with current time
241 model.setParametersToRandomInitialValues(AngleData);
242 LOG(0, "INFO: Initial parameters are " << angle.getParameters() << ".");
243 approximator(FunctionApproximation::ParameterDerivative);
244 } else {
245 ELOG(0, "We require parameter derivatives for a box constraint minimization.");
246 return 1;
247 }
248
249 LOG(0, "RESULT: " << angle << ".");
250
251 angleparams = model.getParameters();
252 }
253 }
254
255 /******************** MORSE TRAINING ********************/
256 FunctionModel::parameters_t morseparams(PairPotential_Morse::MAXPARAMS, 0.);
257 {
258 // then we ought to pick the right HomologyGraph ...
259 const HomologyGraph graph = getFirstGraphwithTimesSpecificElement(homologies,8,1);
260 if (graph != HomologyGraph()) {
261 LOG(1, "First representative graph containing two saturated carbons is " << graph << ".");
262
263 // Afterwards we go through all of this type and gather the distance and the energy value
264 Fragment::charges_t h2o;
265 h2o += 8,1;
266 PairPotential_Morse::ParticleTypes_t types =
267 boost::assign::list_of<PairPotential_Morse::ParticleType_t>
268 (8)(1)
269 ;
270 PairPotential_Morse morse(types);
271 TrainingData MorseData(morse.getFragmentSpecificExtractor(h2o));
272 MorseData(homologies.getHomologousGraphs(graph));
273 LOG(1, "INFO: I gathered the following training data: " << MorseData);
274 // NOTICE that distance are in bohrradi as they come from MPQC!
275
276 // now perform the function approximation by optimizing the model function
277 FunctionModel &model = morse;
278 FunctionApproximation approximator(MorseData, model); // we only give CC distance, hence 1 input dim
279 if (model.isBoxConstraint() && approximator.checkParameterDerivatives()) {
280 // we set parameters here because we want to test with default ones
281 srand((unsigned)time(0)); // seed with current time
282 model.setParametersToRandomInitialValues(MorseData);
283 LOG(0, "INFO: Initial parameters are " << morse.getParameters() << ".");
284 approximator(FunctionApproximation::ParameterDerivative);
285 } else {
286 ELOG(0, "We require parameter derivatives for a box constraint minimization.");
287 return 1;
288 }
289
290 LOG(0, "RESULT: " << morse << ".");
291
292 morseparams = model.getParameters();
293 }
294 }
295
296 /******************* SATURATION TRAINING *******************/
297 FunctionModel::parameters_t params(SaturationPotential::MAXPARAMS, 0.);
298 {
299 // then we ought to pick the right HomologyGraph ...
300 const HomologyGraph graph = getFirstGraphwithTimesSpecificElement(homologies,8,1);
301 if (graph != HomologyGraph()) {
302 LOG(1, "First representative graph containing one saturated carbon is " << graph << ".");
303
304 // Afterwards we go through all of this type and gather the distance and the energy value
305 Fragment::charges_t h2o;
306 h2o += 8,1,1;
307 SaturationPotential::ParticleTypes_t types =
308 boost::assign::list_of<SaturationPotential::ParticleType_t>
309 (8)(1)
310 ;
311 SaturationPotential saturation(types);
312 TrainingData TersoffData(saturation.getFragmentSpecificExtractor(h2o));
313 boost::function< std::vector<FunctionModel::arguments_t>(const argument_t &, const double)> triplefunction =
314 boost::bind(&getTripleFromArgument, boost::cref(TersoffData.getTrainingInputs()), _1, _2);
315 saturation.setTriplefunction(triplefunction);
316
317 TersoffData( homologies.getHomologousGraphs(graph) );
318 LOG(1, "INFO: I gathered the following training data: " << TersoffData);
319 // NOTICE that distance are in bohrradi as they come from MPQC!
320
321 // now perform the function approximation by optimizing the model function
322 FunctionModel &model = saturation;
323 FunctionApproximation approximator(TersoffData, model); // CH4 has 5 atoms, hence 5*4/2 distances
324 if (model.isBoxConstraint() && approximator.checkParameterDerivatives()) {
325 // we set parameters here because we want to test with default ones
326 srand((unsigned)time(0)); // seed with current time
327 model.setParametersToRandomInitialValues(TersoffData);
328 approximator(FunctionApproximation::ParameterDerivative);
329 } else {
330 ELOG(0, "We require parameter derivatives for a box constraint minimization.");
331 return 1;
332 }
333
334 LOG(0, "RESULT: " << saturation << ".");
335
336 // check L2 and Lmax error against training set
337 LOG(1, "INFO: L2sum = " << TersoffData.getL2Error(model)
338 << ", LMax = " << TersoffData.getLMaxError(model) << ".");
339 }
340
341 }
342
343 return 0;
344}
Note: See TracBrowser for help on using the repository browser.