source: src/FunctionApproximation/TrainingData.cpp@ 16227a

Action_Thermostats Add_AtomRandomPerturbation Add_FitFragmentPartialChargesAction Add_RotateAroundBondAction Add_SelectAtomByNameAction Added_ParseSaveFragmentResults AddingActions_SaveParseParticleParameters Adding_Graph_to_ChangeBondActions Adding_MD_integration_tests Adding_ParticleName_to_Atom Adding_StructOpt_integration_tests AtomFragments Automaking_mpqc_open AutomationFragmentation_failures Candidate_v1.5.4 Candidate_v1.6.0 Candidate_v1.6.1 Candidate_v1.7.0 ChangeBugEmailaddress ChangingTestPorts ChemicalSpaceEvaluator CombiningParticlePotentialParsing Combining_Subpackages Debian_Package_split Debian_package_split_molecuildergui_only Disabling_MemDebug Docu_Python_wait EmpiricalPotential_contain_HomologyGraph EmpiricalPotential_contain_HomologyGraph_documentation Enable_parallel_make_install Enhance_userguide Enhanced_StructuralOptimization Enhanced_StructuralOptimization_continued Example_ManyWaysToTranslateAtom Exclude_Hydrogens_annealWithBondGraph FitPartialCharges_GlobalError Fix_BoundInBox_CenterInBox_MoleculeActions Fix_ChargeSampling_PBC Fix_ChronosMutex Fix_FitPartialCharges Fix_FitPotential_needs_atomicnumbers Fix_ForceAnnealing Fix_IndependentFragmentGrids Fix_ParseParticles Fix_ParseParticles_split_forward_backward_Actions Fix_PopActions Fix_QtFragmentList_sorted_selection Fix_Restrictedkeyset_FragmentMolecule Fix_StatusMsg Fix_StepWorldTime_single_argument Fix_Verbose_Codepatterns Fix_fitting_potentials Fixes ForceAnnealing_goodresults ForceAnnealing_oldresults ForceAnnealing_tocheck ForceAnnealing_with_BondGraph ForceAnnealing_with_BondGraph_continued ForceAnnealing_with_BondGraph_continued_betteresults ForceAnnealing_with_BondGraph_contraction-expansion FragmentAction_writes_AtomFragments FragmentMolecule_checks_bonddegrees GeometryObjects Gui_Fixes Gui_displays_atomic_force_velocity ImplicitCharges IndependentFragmentGrids IndependentFragmentGrids_IndividualZeroInstances IndependentFragmentGrids_IntegrationTest IndependentFragmentGrids_Sole_NN_Calculation JobMarket_RobustOnKillsSegFaults JobMarket_StableWorkerPool JobMarket_unresolvable_hostname_fix MoreRobust_FragmentAutomation ODR_violation_mpqc_open PartialCharges_OrthogonalSummation PdbParser_setsAtomName PythonUI_with_named_parameters QtGui_reactivate_TimeChanged_changes Recreated_GuiChecks Rewrite_FitPartialCharges RotateToPrincipalAxisSystem_UndoRedo SaturateAtoms_findBestMatching SaturateAtoms_singleDegree StoppableMakroAction Subpackage_CodePatterns Subpackage_JobMarket Subpackage_LinearAlgebra Subpackage_levmar Subpackage_mpqc_open Subpackage_vmg Switchable_LogView ThirdParty_MPQC_rebuilt_buildsystem TrajectoryDependenant_MaxOrder TremoloParser_IncreasedPrecision TremoloParser_MultipleTimesteps TremoloParser_setsAtomName Ubuntu_1604_changes stable
Last change on this file since 16227a was f4496d, checked in by Frederik Heber <heber@…>, 11 years ago

Extracted associating each configuration with its L2 error into TrainingData.

  • Property mode set to 100644
File size: 7.4 KB
Line 
1/*
2 * Project: MoleCuilder
3 * Description: creates and alters molecular systems
4 * Copyright (C) 2012 University of Bonn. All rights reserved.
5 * Copyright (C) 2013 Frederik Heber. All rights reserved.
6 * Please see the COPYING file or "Copyright notice" in builder.cpp for details.
7 *
8 *
9 * This file is part of MoleCuilder.
10 *
11 * MoleCuilder is free software: you can redistribute it and/or modify
12 * it under the terms of the GNU General Public License as published by
13 * the Free Software Foundation, either version 2 of the License, or
14 * (at your option) any later version.
15 *
16 * MoleCuilder is distributed in the hope that it will be useful,
17 * but WITHOUT ANY WARRANTY; without even the implied warranty of
18 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
19 * GNU General Public License for more details.
20 *
21 * You should have received a copy of the GNU General Public License
22 * along with MoleCuilder. If not, see <http://www.gnu.org/licenses/>.
23 */
24
25/*
26 * TrainingData.cpp
27 *
28 * Created on: 15.10.2012
29 * Author: heber
30 */
31
32// include config.h
33#ifdef HAVE_CONFIG_H
34#include <config.h>
35#endif
36
37#include "CodePatterns/MemDebug.hpp"
38
39#include "TrainingData.hpp"
40
41#include <algorithm>
42#include <boost/bind.hpp>
43#include <boost/foreach.hpp>
44#include <boost/lambda/lambda.hpp>
45#include <iostream>
46#include <sstream>
47
48#include "CodePatterns/Assert.hpp"
49#include "CodePatterns/Log.hpp"
50#include "CodePatterns/toString.hpp"
51
52#include "Fragmentation/Summation/SetValues/Fragment.hpp"
53#include "FunctionApproximation/FunctionArgument.hpp"
54#include "FunctionApproximation/FunctionModel.hpp"
55#include "FunctionApproximation/Extractors.hpp"
56
57void TrainingData::operator()(const range_t &range) {
58 for (HomologyContainer::const_iterator iter = range.first; iter != range.second; ++iter) {
59 const Fragment &fragment = iter->second.fragment;
60 // create internal list of arguments
61 FunctionModel::arguments_t all_args = Extractors::gatherAllSymmetricDistances(
62 fragment.getPositions(),
63 fragment.getCharges(),
64 DistanceVector.size()
65 );
66 DistanceVector.push_back( all_args );
67 const double &energy = iter->second.energy;
68 EnergyVector.push_back( FunctionModel::results_t(1, energy) );
69 // filter distances out of list of all arguments
70 FunctionModel::arguments_t args = filter(all_args);
71 LOG(3, "DEBUG: Filtered arguments are " << args << ".");
72 ArgumentVector.push_back( args );
73 }
74}
75
76const double TrainingData::getL2Error(const FunctionModel &model) const
77{
78 double L2sum = 0.;
79
80 FunctionApproximation::inputs_t::const_iterator initer = ArgumentVector.begin();
81 FunctionApproximation::outputs_t::const_iterator outiter = EnergyVector.begin();
82 for (; initer != ArgumentVector.end(); ++initer, ++outiter) {
83 const FunctionModel::results_t result = model((*initer));
84 const double temp = fabs((*outiter)[0] - result[0]);
85 L2sum += temp*temp;
86 }
87 return L2sum;
88}
89
90const double TrainingData::getLMaxError(const FunctionModel &model) const
91{
92 double Lmax = 0.;
93// size_t maxindex = -1;
94 FunctionApproximation::inputs_t::const_iterator initer = ArgumentVector.begin();
95 FunctionApproximation::outputs_t::const_iterator outiter = EnergyVector.begin();
96 for (; initer != ArgumentVector.end(); ++initer, ++outiter) {
97 const FunctionModel::results_t result = model((*initer));
98 const double temp = fabs((*outiter)[0] - result[0]);
99 if (temp > Lmax) {
100 Lmax = temp;
101// maxindex = std::distance(
102// const_cast<const FunctionApproximation::inputs_t &>(ArgumentVector).begin(),
103// initer
104// );
105 }
106 }
107 return Lmax;
108}
109
110const TrainingData::L2ErrorConfigurationIndexMap_t
111TrainingData::getWorstFragmentMap(
112 const FunctionModel &model,
113 const range_t &range) const
114{
115 TrainingData::L2ErrorConfigurationIndexMap_t WorseFragmentMap;
116 // fragments make it into the container in reversed order, hence count from top down
117 size_t index= std::distance(range.first, range.second)-1;
118 InputVector_t::const_iterator initer = ArgumentVector.begin();
119 OutputVector_t::const_iterator outiter = EnergyVector.begin();
120 for (; initer != ArgumentVector.end(); ++initer, ++outiter) {
121 // calculate value from potential
122 const FunctionModel::arguments_t &args = *initer;
123 const FunctionModel::results_t result = model(args);
124 const double energy = (*outiter)[0];
125
126 // insert difference into map
127 const double error = fabs(energy - result[0]);
128 WorseFragmentMap.insert( std::make_pair( error, index-- ) );
129
130 {
131 // give only the distances in the debugging text
132 std::stringstream streamargs;
133 BOOST_FOREACH (argument_t arg, args) {
134 streamargs << " " << arg.distance;
135 }
136 LOG(2, "DEBUG: frag.#" << index+1 << "'s error is |" << energy << " - " << result[0]
137 << "| = " << error << " for args " << streamargs.str() << ".");
138 }
139 }
140
141 return WorseFragmentMap;
142}
143
144const TrainingData::DistanceEnergyTable_t TrainingData::getDistanceEnergyTable() const
145{
146 TrainingData::DistanceEnergyTable_t table;
147
148 /// extract distance member variable from argument_t and first value from results_t
149 OutputVector_t::const_iterator ergiter = EnergyVector.begin();
150 for (InputVector_t::const_iterator iter = ArgumentVector.begin();
151 iter != ArgumentVector.end(); ++iter, ++ergiter) {
152 ASSERT( ergiter != EnergyVector.end(),
153 "TrainingData::getDistanceEnergyTable() - less output than input values.");
154 std::vector< double > values(iter->size(), 0.);
155 // transform all distances
156 const FunctionModel::arguments_t &args = *iter;
157 std::transform(
158 args.begin(), args.end(),
159 values.begin(),
160 boost::bind(&argument_t::distance, _1));
161
162 // get first energy value
163 values.push_back((*ergiter)[0]);
164
165 // push as table row
166 table.push_back(values);
167 }
168
169 return table;
170}
171
172const FunctionModel::results_t TrainingData::getTrainingOutputAverage() const
173{
174 if (EnergyVector.size() != 0) {
175 FunctionApproximation::outputs_t::const_iterator outiter = EnergyVector.begin();
176 FunctionModel::results_t result(*outiter);
177 for (++outiter; outiter != EnergyVector.end(); ++outiter)
178 for (size_t index = 0; index < (*outiter).size(); ++index)
179 result[index] += (*outiter)[index];
180 LOG(2, "DEBUG: Sum of EnergyVector is " << result << ".");
181 const double factor = 1./EnergyVector.size();
182 std::transform(result.begin(), result.end(), result.begin(),
183 boost::lambda::_1 * factor);
184 LOG(2, "DEBUG: Average EnergyVector is " << result << ".");
185 return result;
186 }
187 return FunctionModel::results_t();
188}
189
190std::ostream &operator<<(std::ostream &out, const TrainingData &data)
191{
192 const TrainingData::InputVector_t &DistanceVector = data.getAllArguments();
193 const TrainingData::OutputVector_t &EnergyVector = data.getTrainingOutputs();
194 out << "(" << DistanceVector.size()
195 << "," << EnergyVector.size() << ") data pairs: " << std::endl;
196 FunctionApproximation::inputs_t::const_iterator initer = DistanceVector.begin();
197 FunctionApproximation::outputs_t::const_iterator outiter = EnergyVector.begin();
198 for (; initer != DistanceVector.end(); ++initer, ++outiter) {
199 for (size_t index = 0; index < (*initer).size(); ++index)
200 out << "(" << (*initer)[index].indices.first << "," << (*initer)[index].indices.second
201 << ") " << (*initer)[index].distance;
202 out << " with energy ";
203 out << (*outiter);
204 out << std::endl;
205 }
206 return out;
207}
Note: See TracBrowser for help on using the repository browser.