source: src/molecule_fragmentation.cpp@ 15f6e9

Action_Thermostats Add_AtomRandomPerturbation Add_FitFragmentPartialChargesAction Add_RotateAroundBondAction Add_SelectAtomByNameAction Added_ParseSaveFragmentResults AddingActions_SaveParseParticleParameters Adding_Graph_to_ChangeBondActions Adding_MD_integration_tests Adding_ParticleName_to_Atom Adding_StructOpt_integration_tests AtomFragments Automaking_mpqc_open AutomationFragmentation_failures Candidate_v1.5.4 Candidate_v1.6.0 Candidate_v1.6.1 Candidate_v1.7.0 ChangeBugEmailaddress ChangingTestPorts ChemicalSpaceEvaluator CombiningParticlePotentialParsing Combining_Subpackages Debian_Package_split Debian_package_split_molecuildergui_only Disabling_MemDebug Docu_Python_wait EmpiricalPotential_contain_HomologyGraph EmpiricalPotential_contain_HomologyGraph_documentation Enable_parallel_make_install Enhance_userguide Enhanced_StructuralOptimization Enhanced_StructuralOptimization_continued Example_ManyWaysToTranslateAtom Exclude_Hydrogens_annealWithBondGraph FitPartialCharges_GlobalError Fix_BoundInBox_CenterInBox_MoleculeActions Fix_ChargeSampling_PBC Fix_ChronosMutex Fix_FitPartialCharges Fix_FitPotential_needs_atomicnumbers Fix_ForceAnnealing Fix_IndependentFragmentGrids Fix_ParseParticles Fix_ParseParticles_split_forward_backward_Actions Fix_PopActions Fix_QtFragmentList_sorted_selection Fix_Restrictedkeyset_FragmentMolecule Fix_StatusMsg Fix_StepWorldTime_single_argument Fix_Verbose_Codepatterns Fix_fitting_potentials Fixes ForceAnnealing_goodresults ForceAnnealing_oldresults ForceAnnealing_tocheck ForceAnnealing_with_BondGraph ForceAnnealing_with_BondGraph_continued ForceAnnealing_with_BondGraph_continued_betteresults ForceAnnealing_with_BondGraph_contraction-expansion FragmentAction_writes_AtomFragments FragmentMolecule_checks_bonddegrees GeometryObjects Gui_Fixes Gui_displays_atomic_force_velocity ImplicitCharges IndependentFragmentGrids IndependentFragmentGrids_IndividualZeroInstances IndependentFragmentGrids_IntegrationTest IndependentFragmentGrids_Sole_NN_Calculation JobMarket_RobustOnKillsSegFaults JobMarket_StableWorkerPool JobMarket_unresolvable_hostname_fix MoreRobust_FragmentAutomation ODR_violation_mpqc_open PartialCharges_OrthogonalSummation PdbParser_setsAtomName PythonUI_with_named_parameters QtGui_reactivate_TimeChanged_changes Recreated_GuiChecks Rewrite_FitPartialCharges RotateToPrincipalAxisSystem_UndoRedo SaturateAtoms_findBestMatching SaturateAtoms_singleDegree StoppableMakroAction Subpackage_CodePatterns Subpackage_JobMarket Subpackage_LinearAlgebra Subpackage_levmar Subpackage_mpqc_open Subpackage_vmg Switchable_LogView ThirdParty_MPQC_rebuilt_buildsystem TrajectoryDependenant_MaxOrder TremoloParser_IncreasedPrecision TremoloParser_MultipleTimesteps TremoloParser_setsAtomName Ubuntu_1604_changes stable
Last change on this file since 15f6e9 was 00b59d5, checked in by Frederik Heber <heber@…>, 15 years ago

FIX: molecule::FragmentMolecule() did not remove copied atoms and molecules.

  • Subgraph copies molecules, are now removed in MoleculeLeafClass dstor.
  • BondFragments's molecules, i.e. the created fragments, are not removed, hence the output file got a lot bigger ...
  • Property mode set to 100644
File size: 81.3 KB
RevLine 
[bcf653]1/*
2 * Project: MoleCuilder
3 * Description: creates and alters molecular systems
4 * Copyright (C) 2010 University of Bonn. All rights reserved.
5 * Please see the LICENSE file or "Copyright notice" in builder.cpp for details.
6 */
7
[cee0b57]8/*
9 * molecule_fragmentation.cpp
10 *
11 * Created on: Oct 5, 2009
12 * Author: heber
13 */
14
[bf3817]15// include config.h
16#ifdef HAVE_CONFIG_H
17#include <config.h>
18#endif
19
[ad011c]20#include "CodePatterns/MemDebug.hpp"
[112b09]21
[49e1ae]22#include <cstring>
23
[cbc5fb]24#include "World.hpp"
[f66195]25#include "atom.hpp"
26#include "bond.hpp"
[cee0b57]27#include "config.hpp"
[f66195]28#include "element.hpp"
[952f38]29#include "Helpers/helpers.hpp"
[f66195]30#include "lists.hpp"
[ad011c]31#include "CodePatterns/Verbose.hpp"
32#include "CodePatterns/Log.hpp"
[cee0b57]33#include "molecule.hpp"
[f66195]34#include "periodentafel.hpp"
[b34306]35#include "World.hpp"
[cca9ef]36#include "LinearAlgebra/RealSpaceMatrix.hpp"
[84c494]37#include "Box.hpp"
[cee0b57]38
39/************************************* Functions for class molecule *********************************/
40
41
42/** Estimates by educated guessing (using upper limit) the expected number of fragments.
43 * The upper limit is
44 * \f[
45 * n = N \cdot C^k
46 * \f]
47 * where \f$C=2^c\f$ and c is the maximum bond degree over N number of atoms.
48 * \param *out output stream for debugging
49 * \param order bond order k
50 * \return number n of fragments
51 */
[e138de]52int molecule::GuesstimateFragmentCount(int order)
[cee0b57]53{
[266237]54 size_t c = 0;
[cee0b57]55 int FragmentCount;
56 // get maximum bond degree
[9879f6]57 for (molecule::const_iterator iter = begin(); iter != end(); ++iter) {
58 c = ((*iter)->ListOfBonds.size() > c) ? (*iter)->ListOfBonds.size() : c;
[cee0b57]59 }
60 FragmentCount = NoNonHydrogen*(1 << (c*order));
[a67d19]61 DoLog(1) && (Log() << Verbose(1) << "Upper limit for this subgraph is " << FragmentCount << " for " << NoNonHydrogen << " non-H atoms with maximum bond degree of " << c << "." << endl);
[cee0b57]62 return FragmentCount;
63};
64
65/** Scans a single line for number and puts them into \a KeySet.
66 * \param *out output stream for debugging
67 * \param *buffer buffer to scan
68 * \param &CurrentSet filled KeySet on return
69 * \return true - at least one valid atom id parsed, false - CurrentSet is empty
70 */
[e138de]71bool ScanBufferIntoKeySet(char *buffer, KeySet &CurrentSet)
[cee0b57]72{
73 stringstream line;
74 int AtomNr;
75 int status = 0;
76
77 line.str(buffer);
78 while (!line.eof()) {
79 line >> AtomNr;
[5034e1]80 if (AtomNr >= 0) {
[cee0b57]81 CurrentSet.insert(AtomNr); // insert at end, hence in same order as in file!
82 status++;
83 } // else it's "-1" or else and thus must not be added
84 }
[a67d19]85 DoLog(1) && (Log() << Verbose(1) << "The scanned KeySet is ");
[cee0b57]86 for(KeySet::iterator runner = CurrentSet.begin(); runner != CurrentSet.end(); runner++) {
[a67d19]87 DoLog(0) && (Log() << Verbose(0) << (*runner) << "\t");
[cee0b57]88 }
[a67d19]89 DoLog(0) && (Log() << Verbose(0) << endl);
[cee0b57]90 return (status != 0);
91};
92
93/** Parses the KeySet file and fills \a *FragmentList from the known molecule structure.
94 * Does two-pass scanning:
95 * -# Scans the keyset file and initialises a temporary graph
96 * -# Scans TEFactors file and sets the TEFactor of each key set in the temporary graph accordingly
97 * Finally, the temporary graph is inserted into the given \a FragmentList for return.
[35b698]98 * \param &path path to file
[cee0b57]99 * \param *FragmentList empty, filled on return
100 * \return true - parsing successfully, false - failure on parsing (FragmentList will be NULL)
101 */
[35b698]102bool ParseKeySetFile(std::string &path, Graph *&FragmentList)
[cee0b57]103{
104 bool status = true;
105 ifstream InputFile;
106 stringstream line;
107 GraphTestPair testGraphInsert;
108 int NumberOfFragments = 0;
[35b698]109 string filename;
[cee0b57]110
111 if (FragmentList == NULL) { // check list pointer
112 FragmentList = new Graph;
113 }
114
115 // 1st pass: open file and read
[a67d19]116 DoLog(1) && (Log() << Verbose(1) << "Parsing the KeySet file ... " << endl);
[35b698]117 filename = path + KEYSETFILE;
118 InputFile.open(filename.c_str());
119 if (InputFile.good()) {
[cee0b57]120 // each line represents a new fragment
[920c70]121 char buffer[MAXSTRINGSIZE];
[cee0b57]122 // 1. parse keysets and insert into temp. graph
123 while (!InputFile.eof()) {
124 InputFile.getline(buffer, MAXSTRINGSIZE);
125 KeySet CurrentSet;
[e138de]126 if ((strlen(buffer) > 0) && (ScanBufferIntoKeySet(buffer, CurrentSet))) { // if at least one valid atom was added, write config
[cee0b57]127 testGraphInsert = FragmentList->insert(GraphPair (CurrentSet,pair<int,double>(NumberOfFragments++,1))); // store fragment number and current factor
128 if (!testGraphInsert.second) {
[58ed4a]129 DoeLog(0) && (eLog()<< Verbose(0) << "KeySet file must be corrupt as there are two equal key sets therein!" << endl);
[e359a8]130 performCriticalExit();
[cee0b57]131 }
132 }
133 }
134 // 2. Free and done
135 InputFile.close();
136 InputFile.clear();
[0de7e8]137 DoLog(1) && (Log() << Verbose(1) << "\t ... done." << endl);
[cee0b57]138 } else {
[0de7e8]139 DoLog(1) && (Log() << Verbose(1) << "\t ... File " << filename << " not found." << endl);
[cee0b57]140 status = false;
141 }
142
[5034e1]143 return status;
144};
145
146/** Parses the TE factors file and fills \a *FragmentList from the known molecule structure.
147 * -# Scans TEFactors file and sets the TEFactor of each key set in the temporary graph accordingly
148 * \param *out output stream for debugging
149 * \param *path path to file
150 * \param *FragmentList graph whose nodes's TE factors are set on return
151 * \return true - parsing successfully, false - failure on parsing
152 */
[e138de]153bool ParseTEFactorsFile(char *path, Graph *FragmentList)
[5034e1]154{
155 bool status = true;
156 ifstream InputFile;
157 stringstream line;
158 GraphTestPair testGraphInsert;
159 int NumberOfFragments = 0;
160 double TEFactor;
[920c70]161 char filename[MAXSTRINGSIZE];
[5034e1]162
163 if (FragmentList == NULL) { // check list pointer
164 FragmentList = new Graph;
165 }
166
[cee0b57]167 // 2nd pass: open TEFactors file and read
[a67d19]168 DoLog(1) && (Log() << Verbose(1) << "Parsing the TEFactors file ... " << endl);
[cee0b57]169 sprintf(filename, "%s/%s%s", path, FRAGMENTPREFIX, TEFACTORSFILE);
170 InputFile.open(filename);
171 if (InputFile != NULL) {
172 // 3. add found TEFactors to each keyset
173 NumberOfFragments = 0;
174 for(Graph::iterator runner = FragmentList->begin();runner != FragmentList->end(); runner++) {
175 if (!InputFile.eof()) {
176 InputFile >> TEFactor;
177 (*runner).second.second = TEFactor;
[a67d19]178 DoLog(2) && (Log() << Verbose(2) << "Setting " << ++NumberOfFragments << " fragment's TEFactor to " << (*runner).second.second << "." << endl);
[cee0b57]179 } else {
180 status = false;
181 break;
182 }
183 }
184 // 4. Free and done
185 InputFile.close();
[a67d19]186 DoLog(1) && (Log() << Verbose(1) << "done." << endl);
[cee0b57]187 } else {
[a67d19]188 DoLog(1) && (Log() << Verbose(1) << "File " << filename << " not found." << endl);
[cee0b57]189 status = false;
190 }
191
192 return status;
193};
194
[5034e1]195/** Stores key sets to file.
196 * \param KeySetList Graph with Keysets
[35b698]197 * \param &path path to file
[cee0b57]198 * \return true - file written successfully, false - writing failed
199 */
[35b698]200bool StoreKeySetFile(Graph &KeySetList, std::string &path)
[cee0b57]201{
202 bool status = true;
[35b698]203 string line = path + KEYSETFILE;
204 ofstream output(line.c_str());
[cee0b57]205
206 // open KeySet file
[a67d19]207 DoLog(1) && (Log() << Verbose(1) << "Saving key sets of the total graph ... ");
[35b698]208 if(output.good()) {
[cee0b57]209 for(Graph::iterator runner = KeySetList.begin(); runner != KeySetList.end(); runner++) {
210 for (KeySet::iterator sprinter = (*runner).first.begin();sprinter != (*runner).first.end(); sprinter++) {
211 if (sprinter != (*runner).first.begin())
212 output << "\t";
213 output << *sprinter;
214 }
215 output << endl;
216 }
[a67d19]217 DoLog(0) && (Log() << Verbose(0) << "done." << endl);
[cee0b57]218 } else {
[58ed4a]219 DoeLog(0) && (eLog()<< Verbose(0) << "Unable to open " << line << " for writing keysets!" << endl);
[e359a8]220 performCriticalExit();
[cee0b57]221 status = false;
222 }
223 output.close();
224 output.clear();
225
[5034e1]226 return status;
227};
228
229
230/** Stores TEFactors to file.
231 * \param *out output stream for debugging
232 * \param KeySetList Graph with factors
233 * \param *path path to file
234 * \return true - file written successfully, false - writing failed
235 */
[e138de]236bool StoreTEFactorsFile(Graph &KeySetList, char *path)
[5034e1]237{
238 ofstream output;
239 bool status = true;
240 string line;
241
[cee0b57]242 // open TEFactors file
243 line = path;
244 line.append("/");
245 line += FRAGMENTPREFIX;
246 line += TEFACTORSFILE;
247 output.open(line.c_str(), ios::out);
[a67d19]248 DoLog(1) && (Log() << Verbose(1) << "Saving TEFactors of the total graph ... ");
[cee0b57]249 if(output != NULL) {
250 for(Graph::iterator runner = KeySetList.begin(); runner != KeySetList.end(); runner++)
251 output << (*runner).second.second << endl;
[a67d19]252 DoLog(1) && (Log() << Verbose(1) << "done." << endl);
[cee0b57]253 } else {
[a67d19]254 DoLog(1) && (Log() << Verbose(1) << "failed to open " << line << "." << endl);
[cee0b57]255 status = false;
256 }
257 output.close();
258
259 return status;
260};
261
[5034e1]262/** For a given graph, sorts KeySets into a (index, keyset) map.
263 * \param *GlobalKeySetList list of keysets with global ids (valid in "this" molecule) needed for adaptive increase
264 * \return map from index to keyset
265 */
266map<int,KeySet> * GraphToIndexedKeySet(Graph *GlobalKeySetList)
267{
268 map<int,KeySet> *IndexKeySetList = new map<int,KeySet>;
269 for(Graph::iterator runner = GlobalKeySetList->begin(); runner != GlobalKeySetList->end(); runner++) {
270 IndexKeySetList->insert( pair<int,KeySet>(runner->second.first,runner->first) );
271 }
272 return IndexKeySetList;
273};
274
275/** Inserts a (\a No, \a value) pair into the list, overwriting present one.
276 * Note if values are equal, No will decided on which is first
277 * \param *out output stream for debugging
278 * \param &AdaptiveCriteriaList list to insert into
279 * \param &IndexedKeySetList list to find key set for a given index \a No
280 * \param FragOrder current bond order of fragment
281 * \param No index of keyset
282 * \param value energy value
283 */
[e138de]284void InsertIntoAdaptiveCriteriaList(map<int, pair<double,int> > *AdaptiveCriteriaList, map<int,KeySet> &IndexKeySetList, int FragOrder, int No, double Value)
[5034e1]285{
286 map<int,KeySet>::iterator marker = IndexKeySetList.find(No); // find keyset to Frag No.
287 if (marker != IndexKeySetList.end()) { // if found
288 Value *= 1 + MYEPSILON*(*((*marker).second.begin())); // in case of equal energies this makes them not equal without changing anything actually
289 // as the smallest number in each set has always been the root (we use global id to keep the doubles away), seek smallest and insert into AtomMask
290 pair <map<int, pair<double,int> >::iterator, bool> InsertedElement = AdaptiveCriteriaList->insert( make_pair(*((*marker).second.begin()), pair<double,int>( fabs(Value), FragOrder) ));
291 map<int, pair<double,int> >::iterator PresentItem = InsertedElement.first;
292 if (!InsertedElement.second) { // this root is already present
293 if ((*PresentItem).second.second < FragOrder) // if order there is lower, update entry with higher-order term
294 //if ((*PresentItem).second.first < (*runner).first) // as higher-order terms are not always better, we skip this part (which would always include this site into adaptive increase)
295 { // if value is smaller, update value and order
296 (*PresentItem).second.first = fabs(Value);
297 (*PresentItem).second.second = FragOrder;
[a67d19]298 DoLog(2) && (Log() << Verbose(2) << "Updated element (" << (*PresentItem).first << ",[" << (*PresentItem).second.first << "," << (*PresentItem).second.second << "])." << endl);
[5034e1]299 } else {
[a67d19]300 DoLog(2) && (Log() << Verbose(2) << "Did not update element " << (*PresentItem).first << " as " << FragOrder << " is less than or equal to " << (*PresentItem).second.second << "." << endl);
[5034e1]301 }
302 } else {
[a67d19]303 DoLog(2) && (Log() << Verbose(2) << "Inserted element (" << (*PresentItem).first << ",[" << (*PresentItem).second.first << "," << (*PresentItem).second.second << "])." << endl);
[5034e1]304 }
305 } else {
[a67d19]306 DoLog(1) && (Log() << Verbose(1) << "No Fragment under No. " << No << "found." << endl);
[5034e1]307 }
308};
309
[a0064e]310/** Counts lines in file.
311 * Note we are scanning lines from current position, not from beginning.
312 * \param InputFile file to be scanned.
313 */
314int CountLinesinFile(ifstream &InputFile)
315{
316 char *buffer = new char[MAXSTRINGSIZE];
317 int lines=0;
318
319 int PositionMarker = InputFile.tellg(); // not needed as Inputfile is copied, given by value, not by ref
320 // count the number of lines, i.e. the number of fragments
321 InputFile.getline(buffer, MAXSTRINGSIZE); // skip comment lines
322 InputFile.getline(buffer, MAXSTRINGSIZE);
323 while(!InputFile.eof()) {
324 InputFile.getline(buffer, MAXSTRINGSIZE);
325 lines++;
326 }
327 InputFile.seekg(PositionMarker, ios::beg);
328 delete[](buffer);
329 return lines;
330};
331
332
[5034e1]333/** Scans the adaptive order file and insert (index, value) into map.
[35b698]334 * \param &path path to ENERGYPERFRAGMENT file (may be NULL if Order is non-negative)
[5034e1]335 * \param &IndexedKeySetList list to find key set for a given index \a No
336 * \return adaptive criteria list from file
337 */
[35b698]338map<int, pair<double,int> > * ScanAdaptiveFileIntoMap(std::string &path, map<int,KeySet> &IndexKeySetList)
[5034e1]339{
340 map<int, pair<double,int> > *AdaptiveCriteriaList = new map<int, pair<double,int> >;
341 int No = 0, FragOrder = 0;
342 double Value = 0.;
[920c70]343 char buffer[MAXSTRINGSIZE];
[35b698]344 string filename = path + ENERGYPERFRAGMENT;
345 ifstream InputFile(filename.c_str());
346
347 if (InputFile.fail()) {
348 DoeLog(1) && (eLog() << Verbose(1) << "Cannot find file " << filename << "." << endl);
349 return AdaptiveCriteriaList;
350 }
[5034e1]351
352 if (CountLinesinFile(InputFile) > 0) {
353 // each line represents a fragment root (Atom::nr) id and its energy contribution
354 InputFile.getline(buffer, MAXSTRINGSIZE); // skip comment lines
355 InputFile.getline(buffer, MAXSTRINGSIZE);
356 while(!InputFile.eof()) {
357 InputFile.getline(buffer, MAXSTRINGSIZE);
358 if (strlen(buffer) > 2) {
[e138de]359 //Log() << Verbose(2) << "Scanning: " << buffer << endl;
[5034e1]360 stringstream line(buffer);
361 line >> FragOrder;
362 line >> ws >> No;
363 line >> ws >> Value; // skip time entry
364 line >> ws >> Value;
365 No -= 1; // indices start at 1 in file, not 0
[e138de]366 //Log() << Verbose(2) << " - yields (" << No << "," << Value << ", " << FragOrder << ")" << endl;
[5034e1]367
368 // clean the list of those entries that have been superceded by higher order terms already
[e138de]369 InsertIntoAdaptiveCriteriaList(AdaptiveCriteriaList, IndexKeySetList, FragOrder, No, Value);
[5034e1]370 }
371 }
372 // close and done
373 InputFile.close();
374 InputFile.clear();
375 }
376
377 return AdaptiveCriteriaList;
378};
379
380/** Maps adaptive criteria list back onto (Value, (Root Nr., Order))
381 * (i.e. sorted by value to pick the highest ones)
382 * \param *out output stream for debugging
383 * \param &AdaptiveCriteriaList list to insert into
384 * \param *mol molecule with atoms
385 * \return remapped list
386 */
[e138de]387map<double, pair<int,int> > * ReMapAdaptiveCriteriaListToValue(map<int, pair<double,int> > *AdaptiveCriteriaList, molecule *mol)
[5034e1]388{
[9879f6]389 atom *Walker = NULL;
[5034e1]390 map<double, pair<int,int> > *FinalRootCandidates = new map<double, pair<int,int> > ;
[a67d19]391 DoLog(1) && (Log() << Verbose(1) << "Root candidate list is: " << endl);
[5034e1]392 for(map<int, pair<double,int> >::iterator runner = AdaptiveCriteriaList->begin(); runner != AdaptiveCriteriaList->end(); runner++) {
393 Walker = mol->FindAtom((*runner).first);
394 if (Walker != NULL) {
395 //if ((*runner).second.second >= Walker->AdaptiveOrder) { // only insert if this is an "active" root site for the current order
396 if (!Walker->MaxOrder) {
[a67d19]397 DoLog(2) && (Log() << Verbose(2) << "(" << (*runner).first << ",[" << (*runner).second.first << "," << (*runner).second.second << "])" << endl);
[5034e1]398 FinalRootCandidates->insert( make_pair( (*runner).second.first, pair<int,int>((*runner).first, (*runner).second.second) ) );
399 } else {
[a67d19]400 DoLog(2) && (Log() << Verbose(2) << "Excluding (" << *Walker << ", " << (*runner).first << ",[" << (*runner).second.first << "," << (*runner).second.second << "]), as it has reached its maximum order." << endl);
[5034e1]401 }
402 } else {
[58ed4a]403 DoeLog(0) && (eLog()<< Verbose(0) << "Atom No. " << (*runner).second.first << " was not found in this molecule." << endl);
[e359a8]404 performCriticalExit();
[5034e1]405 }
406 }
407 return FinalRootCandidates;
408};
409
410/** Marks all candidate sites for update if below adaptive threshold.
411 * Picks a given number of highest values and set *AtomMask to true.
412 * \param *out output stream for debugging
413 * \param *AtomMask defines true/false per global Atom::nr to mask in/out each nuclear site, used to activate given number of site to increment order adaptively
414 * \param FinalRootCandidates list candidates to check
415 * \param Order desired order
416 * \param *mol molecule with atoms
417 * \return true - if update is necessary, false - not
418 */
[e138de]419bool MarkUpdateCandidates(bool *AtomMask, map<double, pair<int,int> > &FinalRootCandidates, int Order, molecule *mol)
[5034e1]420{
[9879f6]421 atom *Walker = NULL;
[5034e1]422 int No = -1;
423 bool status = false;
424 for(map<double, pair<int,int> >::iterator runner = FinalRootCandidates.upper_bound(pow(10.,Order)); runner != FinalRootCandidates.end(); runner++) {
425 No = (*runner).second.first;
426 Walker = mol->FindAtom(No);
427 //if (Walker->AdaptiveOrder < MinimumRingSize[Walker->nr]) {
[a67d19]428 DoLog(2) && (Log() << Verbose(2) << "Root " << No << " is still above threshold (10^{" << Order <<"}: " << runner->first << ", setting entry " << No << " of Atom mask to true." << endl);
[5034e1]429 AtomMask[No] = true;
430 status = true;
431 //} else
[e138de]432 //Log() << Verbose(2) << "Root " << No << " is still above threshold (10^{" << Order <<"}: " << runner->first << ", however MinimumRingSize of " << MinimumRingSize[Walker->nr] << " does not allow further adaptive increase." << endl;
[5034e1]433 }
434 return status;
435};
436
437/** print atom mask for debugging.
438 * \param *out output stream for debugging
439 * \param *AtomMask defines true/false per global Atom::nr to mask in/out each nuclear site, used to activate given number of site to increment order adaptively
440 * \param AtomCount number of entries in \a *AtomMask
441 */
[e138de]442void PrintAtomMask(bool *AtomMask, int AtomCount)
[5034e1]443{
[a67d19]444 DoLog(2) && (Log() << Verbose(2) << " ");
[5034e1]445 for(int i=0;i<AtomCount;i++)
[a67d19]446 DoLog(0) && (Log() << Verbose(0) << (i % 10));
447 DoLog(0) && (Log() << Verbose(0) << endl);
448 DoLog(2) && (Log() << Verbose(2) << "Atom mask is: ");
[5034e1]449 for(int i=0;i<AtomCount;i++)
[a67d19]450 DoLog(0) && (Log() << Verbose(0) << (AtomMask[i] ? "t" : "f"));
451 DoLog(0) && (Log() << Verbose(0) << endl);
[5034e1]452};
[cee0b57]453
454/** Checks whether the OrderAtSite is still below \a Order at some site.
455 * \param *AtomMask defines true/false per global Atom::nr to mask in/out each nuclear site, used to activate given number of site to increment order adaptively
456 * \param *GlobalKeySetList list of keysets with global ids (valid in "this" molecule) needed for adaptive increase
457 * \param Order desired Order if positive, desired exponent in threshold criteria if negative (0 is single-step)
458 * \param *MinimumRingSize array of max. possible order to avoid loops
[35b698]459 * \param path path to ENERGYPERFRAGMENT file (may be NULL if Order is non-negative)
[cee0b57]460 * \return true - needs further fragmentation, false - does not need fragmentation
461 */
[35b698]462bool molecule::CheckOrderAtSite(bool *AtomMask, Graph *GlobalKeySetList, int Order, int *MinimumRingSize, std::string path)
[cee0b57]463{
464 bool status = false;
465
466 // initialize mask list
[ea7176]467 for(int i=getAtomCount();i--;)
[cee0b57]468 AtomMask[i] = false;
469
470 if (Order < 0) { // adaptive increase of BondOrder per site
[ea7176]471 if (AtomMask[getAtomCount()] == true) // break after one step
[cee0b57]472 return false;
[5034e1]473
474 // transmorph graph keyset list into indexed KeySetList
475 if (GlobalKeySetList == NULL) {
[58ed4a]476 DoeLog(1) && (eLog()<< Verbose(1) << "Given global key set list (graph) is NULL!" << endl);
[5034e1]477 return false;
478 }
479 map<int,KeySet> *IndexKeySetList = GraphToIndexedKeySet(GlobalKeySetList);
480
[cee0b57]481 // parse the EnergyPerFragment file
[e138de]482 map<int, pair<double,int> > *AdaptiveCriteriaList = ScanAdaptiveFileIntoMap(path, *IndexKeySetList); // (Root No., (Value, Order)) !
[5034e1]483 if (AdaptiveCriteriaList->empty()) {
[58ed4a]484 DoeLog(2) && (eLog()<< Verbose(2) << "Unable to parse file, incrementing all." << endl);
[9879f6]485 for (molecule::const_iterator iter = begin(); iter != end(); ++iter) {
[cee0b57]486 #ifdef ADDHYDROGEN
[83f176]487 if ((*iter)->getType()->getAtomicNumber() != 1) // skip hydrogen
[cee0b57]488 #endif
489 {
[9879f6]490 AtomMask[(*iter)->nr] = true; // include all (non-hydrogen) atoms
[cee0b57]491 status = true;
492 }
493 }
494 }
[5034e1]495 // then map back onto (Value, (Root Nr., Order)) (i.e. sorted by value to pick the highest ones)
[e138de]496 map<double, pair<int,int> > *FinalRootCandidates = ReMapAdaptiveCriteriaListToValue(AdaptiveCriteriaList, this);
[5034e1]497
498 // pick the ones still below threshold and mark as to be adaptively updated
[e138de]499 MarkUpdateCandidates(AtomMask, *FinalRootCandidates, Order, this);
[5034e1]500
[920c70]501 delete[](IndexKeySetList);
502 delete[](AdaptiveCriteriaList);
503 delete[](FinalRootCandidates);
[cee0b57]504 } else { // global increase of Bond Order
[9879f6]505 for(molecule::const_iterator iter = begin(); iter != end(); ++iter) {
[cee0b57]506 #ifdef ADDHYDROGEN
[83f176]507 if ((*iter)->getType()->getAtomicNumber() != 1) // skip hydrogen
[cee0b57]508 #endif
509 {
[9879f6]510 AtomMask[(*iter)->nr] = true; // include all (non-hydrogen) atoms
511 if ((Order != 0) && ((*iter)->AdaptiveOrder < Order)) // && ((*iter)->AdaptiveOrder < MinimumRingSize[(*iter)->nr]))
[cee0b57]512 status = true;
513 }
514 }
[ea7176]515 if ((!Order) && (!AtomMask[getAtomCount()])) // single stepping, just check
[cee0b57]516 status = true;
517
518 if (!status) {
519 if (Order == 0)
[a67d19]520 DoLog(1) && (Log() << Verbose(1) << "Single stepping done." << endl);
[cee0b57]521 else
[a67d19]522 DoLog(1) && (Log() << Verbose(1) << "Order at every site is already equal or above desired order " << Order << "." << endl);
[cee0b57]523 }
524 }
525
[ea7176]526 PrintAtomMask(AtomMask, getAtomCount()); // for debugging
[cee0b57]527
528 return status;
529};
530
531/** Create a SortIndex to map from atomic labels to the sequence in which the atoms are given in the config file.
532 * \param *out output stream for debugging
533 * \param *&SortIndex Mapping array of size molecule::AtomCount
534 * \return true - success, false - failure of SortIndex alloc
535 */
[e138de]536bool molecule::CreateMappingLabelsToConfigSequence(int *&SortIndex)
[cee0b57]537{
538 if (SortIndex != NULL) {
[a67d19]539 DoLog(1) && (Log() << Verbose(1) << "SortIndex is " << SortIndex << " and not NULL as expected." << endl);
[cee0b57]540 return false;
541 }
[1024cb]542 SortIndex = new int[getAtomCount()];
[ea7176]543 for(int i=getAtomCount();i--;)
[cee0b57]544 SortIndex[i] = -1;
[5034e1]545
546 int AtomNo = 0;
[32ea56]547 for(internal_iterator iter=atoms.begin();iter!=atoms.end();++iter){
548 ASSERT(SortIndex[(*iter)->nr]==-1,"Same SortIndex set twice");
549 SortIndex[(*iter)->nr] = AtomNo++;
550 }
[5034e1]551
[cee0b57]552 return true;
553};
554
[9879f6]555
556
557/** Creates a lookup table for true father's Atom::Nr -> atom ptr.
558 * \param *start begin of list (STL iterator, i.e. first item)
559 * \paran *end end of list (STL iterator, i.e. one past last item)
560 * \param **Lookuptable pointer to return allocated lookup table (should be NULL on start)
561 * \param count optional predetermined size for table (otherwise we set the count to highest true father id)
562 * \return true - success, false - failure
563 */
564bool molecule::CreateFatherLookupTable(atom **&LookupTable, int count)
565{
566 bool status = true;
567 int AtomNo;
568
569 if (LookupTable != NULL) {
570 Log() << Verbose(0) << "Pointer for Lookup table is not NULL! Aborting ..." <<endl;
571 return false;
572 }
573
574 // count them
575 if (count == 0) {
576 for (molecule::iterator iter = begin(); iter != end(); ++iter) { // create a lookup table (Atom::nr -> atom) used as a marker table lateron
577 count = (count < (*iter)->GetTrueFather()->nr) ? (*iter)->GetTrueFather()->nr : count;
578 }
579 }
580 if (count <= 0) {
581 Log() << Verbose(0) << "Count of lookup list is 0 or less." << endl;
582 return false;
583 }
584
585 // allocate and fill
[1024cb]586 LookupTable = new atom *[count];
[9879f6]587 if (LookupTable == NULL) {
588 eLog() << Verbose(0) << "LookupTable memory allocation failed!" << endl;
589 performCriticalExit();
590 status = false;
591 } else {
[1024cb]592 for (int i=0;i<count;i++)
593 LookupTable[i] = NULL;
[9879f6]594 for (molecule::iterator iter = begin(); iter != end(); ++iter) {
595 AtomNo = (*iter)->GetTrueFather()->nr;
596 if ((AtomNo >= 0) && (AtomNo < count)) {
597 //*out << "Setting LookupTable[" << AtomNo << "] to " << *(*iter) << endl;
598 LookupTable[AtomNo] = (*iter);
599 } else {
600 Log() << Verbose(0) << "Walker " << *(*iter) << " exceeded range of nuclear ids [0, " << count << ")." << endl;
601 status = false;
602 break;
603 }
604 }
605 }
606
607 return status;
608};
609
[cee0b57]610/** Performs a many-body bond order analysis for a given bond order.
611 * -# parses adjacency, keysets and orderatsite files
612 * -# performs DFS to find connected subgraphs (to leave this in was a design decision: might be useful later)
613 * -# RootStack is created for every subgraph (here, later we implement the "update 10 sites with highest energ
614y contribution", and that's why this consciously not done in the following loop)
615 * -# in a loop over all subgraphs
616 * -# calls FragmentBOSSANOVA with this RootStack and within the subgraph molecule structure
617 * -# creates molecule (fragment)s from the returned keysets (StoreFragmentFromKeySet)
618 * -# combines the generated molecule lists from all subgraphs
619 * -# saves to disk: fragment configs, adjacency, orderatsite, keyset files
620 * Note that as we split "this" molecule up into a list of subgraphs, i.e. a MoleculeListClass, we have two sets
621 * of vertex indices: Global always means the index in "this" molecule, whereas local refers to the molecule or
622 * subgraph in the MoleculeListClass.
623 * \param Order up to how many neighbouring bonds a fragment contains in BondOrderScheme::BottumUp scheme
[35b698]624 * \param &prefix path and prefix of the bond order configs to be written
[cee0b57]625 * \return 1 - continue, 2 - stop (no fragmentation occured)
626 */
[35b698]627int molecule::FragmentMolecule(int Order, std::string &prefix)
[cee0b57]628{
629 MoleculeListClass *BondFragments = NULL;
[ea7176]630 int *MinimumRingSize = new int[getAtomCount()];
[cee0b57]631 int FragmentCounter;
632 MoleculeLeafClass *MolecularWalker = NULL;
633 MoleculeLeafClass *Subgraphs = NULL; // list of subgraphs from DFS analysis
634 fstream File;
635 bool FragmentationToDo = true;
[a564be]636 std::deque<bond *> *BackEdgeStack = NULL, *LocalBackEdgeStack = NULL;
[cee0b57]637 bool CheckOrder = false;
638 Graph **FragmentList = NULL;
639 Graph *ParsedFragmentList = NULL;
640 Graph TotalGraph; // graph with all keysets however local numbers
641 int TotalNumberOfKeySets = 0;
642 atom **ListOfAtoms = NULL;
643 atom ***ListOfLocalAtoms = NULL;
644 bool *AtomMask = NULL;
645
[a67d19]646 DoLog(0) && (Log() << Verbose(0) << endl);
[cee0b57]647#ifdef ADDHYDROGEN
[a67d19]648 DoLog(0) && (Log() << Verbose(0) << "I will treat hydrogen special and saturate dangling bonds with it." << endl);
[cee0b57]649#else
[a67d19]650 DoLog(0) && (Log() << Verbose(0) << "Hydrogen is treated just like the rest of the lot." << endl);
[cee0b57]651#endif
652
653 // ++++++++++++++++++++++++++++ INITIAL STUFF: Bond structure analysis, file parsing, ... ++++++++++++++++++++++++++++++++++++++++++
654
655 // ===== 1. Check whether bond structure is same as stored in files ====
656
657 // create lookup table for Atom::nr
[ea7176]658 FragmentationToDo = FragmentationToDo && CreateFatherLookupTable(ListOfAtoms, getAtomCount());
[cee0b57]659
660 // === compare it with adjacency file ===
[35b698]661 FragmentationToDo = FragmentationToDo && CheckAdjacencyFileAgainstMolecule(prefix, ListOfAtoms);
[920c70]662 delete[](ListOfAtoms);
[cee0b57]663
664 // ===== 2. perform a DFS analysis to gather info on cyclic structure and a list of disconnected subgraphs =====
[e138de]665 Subgraphs = DepthFirstSearchAnalysis(BackEdgeStack);
[7218f8]666
[cee0b57]667 // analysis of the cycles (print rings, get minimum cycle length) for each subgraph
[ea7176]668 for(int i=getAtomCount();i--;)
669 MinimumRingSize[i] = getAtomCount();
[cee0b57]670 MolecularWalker = Subgraphs;
[c27778]671 const int LeafCount = Subgraphs->next->Count();
[cee0b57]672 FragmentCounter = 0;
673 while (MolecularWalker->next != NULL) {
674 MolecularWalker = MolecularWalker->next;
[7218f8]675 // fill the bond structure of the individually stored subgraphs
[c27778]676 ListOfAtoms = NULL;
677 MolecularWalker->FillBondStructureFromReference(this, ListOfAtoms, false); // we want to keep the created ListOfLocalAtoms
[a67d19]678 DoLog(0) && (Log() << Verbose(0) << "Analysing the cycles of subgraph " << MolecularWalker->Leaf << " with nr. " << FragmentCounter << "." << endl);
[a564be]679 LocalBackEdgeStack = new std::deque<bond *>; // (MolecularWalker->Leaf->BondCount);
[cee0b57]680// // check the list of local atoms for debugging
[e138de]681// Log() << Verbose(0) << "ListOfLocalAtoms for this subgraph is:" << endl;
[1024cb]682// for (int i=0;i<getAtomCount();i++)
[cee0b57]683// if (ListOfLocalAtoms[FragmentCounter][i] == NULL)
[e138de]684// Log() << Verbose(0) << "\tNULL";
[cee0b57]685// else
[e138de]686// Log() << Verbose(0) << "\t" << ListOfLocalAtoms[FragmentCounter][i]->Name;
[a67d19]687 DoLog(0) && (Log() << Verbose(0) << "Gathering local back edges for subgraph " << MolecularWalker->Leaf << " with nr. " << FragmentCounter << "." << endl);
[c27778]688 MolecularWalker->Leaf->PickLocalBackEdges(ListOfAtoms, BackEdgeStack, LocalBackEdgeStack);
[a67d19]689 DoLog(0) && (Log() << Verbose(0) << "Analysing the cycles of subgraph " << MolecularWalker->Leaf << " with nr. " << FragmentCounter << "." << endl);
[e138de]690 MolecularWalker->Leaf->CyclicStructureAnalysis(LocalBackEdgeStack, MinimumRingSize);
[a67d19]691 DoLog(0) && (Log() << Verbose(0) << "Done with Analysing the cycles of subgraph " << MolecularWalker->Leaf << " with nr. " << FragmentCounter << "." << endl);
[cee0b57]692 delete(LocalBackEdgeStack);
[c27778]693 delete(ListOfAtoms);
694 FragmentCounter++;
[cee0b57]695 }
[7218f8]696 delete(BackEdgeStack);
[cee0b57]697
698 // ===== 3. if structure still valid, parse key set file and others =====
[35b698]699 FragmentationToDo = FragmentationToDo && ParseKeySetFile(prefix, ParsedFragmentList);
[cee0b57]700
701 // ===== 4. check globally whether there's something to do actually (first adaptivity check)
[35b698]702 FragmentationToDo = FragmentationToDo && ParseOrderAtSiteFromFile(prefix);
[cee0b57]703
704 // =================================== Begin of FRAGMENTATION ===============================
705 // ===== 6a. assign each keyset to its respective subgraph =====
[c27778]706 ListOfLocalAtoms = new atom **[LeafCount];
707 for (int i=0;i<LeafCount;i++)
708 ListOfLocalAtoms[i] = NULL;
709 FragmentCounter = 0;
710 Subgraphs->next->AssignKeySetsToFragment(this, ParsedFragmentList, ListOfLocalAtoms, FragmentList, FragmentCounter, true);
711 delete[](ListOfLocalAtoms);
[cee0b57]712
713 // ===== 6b. prepare and go into the adaptive (Order<0), single-step (Order==0) or incremental (Order>0) cycle
714 KeyStack *RootStack = new KeyStack[Subgraphs->next->Count()];
[ea7176]715 AtomMask = new bool[getAtomCount()+1];
716 AtomMask[getAtomCount()] = false;
[cee0b57]717 FragmentationToDo = false; // if CheckOrderAtSite just ones recommends fragmentation, we will save fragments afterwards
[35b698]718 while ((CheckOrder = CheckOrderAtSite(AtomMask, ParsedFragmentList, Order, MinimumRingSize, prefix))) {
[cee0b57]719 FragmentationToDo = FragmentationToDo || CheckOrder;
[ea7176]720 AtomMask[getAtomCount()] = true; // last plus one entry is used as marker that we have been through this loop once already in CheckOrderAtSite()
[cee0b57]721 // ===== 6b. fill RootStack for each subgraph (second adaptivity check) =====
[e138de]722 Subgraphs->next->FillRootStackForSubgraphs(RootStack, AtomMask, (FragmentCounter = 0));
[cee0b57]723
724 // ===== 7. fill the bond fragment list =====
725 FragmentCounter = 0;
726 MolecularWalker = Subgraphs;
727 while (MolecularWalker->next != NULL) {
728 MolecularWalker = MolecularWalker->next;
[a67d19]729 DoLog(1) && (Log() << Verbose(1) << "Fragmenting subgraph " << MolecularWalker << "." << endl);
[266237]730 //MolecularWalker->Leaf->OutputListOfBonds(out); // output atom::ListOfBonds for debugging
[e08c46]731 if (MolecularWalker->Leaf->hasBondStructure()) {
[cee0b57]732 // call BOSSANOVA method
[a67d19]733 DoLog(0) && (Log() << Verbose(0) << endl << " ========== BOND ENERGY of subgraph " << FragmentCounter << " ========================= " << endl);
[e138de]734 MolecularWalker->Leaf->FragmentBOSSANOVA(FragmentList[FragmentCounter], RootStack[FragmentCounter], MinimumRingSize);
[cee0b57]735 } else {
[58ed4a]736 DoeLog(1) && (eLog()<< Verbose(1) << "Subgraph " << MolecularWalker << " has no atoms!" << endl);
[cee0b57]737 }
738 FragmentCounter++; // next fragment list
739 }
740 }
[a67d19]741 DoLog(2) && (Log() << Verbose(2) << "CheckOrder is " << CheckOrder << "." << endl);
[cee0b57]742 delete[](RootStack);
743 delete[](AtomMask);
744 delete(ParsedFragmentList);
745 delete[](MinimumRingSize);
746
747 // ==================================== End of FRAGMENTATION ============================================
748
749 // ===== 8a. translate list into global numbers (i.e. ones that are valid in "this" molecule, not in MolecularWalker->Leaf)
[e138de]750 Subgraphs->next->TranslateIndicesToGlobalIDs(FragmentList, (FragmentCounter = 0), TotalNumberOfKeySets, TotalGraph);
[cee0b57]751
752 // free subgraph memory again
753 FragmentCounter = 0;
[00b59d5]754 while (Subgraphs != NULL) {
755 // remove entry in fragment list
756 // remove subgraph fragment
757 MolecularWalker = Subgraphs->next;
[cee0b57]758 delete(Subgraphs);
[00b59d5]759 Subgraphs = MolecularWalker;
[cee0b57]760 }
[00b59d5]761 // free fragment list
762 for (int i=0; i< FragmentCounter; ++i )
763 delete(FragmentList[i]);
[920c70]764 delete[](FragmentList);
[cee0b57]765
[00b59d5]766 DoLog(0) && (Log() << Verbose(0) << FragmentCounter-1 << " subgraph fragments have been removed." << std::endl);
767
[cee0b57]768 // ===== 8b. gather keyset lists (graphs) from all subgraphs and transform into MoleculeListClass =====
769 //if (FragmentationToDo) { // we should always store the fragments again as coordination might have changed slightly without changing bond structure
[7218f8]770 // allocate memory for the pointer array and transmorph graphs into full molecular fragments
[23b547]771 BondFragments = new MoleculeListClass(World::getPointer());
[7218f8]772 int k=0;
773 for(Graph::iterator runner = TotalGraph.begin(); runner != TotalGraph.end(); runner++) {
774 KeySet test = (*runner).first;
[a67d19]775 DoLog(0) && (Log() << Verbose(0) << "Fragment No." << (*runner).second.first << " with TEFactor " << (*runner).second.second << "." << endl);
[35b698]776 BondFragments->insert(StoreFragmentFromKeySet(test, World::getInstance().getConfig()));
[7218f8]777 k++;
778 }
[a67d19]779 DoLog(0) && (Log() << Verbose(0) << k << "/" << BondFragments->ListOfMolecules.size() << " fragments generated from the keysets." << endl);
[cee0b57]780
[7218f8]781 // ===== 9. Save fragments' configuration and keyset files et al to disk ===
782 if (BondFragments->ListOfMolecules.size() != 0) {
783 // create the SortIndex from BFS labels to order in the config file
[42af9e]784 int *SortIndex = NULL;
[e138de]785 CreateMappingLabelsToConfigSequence(SortIndex);
[cee0b57]786
[a67d19]787 DoLog(1) && (Log() << Verbose(1) << "Writing " << BondFragments->ListOfMolecules.size() << " possible bond fragmentation configs" << endl);
[35b698]788 if (BondFragments->OutputConfigForListOfFragments(prefix, SortIndex))
[a67d19]789 DoLog(1) && (Log() << Verbose(1) << "All configs written." << endl);
[7218f8]790 else
[a67d19]791 DoLog(1) && (Log() << Verbose(1) << "Some config writing failed." << endl);
[cee0b57]792
[7218f8]793 // store force index reference file
[35b698]794 BondFragments->StoreForcesFile(prefix, SortIndex);
[cee0b57]795
[7218f8]796 // store keysets file
[35b698]797 StoreKeySetFile(TotalGraph, prefix);
[cee0b57]798
[920c70]799 {
800 // store Adjacency file
[35b698]801 std::string filename = prefix + ADJACENCYFILE;
802 StoreAdjacencyToFile(filename);
[920c70]803 }
[cee0b57]804
[7218f8]805 // store Hydrogen saturation correction file
[35b698]806 BondFragments->AddHydrogenCorrection(prefix);
[cee0b57]807
[7218f8]808 // store adaptive orders into file
[35b698]809 StoreOrderAtSiteFile(prefix);
[cee0b57]810
[7218f8]811 // restore orbital and Stop values
[35b698]812 //CalculateOrbitals(*configuration);
[cee0b57]813
[7218f8]814 // free memory for bond part
[a67d19]815 DoLog(1) && (Log() << Verbose(1) << "Freeing bond memory" << endl);
[920c70]816 delete[](SortIndex);
[7218f8]817 } else {
[a67d19]818 DoLog(1) && (Log() << Verbose(1) << "FragmentList is zero on return, splitting failed." << endl);
[7218f8]819 }
[00b59d5]820 // remove all create molecules again from the World including their atoms
821 for (MoleculeList::iterator iter = BondFragments->ListOfMolecules.begin();
822 !BondFragments->ListOfMolecules.empty();
823 iter = BondFragments->ListOfMolecules.begin()) {
824 // remove copied atoms and molecule again
825 molecule *mol = *iter;
826 mol->removeAtomsinMolecule();
827 World::getInstance().destroyMolecule(mol);
828 BondFragments->ListOfMolecules.erase(iter);
829 }
[7218f8]830 delete(BondFragments);
[a67d19]831 DoLog(0) && (Log() << Verbose(0) << "End of bond fragmentation." << endl);
[cee0b57]832
833 return ((int)(!FragmentationToDo)+1); // 1 - continue, 2 - stop (no fragmentation occured)
834};
835
836
837/** Stores pairs (Atom::nr, Atom::AdaptiveOrder) into file.
838 * Atoms not present in the file get "-1".
[35b698]839 * \param &path path to file ORDERATSITEFILE
[cee0b57]840 * \return true - file writable, false - not writable
841 */
[35b698]842bool molecule::StoreOrderAtSiteFile(std::string &path)
[cee0b57]843{
[35b698]844 string line;
[cee0b57]845 ofstream file;
846
[35b698]847 line = path + ORDERATSITEFILE;
848 file.open(line.c_str());
[a67d19]849 DoLog(1) && (Log() << Verbose(1) << "Writing OrderAtSite " << ORDERATSITEFILE << " ... " << endl);
[35b698]850 if (file.good()) {
[c743f8]851 for_each(atoms.begin(),atoms.end(),bind2nd(mem_fun(&atom::OutputOrder), &file));
[cee0b57]852 file.close();
[a67d19]853 DoLog(1) && (Log() << Verbose(1) << "done." << endl);
[cee0b57]854 return true;
855 } else {
[35b698]856 DoLog(1) && (Log() << Verbose(1) << "failed to open file " << line << "." << endl);
[cee0b57]857 return false;
858 }
859};
860
861/** Parses pairs(Atom::nr, Atom::AdaptiveOrder) from file and stores in molecule's Atom's.
862 * Atoms not present in the file get "0".
[35b698]863 * \param &path path to file ORDERATSITEFILEe
[cee0b57]864 * \return true - file found and scanned, false - file not found
865 * \sa ParseKeySetFile() and CheckAdjacencyFileAgainstMolecule() as this is meant to be used in conjunction with the two
866 */
[35b698]867bool molecule::ParseOrderAtSiteFromFile(std::string &path)
[cee0b57]868{
[1024cb]869 unsigned char *OrderArray = new unsigned char[getAtomCount()];
870 bool *MaxArray = new bool[getAtomCount()];
[cee0b57]871 bool status;
872 int AtomNr, value;
[35b698]873 string line;
[cee0b57]874 ifstream file;
875
[1024cb]876 for(int i=0;i<getAtomCount();i++) {
[920c70]877 OrderArray[i] = 0;
878 MaxArray[i] = false;
879 }
880
[a67d19]881 DoLog(1) && (Log() << Verbose(1) << "Begin of ParseOrderAtSiteFromFile" << endl);
[35b698]882 line = path + ORDERATSITEFILE;
883 file.open(line.c_str());
884 if (file.good()) {
[cee0b57]885 while (!file.eof()) { // parse from file
886 AtomNr = -1;
887 file >> AtomNr;
888 if (AtomNr != -1) { // test whether we really parsed something (this is necessary, otherwise last atom is set twice and to 0 on second time)
889 file >> value;
890 OrderArray[AtomNr] = value;
891 file >> value;
892 MaxArray[AtomNr] = value;
[e138de]893 //Log() << Verbose(2) << "AtomNr " << AtomNr << " with order " << (int)OrderArray[AtomNr] << " and max order set to " << (int)MaxArray[AtomNr] << "." << endl;
[cee0b57]894 }
895 }
896 file.close();
[5034e1]897
898 // set atom values
[32ea56]899 for(internal_iterator iter=atoms.begin();iter!=atoms.end();++iter){
900 (*iter)->AdaptiveOrder = OrderArray[(*iter)->nr];
901 (*iter)->MaxOrder = MaxArray[(*iter)->nr];
902 }
903 //SetAtomValueToIndexedArray( OrderArray, &atom::nr, &atom::AdaptiveOrder );
904 //SetAtomValueToIndexedArray( MaxArray, &atom::nr, &atom::MaxOrder );
[5034e1]905
[0de7e8]906 DoLog(1) && (Log() << Verbose(1) << "\t ... done." << endl);
[cee0b57]907 status = true;
908 } else {
[35b698]909 DoLog(1) && (Log() << Verbose(1) << "\t ... failed to open file " << line << "." << endl);
[cee0b57]910 status = false;
911 }
[920c70]912 delete[](OrderArray);
913 delete[](MaxArray);
[cee0b57]914
[a67d19]915 DoLog(1) && (Log() << Verbose(1) << "End of ParseOrderAtSiteFromFile" << endl);
[cee0b57]916 return status;
917};
918
919
920
[a564be]921/** Looks through a std::deque<atom *> and returns the likeliest removal candiate.
[cee0b57]922 * \param *out output stream for debugging messages
923 * \param *&Leaf KeySet to look through
924 * \param *&ShortestPathList list of the shortest path to decide which atom to suggest as removal candidate in the end
925 * \param index of the atom suggested for removal
926 */
[e138de]927int molecule::LookForRemovalCandidate(KeySet *&Leaf, int *&ShortestPathList)
[cee0b57]928{
929 atom *Runner = NULL;
930 int SP, Removal;
931
[a67d19]932 DoLog(2) && (Log() << Verbose(2) << "Looking for removal candidate." << endl);
[cee0b57]933 SP = -1; //0; // not -1, so that Root is never removed
934 Removal = -1;
935 for (KeySet::iterator runner = Leaf->begin(); runner != Leaf->end(); runner++) {
936 Runner = FindAtom((*runner));
[83f176]937 if (Runner->getType()->getAtomicNumber() != 1) { // skip all those added hydrogens when re-filling snake stack
[cee0b57]938 if (ShortestPathList[(*runner)] > SP) { // remove the oldest one with longest shortest path
939 SP = ShortestPathList[(*runner)];
940 Removal = (*runner);
941 }
942 }
943 }
944 return Removal;
945};
946
[5034e1]947/** Initializes some value for putting fragment of \a *mol into \a *Leaf.
948 * \param *mol total molecule
949 * \param *Leaf fragment molecule
[cee0b57]950 * \param &Leaflet pointer to KeySet structure
[7218f8]951 * \param **SonList calloc'd list which atom of \a *Leaf is a son of which atom in \a *mol
[5034e1]952 * \return number of atoms in fragment
[cee0b57]953 */
[5034e1]954int StoreFragmentFromKeySet_Init(molecule *mol, molecule *Leaf, KeySet &Leaflet, atom **SonList)
[cee0b57]955{
[5034e1]956 atom *FatherOfRunner = NULL;
[cee0b57]957
[5034e1]958 Leaf->BondDistance = mol->BondDistance;
[cee0b57]959
960 // first create the minimal set of atoms from the KeySet
[5034e1]961 int size = 0;
[cee0b57]962 for(KeySet::iterator runner = Leaflet.begin(); runner != Leaflet.end(); runner++) {
[5034e1]963 FatherOfRunner = mol->FindAtom((*runner)); // find the id
[cee0b57]964 SonList[FatherOfRunner->nr] = Leaf->AddCopyAtom(FatherOfRunner);
965 size++;
966 }
[5034e1]967 return size;
968};
[cee0b57]969
[5034e1]970/** Creates an induced subgraph out of a fragmental key set, adding bonds and hydrogens (if treated specially).
971 * \param *out output stream for debugging messages
972 * \param *mol total molecule
973 * \param *Leaf fragment molecule
974 * \param IsAngstroem whether we have Ansgtroem or bohrradius
975 * \param **SonList list which atom of \a *Leaf is a son of which atom in \a *mol
976 */
[e138de]977void CreateInducedSubgraphOfFragment(molecule *mol, molecule *Leaf, atom **SonList, bool IsAngstroem)
[5034e1]978{
979 bool LonelyFlag = false;
980 atom *OtherFather = NULL;
981 atom *FatherOfRunner = NULL;
982
[9879f6]983#ifdef ADDHYDROGEN
984 molecule::const_iterator runner;
985#endif
[a7b761b]986 // we increment the iter just before skipping the hydrogen
987 for (molecule::const_iterator iter = Leaf->begin(); iter != Leaf->end();) {
[cee0b57]988 LonelyFlag = true;
[9879f6]989 FatherOfRunner = (*iter)->father;
[a7b761b]990 ASSERT(FatherOfRunner,"Atom without father found");
[cee0b57]991 if (SonList[FatherOfRunner->nr] != NULL) { // check if this, our father, is present in list
992 // create all bonds
[266237]993 for (BondList::const_iterator BondRunner = FatherOfRunner->ListOfBonds.begin(); BondRunner != FatherOfRunner->ListOfBonds.end(); (++BondRunner)) {
994 OtherFather = (*BondRunner)->GetOtherAtom(FatherOfRunner);
[e138de]995// Log() << Verbose(2) << "Father " << *FatherOfRunner << " of son " << *SonList[FatherOfRunner->nr] << " is bound to " << *OtherFather;
[cee0b57]996 if (SonList[OtherFather->nr] != NULL) {
[e138de]997// Log() << Verbose(0) << ", whose son is " << *SonList[OtherFather->nr] << "." << endl;
[cee0b57]998 if (OtherFather->nr > FatherOfRunner->nr) { // add bond (nr check is for adding only one of both variants: ab, ba)
[e138de]999// Log() << Verbose(3) << "Adding Bond: ";
1000// Log() << Verbose(0) <<
[9879f6]1001 Leaf->AddBond((*iter), SonList[OtherFather->nr], (*BondRunner)->BondDegree);
[e138de]1002// Log() << Verbose(0) << "." << endl;
[9879f6]1003 //NumBonds[(*iter)->nr]++;
[cee0b57]1004 } else {
[e138de]1005// Log() << Verbose(3) << "Not adding bond, labels in wrong order." << endl;
[cee0b57]1006 }
1007 LonelyFlag = false;
1008 } else {
[e138de]1009// Log() << Verbose(0) << ", who has no son in this fragment molecule." << endl;
[cee0b57]1010#ifdef ADDHYDROGEN
[9879f6]1011 //Log() << Verbose(3) << "Adding Hydrogen to " << (*iter)->Name << " and a bond in between." << endl;
1012 if(!Leaf->AddHydrogenReplacementAtom((*BondRunner), (*iter), FatherOfRunner, OtherFather, IsAngstroem))
[cee0b57]1013 exit(1);
1014#endif
[9879f6]1015 //NumBonds[(*iter)->nr] += Binder->BondDegree;
[cee0b57]1016 }
1017 }
1018 } else {
[a7b761b]1019 DoeLog(1) && (eLog()<< Verbose(1) << "Son " << (*iter)->getName() << " has father " << FatherOfRunner->getName() << " but its entry in SonList is " << SonList[FatherOfRunner->nr] << "!" << endl);
[cee0b57]1020 }
[ea7176]1021 if ((LonelyFlag) && (Leaf->getAtomCount() > 1)) {
[a7b761b]1022 DoLog(0) && (Log() << Verbose(0) << **iter << "has got bonds only to hydrogens!" << endl);
[cee0b57]1023 }
[a7b761b]1024 ++iter;
[cee0b57]1025#ifdef ADDHYDROGEN
[83f176]1026 while ((iter != Leaf->end()) && ((*iter)->getType()->getAtomicNumber() == 1)){ // skip added hydrogen
[9879f6]1027 iter++;
[a7b761b]1028 }
[cee0b57]1029#endif
1030 }
[5034e1]1031};
1032
1033/** Stores a fragment from \a KeySet into \a molecule.
1034 * First creates the minimal set of atoms from the KeySet, then creates the bond structure from the complete
1035 * molecule and adds missing hydrogen where bonds were cut.
1036 * \param *out output stream for debugging messages
1037 * \param &Leaflet pointer to KeySet structure
1038 * \param IsAngstroem whether we have Ansgtroem or bohrradius
1039 * \return pointer to constructed molecule
1040 */
[e138de]1041molecule * molecule::StoreFragmentFromKeySet(KeySet &Leaflet, bool IsAngstroem)
[5034e1]1042{
[1024cb]1043 atom **SonList = new atom*[getAtomCount()];
[23b547]1044 molecule *Leaf = World::getInstance().createMolecule();
[5034e1]1045
[1024cb]1046 for(int i=0;i<getAtomCount();i++)
[920c70]1047 SonList[i] = NULL;
1048
[e138de]1049// Log() << Verbose(1) << "Begin of StoreFragmentFromKeyset." << endl;
[5034e1]1050 StoreFragmentFromKeySet_Init(this, Leaf, Leaflet, SonList);
1051 // create the bonds between all: Make it an induced subgraph and add hydrogen
[e138de]1052// Log() << Verbose(2) << "Creating bonds from father graph (i.e. induced subgraph creation)." << endl;
1053 CreateInducedSubgraphOfFragment(this, Leaf, SonList, IsAngstroem);
[5034e1]1054
[cee0b57]1055 //Leaflet->Leaf->ScanForPeriodicCorrection(out);
[920c70]1056 delete[](SonList);
[e138de]1057// Log() << Verbose(1) << "End of StoreFragmentFromKeyset." << endl;
[cee0b57]1058 return Leaf;
1059};
1060
[d2943b]1061
1062/** Clears the touched list
1063 * \param *out output stream for debugging
1064 * \param verbosity verbosity level
1065 * \param *&TouchedList touched list
1066 * \param SubOrder current suborder
1067 * \param TouchedIndex currently touched
1068 */
[e138de]1069void SPFragmentGenerator_ClearingTouched(int verbosity, int *&TouchedList, int SubOrder, int &TouchedIndex)
[d2943b]1070{
[e138de]1071 Log() << Verbose(1+verbosity) << "Clearing touched list." << endl;
[d2943b]1072 for (TouchedIndex=SubOrder+1;TouchedIndex--;) // empty touched list
1073 TouchedList[TouchedIndex] = -1;
1074 TouchedIndex = 0;
1075
1076}
1077
1078/** Adds the current combination of the power set to the snake stack.
1079 * \param *out output stream for debugging
1080 * \param verbosity verbosity level
1081 * \param CurrentCombination
1082 * \param SetDimension maximum number of bits in power set
1083 * \param *FragmentSet snake stack to remove from
1084 * \param *&TouchedList touched list
1085 * \param TouchedIndex currently touched
1086 * \return number of set bits
1087 */
[e138de]1088int AddPowersetToSnakeStack(int verbosity, int CurrentCombination, int SetDimension, KeySet *FragmentSet, bond **BondsSet, int *&TouchedList, int &TouchedIndex)
[d2943b]1089{
1090 atom *OtherWalker = NULL;
1091 bool bit = false;
1092 KeySetTestPair TestKeySetInsert;
1093
1094 int Added = 0;
1095 for (int j=0;j<SetDimension;j++) { // pull out every bit by shifting
1096 bit = ((CurrentCombination & (1 << j)) != 0); // mask the bit for the j-th bond
1097 if (bit) { // if bit is set, we add this bond partner
1098 OtherWalker = BondsSet[j]->rightatom; // rightatom is always the one more distant, i.e. the one to add
[e138de]1099 //Log() << Verbose(1+verbosity) << "Current Bond is " << BondsSet[j] << ", checking on " << *OtherWalker << "." << endl;
1100 Log() << Verbose(2+verbosity) << "Adding " << *OtherWalker << " with nr " << OtherWalker->nr << "." << endl;
[d2943b]1101 TestKeySetInsert = FragmentSet->insert(OtherWalker->nr);
1102 if (TestKeySetInsert.second) {
1103 TouchedList[TouchedIndex++] = OtherWalker->nr; // note as added
1104 Added++;
1105 } else {
[e138de]1106 Log() << Verbose(2+verbosity) << "This was item was already present in the keyset." << endl;
[d2943b]1107 }
1108 } else {
[e138de]1109 Log() << Verbose(2+verbosity) << "Not adding." << endl;
[d2943b]1110 }
1111 }
1112 return Added;
1113};
1114
1115/** Counts the number of elements in a power set.
1116 * \param *SetFirst
1117 * \param *SetLast
1118 * \param *&TouchedList touched list
1119 * \param TouchedIndex currently touched
1120 * \return number of elements
1121 */
1122int CountSetMembers(bond *SetFirst, bond *SetLast, int *&TouchedList, int TouchedIndex)
1123{
1124 int SetDimension = 0;
1125 bond *Binder = SetFirst; // start node for this level
1126 while (Binder->next != SetLast) { // compare to end node of this level
1127 Binder = Binder->next;
1128 for (int k=TouchedIndex;k--;) {
1129 if (Binder->Contains(TouchedList[k])) // if we added this very endpiece
1130 SetDimension++;
1131 }
1132 }
1133 return SetDimension;
1134};
1135
1136/** Counts the number of elements in a power set.
1137 * \param *BondsList bonds list to fill
1138 * \param *SetFirst
1139 * \param *SetLast
1140 * \param *&TouchedList touched list
1141 * \param TouchedIndex currently touched
1142 * \return number of elements
1143 */
1144int FillBondsList(bond **BondsList, bond *SetFirst, bond *SetLast, int *&TouchedList, int TouchedIndex)
1145{
1146 int SetDimension = 0;
1147 bond *Binder = SetFirst; // start node for this level
1148 while (Binder->next != SetLast) { // compare to end node of this level
1149 Binder = Binder->next;
1150 for (int k=0;k<TouchedIndex;k++) {
1151 if (Binder->leftatom->nr == TouchedList[k]) // leftatom is always the close one
1152 BondsList[SetDimension++] = Binder;
1153 }
1154 }
1155 return SetDimension;
1156};
1157
1158/** Remove all items that were added on this SP level.
1159 * \param *out output stream for debugging
1160 * \param verbosity verbosity level
1161 * \param *FragmentSet snake stack to remove from
1162 * \param *&TouchedList touched list
1163 * \param TouchedIndex currently touched
1164 */
[e138de]1165void RemoveAllTouchedFromSnakeStack(int verbosity, KeySet *FragmentSet, int *&TouchedList, int &TouchedIndex)
[d2943b]1166{
1167 int Removal = 0;
1168 for(int j=0;j<TouchedIndex;j++) {
1169 Removal = TouchedList[j];
[e138de]1170 Log() << Verbose(2+verbosity) << "Removing item nr. " << Removal << " from snake stack." << endl;
[d2943b]1171 FragmentSet->erase(Removal);
1172 TouchedList[j] = -1;
1173 }
[a67d19]1174 DoLog(2) && (Log() << Verbose(2) << "Remaining local nr.s on snake stack are: ");
[d2943b]1175 for(KeySet::iterator runner = FragmentSet->begin(); runner != FragmentSet->end(); runner++)
[a67d19]1176 DoLog(0) && (Log() << Verbose(0) << (*runner) << " ");
1177 DoLog(0) && (Log() << Verbose(0) << endl);
[d2943b]1178 TouchedIndex = 0; // set Index to 0 for list of atoms added on this level
1179};
1180
[cee0b57]1181/** From a given set of Bond sorted by Shortest Path distance, create all possible fragments of size \a SetDimension.
1182 * -# loops over every possible combination (2^dimension of edge set)
1183 * -# inserts current set, if there's still space left
1184 * -# yes: calls SPFragmentGenerator with structure, created new edge list and size respective to root dist
1185ance+1
1186 * -# no: stores fragment into keyset list by calling InsertFragmentIntoGraph
1187 * -# removes all items added into the snake stack (in UniqueFragments structure) added during level (root
1188distance) and current set
1189 * \param *out output stream for debugging
1190 * \param FragmentSearch UniqueFragments structure with all values needed
1191 * \param RootDistance current shortest path level, whose set of edges is represented by **BondsSet
1192 * \param SetDimension Number of possible bonds on this level (i.e. size of the array BondsSet[])
1193 * \param SubOrder remaining number of allowed vertices to add
1194 */
[e138de]1195void molecule::SPFragmentGenerator(struct UniqueFragments *FragmentSearch, int RootDistance, bond **BondsSet, int SetDimension, int SubOrder)
[cee0b57]1196{
1197 int verbosity = 0; //FragmentSearch->ANOVAOrder-SubOrder;
1198 int NumCombinations;
1199 int bits, TouchedIndex, SubSetDimension, SP, Added;
1200 int SpaceLeft;
[920c70]1201 int *TouchedList = new int[SubOrder + 1];
[cee0b57]1202 KeySetTestPair TestKeySetInsert;
1203
1204 NumCombinations = 1 << SetDimension;
1205
[266237]1206 // here for all bonds of Walker all combinations of end pieces (from the bonds)
1207 // have to be added and for the remaining ANOVA order GraphCrawler be called
1208 // recursively for the next level
[cee0b57]1209
[e138de]1210 Log() << Verbose(1+verbosity) << "Begin of SPFragmentGenerator." << endl;
1211 Log() << Verbose(1+verbosity) << "We are " << RootDistance << " away from Root, which is " << *FragmentSearch->Root << ", SubOrder is " << SubOrder << ", SetDimension is " << SetDimension << " and this means " << NumCombinations-1 << " combination(s)." << endl;
[cee0b57]1212
1213 // initialised touched list (stores added atoms on this level)
[e138de]1214 SPFragmentGenerator_ClearingTouched(verbosity, TouchedList, SubOrder, TouchedIndex);
[cee0b57]1215
1216 // create every possible combination of the endpieces
[e138de]1217 Log() << Verbose(1+verbosity) << "Going through all combinations of the power set." << endl;
[cee0b57]1218 for (int i=1;i<NumCombinations;i++) { // sweep through all power set combinations (skip empty set!)
1219 // count the set bit of i
1220 bits = 0;
1221 for (int j=SetDimension;j--;)
1222 bits += (i & (1 << j)) >> j;
1223
[e138de]1224 Log() << Verbose(1+verbosity) << "Current set is " << Binary(i | (1 << SetDimension)) << ", number of bits is " << bits << "." << endl;
[cee0b57]1225 if (bits <= SubOrder) { // if not greater than additional atoms allowed on stack, continue
1226 // --1-- add this set of the power set of bond partners to the snake stack
[e138de]1227 Added = AddPowersetToSnakeStack(verbosity, i, SetDimension, FragmentSearch->FragmentSet, BondsSet, TouchedList, TouchedIndex);
[cee0b57]1228
1229 SpaceLeft = SubOrder - Added ;// SubOrder - bits; // due to item's maybe being already present, this does not work anymore
1230 if (SpaceLeft > 0) {
[e138de]1231 Log() << Verbose(1+verbosity) << "There's still some space left on stack: " << SpaceLeft << "." << endl;
[cee0b57]1232 if (SubOrder > 1) { // Due to Added above we have to check extra whether we're not already reaching beyond the desired Order
1233 // --2-- look at all added end pieces of this combination, construct bond subsets and sweep through a power set of these by recursion
1234 SP = RootDistance+1; // this is the next level
[d2943b]1235
[cee0b57]1236 // first count the members in the subset
[d2943b]1237 SubSetDimension = CountSetMembers(FragmentSearch->BondsPerSPList[2*SP], FragmentSearch->BondsPerSPList[2*SP+1], TouchedList, TouchedIndex);
1238
[cee0b57]1239 // then allocate and fill the list
[920c70]1240 bond *BondsList[SubSetDimension];
[d2943b]1241 SubSetDimension = FillBondsList(BondsList, FragmentSearch->BondsPerSPList[2*SP], FragmentSearch->BondsPerSPList[2*SP+1], TouchedList, TouchedIndex);
1242
1243 // then iterate
[e138de]1244 Log() << Verbose(2+verbosity) << "Calling subset generator " << SP << " away from root " << *FragmentSearch->Root << " with sub set dimension " << SubSetDimension << "." << endl;
1245 SPFragmentGenerator(FragmentSearch, SP, BondsList, SubSetDimension, SubOrder-bits);
[cee0b57]1246 }
1247 } else {
1248 // --2-- otherwise store the complete fragment
[e138de]1249 Log() << Verbose(1+verbosity) << "Enough items on stack for a fragment!" << endl;
[cee0b57]1250 // store fragment as a KeySet
[a67d19]1251 DoLog(2) && (Log() << Verbose(2) << "Found a new fragment[" << FragmentSearch->FragmentCounter << "], local nr.s are: ");
[cee0b57]1252 for(KeySet::iterator runner = FragmentSearch->FragmentSet->begin(); runner != FragmentSearch->FragmentSet->end(); runner++)
[a67d19]1253 DoLog(0) && (Log() << Verbose(0) << (*runner) << " ");
1254 DoLog(0) && (Log() << Verbose(0) << endl);
[e138de]1255 //if (!CheckForConnectedSubgraph(FragmentSearch->FragmentSet))
[58ed4a]1256 //DoeLog(1) && (eLog()<< Verbose(1) << "The found fragment is not a connected subgraph!" << endl);
[e138de]1257 InsertFragmentIntoGraph(FragmentSearch);
[cee0b57]1258 }
1259
1260 // --3-- remove all added items in this level from snake stack
[e138de]1261 Log() << Verbose(1+verbosity) << "Removing all items that were added on this SP level " << RootDistance << "." << endl;
1262 RemoveAllTouchedFromSnakeStack(verbosity, FragmentSearch->FragmentSet, TouchedList, TouchedIndex);
[cee0b57]1263 } else {
[e138de]1264 Log() << Verbose(2+verbosity) << "More atoms to add for this set (" << bits << ") than space left on stack " << SubOrder << ", skipping this set." << endl;
[cee0b57]1265 }
1266 }
[920c70]1267 delete[](TouchedList);
[e138de]1268 Log() << Verbose(1+verbosity) << "End of SPFragmentGenerator, " << RootDistance << " away from Root " << *FragmentSearch->Root << " and SubOrder is " << SubOrder << "." << endl;
[cee0b57]1269};
1270
[407536]1271/** Allocates memory for UniqueFragments::BondsPerSPList.
1272 * \param *out output stream
1273 * \param Order bond order (limits BFS exploration and "number of digits" in power set generation
1274 * \param FragmentSearch UniqueFragments
1275 * \sa FreeSPList()
1276 */
[e138de]1277void InitialiseSPList(int Order, struct UniqueFragments &FragmentSearch)
[407536]1278{
[920c70]1279 FragmentSearch.BondsPerSPList = new bond* [Order * 2];
1280 FragmentSearch.BondsPerSPCount = new int[Order];
[407536]1281 for (int i=Order;i--;) {
1282 FragmentSearch.BondsPerSPList[2*i] = new bond(); // start node
1283 FragmentSearch.BondsPerSPList[2*i+1] = new bond(); // end node
1284 FragmentSearch.BondsPerSPList[2*i]->next = FragmentSearch.BondsPerSPList[2*i+1]; // intertwine these two
1285 FragmentSearch.BondsPerSPList[2*i+1]->previous = FragmentSearch.BondsPerSPList[2*i];
1286 FragmentSearch.BondsPerSPCount[i] = 0;
1287 }
1288};
1289
1290/** Free's memory for for UniqueFragments::BondsPerSPList.
1291 * \param *out output stream
1292 * \param Order bond order (limits BFS exploration and "number of digits" in power set generation
1293 * \param FragmentSearch UniqueFragments\
1294 * \sa InitialiseSPList()
1295 */
[e138de]1296void FreeSPList(int Order, struct UniqueFragments &FragmentSearch)
[407536]1297{
[920c70]1298 delete[](FragmentSearch.BondsPerSPCount);
[407536]1299 for (int i=Order;i--;) {
1300 delete(FragmentSearch.BondsPerSPList[2*i]);
1301 delete(FragmentSearch.BondsPerSPList[2*i+1]);
1302 }
[920c70]1303 delete[](FragmentSearch.BondsPerSPList);
[407536]1304};
1305
1306/** Sets FragmenSearch to initial value.
[14e73a]1307 * Sets UniqueFragments::ShortestPathList entries to zero, UniqueFragments::BondsPerSPCount to zero (except zero level to 1) and
1308 * adds initial bond UniqueFragments::Root to UniqueFragments::Root to UniqueFragments::BondsPerSPList
1309 * \param *out output stream
[cee0b57]1310 * \param Order bond order (limits BFS exploration and "number of digits" in power set generation
[14e73a]1311 * \param FragmentSearch UniqueFragments
1312 * \sa FreeSPList()
[cee0b57]1313 */
[e138de]1314void SetSPList(int Order, struct UniqueFragments &FragmentSearch)
[cee0b57]1315{
1316 // prepare Label and SP arrays of the BFS search
1317 FragmentSearch.ShortestPathList[FragmentSearch.Root->nr] = 0;
1318
1319 // prepare root level (SP = 0) and a loop bond denoting Root
[93d120]1320 for (int i=Order;i--;)
[cee0b57]1321 FragmentSearch.BondsPerSPCount[i] = 0;
1322 FragmentSearch.BondsPerSPCount[0] = 1;
[14e73a]1323 bond *Binder = new bond(FragmentSearch.Root, FragmentSearch.Root);
[cee0b57]1324 add(Binder, FragmentSearch.BondsPerSPList[1]);
[14e73a]1325};
[cee0b57]1326
[14e73a]1327/** Resets UniqueFragments::ShortestPathList and cleans bonds from UniqueFragments::BondsPerSPList.
1328 * \param *out output stream
1329 * \param Order bond order (limits BFS exploration and "number of digits" in power set generation
1330 * \param FragmentSearch UniqueFragments
1331 * \sa InitialiseSPList()
1332 */
[e138de]1333void ResetSPList(int Order, struct UniqueFragments &FragmentSearch)
[14e73a]1334{
1335 bond *Binder = NULL;
[a67d19]1336 DoLog(0) && (Log() << Verbose(0) << "Free'ing all found lists. and resetting index lists" << endl);
[14e73a]1337 for(int i=Order;i--;) {
[a67d19]1338 DoLog(1) && (Log() << Verbose(1) << "Current SP level is " << i << ": ");
[14e73a]1339 Binder = FragmentSearch.BondsPerSPList[2*i];
1340 while (Binder->next != FragmentSearch.BondsPerSPList[2*i+1]) {
1341 Binder = Binder->next;
[e138de]1342 // Log() << Verbose(0) << "Removing atom " << Binder->leftatom->nr << " and " << Binder->rightatom->nr << "." << endl; // make sure numbers are local
[14e73a]1343 FragmentSearch.ShortestPathList[Binder->leftatom->nr] = -1;
1344 FragmentSearch.ShortestPathList[Binder->rightatom->nr] = -1;
1345 }
1346 // delete added bonds
1347 cleanup(FragmentSearch.BondsPerSPList[2*i], FragmentSearch.BondsPerSPList[2*i+1]);
1348 // also start and end node
[a67d19]1349 DoLog(0) && (Log() << Verbose(0) << "cleaned." << endl);
[14e73a]1350 }
1351};
1352
1353
1354/** Fills the Bonds per Shortest Path List and set the vertex labels.
1355 * \param *out output stream
1356 * \param Order bond order (limits BFS exploration and "number of digits" in power set generation
1357 * \param FragmentSearch UniqueFragments
1358 * \param *mol molecule with atoms and bonds
1359 * \param RestrictedKeySet Restricted vertex set to use in context of molecule
1360 */
[e138de]1361void FillSPListandLabelVertices(int Order, struct UniqueFragments &FragmentSearch, molecule *mol, KeySet RestrictedKeySet)
[14e73a]1362{
[cee0b57]1363 // Actually, we should construct a spanning tree vom the root atom and select all edges therefrom and put them into
1364 // according shortest path lists. However, we don't. Rather we fill these lists right away, as they do form a spanning
1365 // tree already sorted into various SP levels. That's why we just do loops over the depth (CurrentSP) and breadth
1366 // (EdgeinSPLevel) of this tree ...
1367 // In another picture, the bonds always contain a direction by rightatom being the one more distant from root and hence
1368 // naturally leftatom forming its predecessor, preventing the BFS"seeker" from continuing in the wrong direction.
[14e73a]1369 int AtomKeyNr = -1;
1370 atom *Walker = NULL;
1371 atom *OtherWalker = NULL;
1372 atom *Predecessor = NULL;
1373 bond *CurrentEdge = NULL;
[266237]1374 bond *Binder = NULL;
[14e73a]1375 int RootKeyNr = FragmentSearch.Root->GetTrueFather()->nr;
1376 int RemainingWalkers = -1;
1377 int SP = -1;
1378
[a67d19]1379 DoLog(0) && (Log() << Verbose(0) << "Starting BFS analysis ..." << endl);
[cee0b57]1380 for (SP = 0; SP < (Order-1); SP++) {
[a67d19]1381 DoLog(1) && (Log() << Verbose(1) << "New SP level reached: " << SP << ", creating new SP list with " << FragmentSearch.BondsPerSPCount[SP] << " item(s)");
[cee0b57]1382 if (SP > 0) {
[a67d19]1383 DoLog(0) && (Log() << Verbose(0) << ", old level closed with " << FragmentSearch.BondsPerSPCount[SP-1] << " item(s)." << endl);
[cee0b57]1384 FragmentSearch.BondsPerSPCount[SP] = 0;
1385 } else
[a67d19]1386 DoLog(0) && (Log() << Verbose(0) << "." << endl);
[cee0b57]1387
1388 RemainingWalkers = FragmentSearch.BondsPerSPCount[SP];
1389 CurrentEdge = FragmentSearch.BondsPerSPList[2*SP]; /// start of this SP level's list
1390 while (CurrentEdge->next != FragmentSearch.BondsPerSPList[2*SP+1]) { /// end of this SP level's list
1391 CurrentEdge = CurrentEdge->next;
1392 RemainingWalkers--;
1393 Walker = CurrentEdge->rightatom; // rightatom is always the one more distant
1394 Predecessor = CurrentEdge->leftatom; // ... and leftatom is predecessor
1395 AtomKeyNr = Walker->nr;
[a67d19]1396 DoLog(0) && (Log() << Verbose(0) << "Current Walker is: " << *Walker << " with nr " << Walker->nr << " and SP of " << SP << ", with " << RemainingWalkers << " remaining walkers on this level." << endl);
[cee0b57]1397 // check for new sp level
1398 // go through all its bonds
[a67d19]1399 DoLog(1) && (Log() << Verbose(1) << "Going through all bonds of Walker." << endl);
[266237]1400 for (BondList::const_iterator Runner = Walker->ListOfBonds.begin(); Runner != Walker->ListOfBonds.end(); (++Runner)) {
1401 OtherWalker = (*Runner)->GetOtherAtom(Walker);
[cee0b57]1402 if ((RestrictedKeySet.find(OtherWalker->nr) != RestrictedKeySet.end())
1403 #ifdef ADDHYDROGEN
[83f176]1404 && (OtherWalker->getType()->getAtomicNumber() != 1)
[cee0b57]1405 #endif
1406 ) { // skip hydrogens and restrict to fragment
[a67d19]1407 DoLog(2) && (Log() << Verbose(2) << "Current partner is " << *OtherWalker << " with nr " << OtherWalker->nr << " in bond " << *(*Runner) << "." << endl);
[cee0b57]1408 // set the label if not set (and push on root stack as well)
1409 if ((OtherWalker != Predecessor) && (OtherWalker->GetTrueFather()->nr > RootKeyNr)) { // only pass through those with label bigger than Root's
1410 FragmentSearch.ShortestPathList[OtherWalker->nr] = SP+1;
[a67d19]1411 DoLog(3) && (Log() << Verbose(3) << "Set Shortest Path to " << FragmentSearch.ShortestPathList[OtherWalker->nr] << "." << endl);
[cee0b57]1412 // add the bond in between to the SP list
1413 Binder = new bond(Walker, OtherWalker); // create a new bond in such a manner, that bond::rightatom is always the one more distant
1414 add(Binder, FragmentSearch.BondsPerSPList[2*(SP+1)+1]);
1415 FragmentSearch.BondsPerSPCount[SP+1]++;
[a67d19]1416 DoLog(3) && (Log() << Verbose(3) << "Added its bond to SP list, having now " << FragmentSearch.BondsPerSPCount[SP+1] << " item(s)." << endl);
[cee0b57]1417 } else {
1418 if (OtherWalker != Predecessor)
[a67d19]1419 DoLog(3) && (Log() << Verbose(3) << "Not passing on, as index of " << *OtherWalker << " " << OtherWalker->GetTrueFather()->nr << " is smaller than that of Root " << RootKeyNr << "." << endl);
[cee0b57]1420 else
[a67d19]1421 DoLog(3) && (Log() << Verbose(3) << "This is my predecessor " << *Predecessor << "." << endl);
[cee0b57]1422 }
[e138de]1423 } else Log() << Verbose(2) << "Is not in the restricted keyset or skipping hydrogen " << *OtherWalker << "." << endl;
[cee0b57]1424 }
1425 }
1426 }
[14e73a]1427};
[cee0b57]1428
[14e73a]1429/** prints the Bonds per Shortest Path list in UniqueFragments.
1430 * \param *out output stream
1431 * \param Order bond order (limits BFS exploration and "number of digits" in power set generation
1432 * \param FragmentSearch UniqueFragments
1433 */
[e138de]1434void OutputSPList(int Order, struct UniqueFragments &FragmentSearch)
[14e73a]1435{
1436 bond *Binder = NULL;
[a67d19]1437 DoLog(0) && (Log() << Verbose(0) << "Printing all found lists." << endl);
[cee0b57]1438 for(int i=1;i<Order;i++) { // skip the root edge in the printing
1439 Binder = FragmentSearch.BondsPerSPList[2*i];
[a67d19]1440 DoLog(1) && (Log() << Verbose(1) << "Current SP level is " << i << "." << endl);
[cee0b57]1441 while (Binder->next != FragmentSearch.BondsPerSPList[2*i+1]) {
1442 Binder = Binder->next;
[a67d19]1443 DoLog(2) && (Log() << Verbose(2) << *Binder << endl);
[cee0b57]1444 }
1445 }
[14e73a]1446};
[cee0b57]1447
[14e73a]1448/** Simply counts all bonds in all UniqueFragments::BondsPerSPList lists.
1449 * \param *out output stream
1450 * \param Order bond order (limits BFS exploration and "number of digits" in power set generation
1451 * \param FragmentSearch UniqueFragments
1452 */
[e138de]1453int CountNumbersInBondsList(int Order, struct UniqueFragments &FragmentSearch)
[14e73a]1454{
1455 bond *Binder = NULL;
1456 int SP = -1; // the Root <-> Root edge must be subtracted!
[cee0b57]1457 for(int i=Order;i--;) { // sum up all found edges
1458 Binder = FragmentSearch.BondsPerSPList[2*i];
1459 while (Binder->next != FragmentSearch.BondsPerSPList[2*i+1]) {
1460 Binder = Binder->next;
[93d120]1461 SP++;
[cee0b57]1462 }
1463 }
[14e73a]1464 return SP;
1465};
1466
1467/** Creates a list of all unique fragments of certain vertex size from a given graph \a Fragment for a given root vertex in the context of \a this molecule.
1468 * -# initialises UniqueFragments structure
1469 * -# fills edge list via BFS
1470 * -# creates the fragment by calling recursive function SPFragmentGenerator with UniqueFragments structure, 0 as
1471 root distance, the edge set, its dimension and the current suborder
1472 * -# Free'ing structure
1473 * Note that we may use the fact that the atoms are SP-ordered on the atomstack. I.e. when popping always the last, we first get all
1474 * with SP of 2, then those with SP of 3, then those with SP of 4 and so on.
1475 * \param *out output stream for debugging
1476 * \param Order bond order (limits BFS exploration and "number of digits" in power set generation
1477 * \param FragmentSearch UniqueFragments structure containing TEFactor, root atom and so on
1478 * \param RestrictedKeySet Restricted vertex set to use in context of molecule
1479 * \return number of inserted fragments
1480 * \note ShortestPathList in FragmentSearch structure is probably due to NumberOfAtomsSPLevel and SP not needed anymore
1481 */
[e138de]1482int molecule::PowerSetGenerator(int Order, struct UniqueFragments &FragmentSearch, KeySet RestrictedKeySet)
[14e73a]1483{
1484 int Counter = FragmentSearch.FragmentCounter; // mark current value of counter
1485
[a67d19]1486 DoLog(0) && (Log() << Verbose(0) << endl);
1487 DoLog(0) && (Log() << Verbose(0) << "Begin of PowerSetGenerator with order " << Order << " at Root " << *FragmentSearch.Root << "." << endl);
[14e73a]1488
[e138de]1489 SetSPList(Order, FragmentSearch);
[14e73a]1490
1491 // do a BFS search to fill the SP lists and label the found vertices
[e138de]1492 FillSPListandLabelVertices(Order, FragmentSearch, this, RestrictedKeySet);
[14e73a]1493
1494 // outputting all list for debugging
[e138de]1495 OutputSPList(Order, FragmentSearch);
[14e73a]1496
1497 // creating fragments with the found edge sets (may be done in reverse order, faster)
[e138de]1498 int SP = CountNumbersInBondsList(Order, FragmentSearch);
[a67d19]1499 DoLog(0) && (Log() << Verbose(0) << "Total number of edges is " << SP << "." << endl);
[cee0b57]1500 if (SP >= (Order-1)) {
1501 // start with root (push on fragment stack)
[a67d19]1502 DoLog(0) && (Log() << Verbose(0) << "Starting fragment generation with " << *FragmentSearch.Root << ", local nr is " << FragmentSearch.Root->nr << "." << endl);
[cee0b57]1503 FragmentSearch.FragmentSet->clear();
[a67d19]1504 DoLog(0) && (Log() << Verbose(0) << "Preparing subset for this root and calling generator." << endl);
[14e73a]1505
[cee0b57]1506 // prepare the subset and call the generator
[920c70]1507 bond* BondsList[FragmentSearch.BondsPerSPCount[0]];
1508 for(int i=0;i<FragmentSearch.BondsPerSPCount[0];i++)
1509 BondsList[i] = NULL;
[cee0b57]1510 BondsList[0] = FragmentSearch.BondsPerSPList[0]->next; // on SP level 0 there's only the root bond
1511
[e138de]1512 SPFragmentGenerator(&FragmentSearch, 0, BondsList, FragmentSearch.BondsPerSPCount[0], Order);
[cee0b57]1513 } else {
[a67d19]1514 DoLog(0) && (Log() << Verbose(0) << "Not enough total number of edges to build " << Order << "-body fragments." << endl);
[cee0b57]1515 }
1516
1517 // as FragmentSearch structure is used only once, we don't have to clean it anymore
1518 // remove root from stack
[a67d19]1519 DoLog(0) && (Log() << Verbose(0) << "Removing root again from stack." << endl);
[cee0b57]1520 FragmentSearch.FragmentSet->erase(FragmentSearch.Root->nr);
1521
1522 // free'ing the bonds lists
[e138de]1523 ResetSPList(Order, FragmentSearch);
[cee0b57]1524
1525 // return list
[a67d19]1526 DoLog(0) && (Log() << Verbose(0) << "End of PowerSetGenerator." << endl);
[cee0b57]1527 return (FragmentSearch.FragmentCounter - Counter);
1528};
1529
1530bool KeyCompare::operator() (const KeySet SubgraphA, const KeySet SubgraphB) const
1531{
[e138de]1532 //Log() << Verbose(0) << "my check is used." << endl;
[cee0b57]1533 if (SubgraphA.size() < SubgraphB.size()) {
1534 return true;
1535 } else {
1536 if (SubgraphA.size() > SubgraphB.size()) {
1537 return false;
1538 } else {
1539 KeySet::iterator IteratorA = SubgraphA.begin();
1540 KeySet::iterator IteratorB = SubgraphB.begin();
1541 while ((IteratorA != SubgraphA.end()) && (IteratorB != SubgraphB.end())) {
1542 if ((*IteratorA) < (*IteratorB))
1543 return true;
1544 else if ((*IteratorA) > (*IteratorB)) {
1545 return false;
1546 } // else, go on to next index
1547 IteratorA++;
1548 IteratorB++;
1549 } // end of while loop
1550 }// end of check in case of equal sizes
1551 }
1552 return false; // if we reach this point, they are equal
1553};
1554
1555
[407536]1556/** Combines all KeySets from all orders into single ones (with just unique entries).
1557 * \param *out output stream for debugging
1558 * \param *&FragmentList list to fill
1559 * \param ***FragmentLowerOrdersList
1560 * \param &RootStack stack with all root candidates (unequal to each atom in complete molecule if adaptive scheme is applied)
1561 * \param *mol molecule with atoms and bonds
1562 */
[e138de]1563int CombineAllOrderListIntoOne(Graph *&FragmentList, Graph ***FragmentLowerOrdersList, KeyStack &RootStack, molecule *mol)
[407536]1564{
1565 int RootNr = 0;
1566 int RootKeyNr = 0;
[93d120]1567 int StartNr = 0;
[407536]1568 int counter = 0;
1569 int NumLevels = 0;
1570 atom *Walker = NULL;
1571
[a67d19]1572 DoLog(0) && (Log() << Verbose(0) << "Combining the lists of all orders per order and finally into a single one." << endl);
[407536]1573 if (FragmentList == NULL) {
1574 FragmentList = new Graph;
1575 counter = 0;
1576 } else {
1577 counter = FragmentList->size();
1578 }
[93d120]1579
1580 StartNr = RootStack.back();
1581 do {
[407536]1582 RootKeyNr = RootStack.front();
1583 RootStack.pop_front();
1584 Walker = mol->FindAtom(RootKeyNr);
1585 NumLevels = 1 << (Walker->AdaptiveOrder - 1);
1586 for(int i=0;i<NumLevels;i++) {
1587 if (FragmentLowerOrdersList[RootNr][i] != NULL) {
[e138de]1588 InsertGraphIntoGraph(*FragmentList, (*FragmentLowerOrdersList[RootNr][i]), &counter);
[407536]1589 }
1590 }
1591 RootStack.push_back(Walker->nr);
1592 RootNr++;
[93d120]1593 } while (RootKeyNr != StartNr);
[407536]1594 return counter;
1595};
1596
1597/** Free's memory allocated for all KeySets from all orders.
1598 * \param *out output stream for debugging
1599 * \param ***FragmentLowerOrdersList
1600 * \param &RootStack stack with all root candidates (unequal to each atom in complete molecule if adaptive scheme is applied)
1601 * \param *mol molecule with atoms and bonds
1602 */
[e138de]1603void FreeAllOrdersList(Graph ***FragmentLowerOrdersList, KeyStack &RootStack, molecule *mol)
[407536]1604{
[a67d19]1605 DoLog(1) && (Log() << Verbose(1) << "Free'ing the lists of all orders per order." << endl);
[407536]1606 int RootNr = 0;
1607 int RootKeyNr = 0;
1608 int NumLevels = 0;
1609 atom *Walker = NULL;
1610 while (!RootStack.empty()) {
1611 RootKeyNr = RootStack.front();
1612 RootStack.pop_front();
1613 Walker = mol->FindAtom(RootKeyNr);
1614 NumLevels = 1 << (Walker->AdaptiveOrder - 1);
1615 for(int i=0;i<NumLevels;i++) {
1616 if (FragmentLowerOrdersList[RootNr][i] != NULL) {
1617 delete(FragmentLowerOrdersList[RootNr][i]);
1618 }
1619 }
[920c70]1620 delete[](FragmentLowerOrdersList[RootNr]);
[407536]1621 RootNr++;
1622 }
[920c70]1623 delete[](FragmentLowerOrdersList);
[407536]1624};
1625
1626
[cee0b57]1627/** Performs BOSSANOVA decomposition at selected sites, increasing the cutoff by one at these sites.
1628 * -# constructs a complete keyset of the molecule
1629 * -# In a loop over all possible roots from the given rootstack
1630 * -# increases order of root site
1631 * -# calls PowerSetGenerator with this order, the complete keyset and the rootkeynr
1632 * -# for all consecutive lower levels PowerSetGenerator is called with the suborder, the higher order keyset
1633as the restricted one and each site in the set as the root)
1634 * -# these are merged into a fragment list of keysets
1635 * -# All fragment lists (for all orders, i.e. from all destination fields) are merged into one list for return
1636 * Important only is that we create all fragments, it is not important if we create them more than once
1637 * as these copies are filtered out via use of the hash table (KeySet).
1638 * \param *out output stream for debugging
1639 * \param Fragment&*List list of already present keystacks (adaptive scheme) or empty list
1640 * \param &RootStack stack with all root candidates (unequal to each atom in complete molecule if adaptive scheme is applied)
1641 * \param *MinimumRingSize minimum ring size for each atom (molecule::Atomcount)
1642 * \return pointer to Graph list
1643 */
[e138de]1644void molecule::FragmentBOSSANOVA(Graph *&FragmentList, KeyStack &RootStack, int *MinimumRingSize)
[cee0b57]1645{
1646 Graph ***FragmentLowerOrdersList = NULL;
[407536]1647 int NumLevels = 0;
1648 int NumMolecules = 0;
1649 int TotalNumMolecules = 0;
1650 int *NumMoleculesOfOrder = NULL;
1651 int Order = 0;
[cee0b57]1652 int UpgradeCount = RootStack.size();
1653 KeyStack FragmentRootStack;
[407536]1654 int RootKeyNr = 0;
1655 int RootNr = 0;
[cee0b57]1656 struct UniqueFragments FragmentSearch;
1657
[a67d19]1658 DoLog(0) && (Log() << Verbose(0) << "Begin of FragmentBOSSANOVA." << endl);
[cee0b57]1659
1660 // FragmentLowerOrdersList is a 2D-array of pointer to MoleculeListClass objects, one dimension represents the ANOVA expansion of a single order (i.e. 5)
1661 // with all needed lower orders that are subtracted, the other dimension is the BondOrder (i.e. from 1 to 5)
[920c70]1662 NumMoleculesOfOrder = new int[UpgradeCount];
1663 FragmentLowerOrdersList = new Graph**[UpgradeCount];
1664
1665 for(int i=0;i<UpgradeCount;i++) {
1666 NumMoleculesOfOrder[i] = 0;
1667 FragmentLowerOrdersList[i] = NULL;
1668 }
[cee0b57]1669
1670 // initialise the fragments structure
1671 FragmentSearch.FragmentCounter = 0;
1672 FragmentSearch.FragmentSet = new KeySet;
1673 FragmentSearch.Root = FindAtom(RootKeyNr);
[1024cb]1674 FragmentSearch.ShortestPathList = new int[getAtomCount()];
[ea7176]1675 for (int i=getAtomCount();i--;) {
[cee0b57]1676 FragmentSearch.ShortestPathList[i] = -1;
1677 }
1678
1679 // Construct the complete KeySet which we need for topmost level only (but for all Roots)
1680 KeySet CompleteMolecule;
[9879f6]1681 for (molecule::const_iterator iter = begin(); iter != end(); ++iter) {
1682 CompleteMolecule.insert((*iter)->GetTrueFather()->nr);
[cee0b57]1683 }
1684
1685 // this can easily be seen: if Order is 5, then the number of levels for each lower order is the total sum of the number of levels above, as
1686 // each has to be split up. E.g. for the second level we have one from 5th, one from 4th, two from 3th (which in turn is one from 5th, one from 4th),
1687 // hence we have overall four 2th order levels for splitting. This also allows for putting all into a single array (FragmentLowerOrdersList[])
1688 // with the order along the cells as this: 5433222211111111 for BondOrder 5 needing 16=pow(2,5-1) cells (only we use bit-shifting which is faster)
1689 RootNr = 0; // counts through the roots in RootStack
1690 while ((RootNr < UpgradeCount) && (!RootStack.empty())) {
1691 RootKeyNr = RootStack.front();
1692 RootStack.pop_front();
[9879f6]1693 atom *Walker = FindAtom(RootKeyNr);
[cee0b57]1694 // check cyclic lengths
1695 //if ((MinimumRingSize[Walker->GetTrueFather()->nr] != -1) && (Walker->GetTrueFather()->AdaptiveOrder+1 > MinimumRingSize[Walker->GetTrueFather()->nr])) {
[e138de]1696 // Log() << Verbose(0) << "Bond order " << Walker->GetTrueFather()->AdaptiveOrder << " of Root " << *Walker << " greater than or equal to Minimum Ring size of " << MinimumRingSize << " found is not allowed." << endl;
[cee0b57]1697 //} else
1698 {
1699 // increase adaptive order by one
1700 Walker->GetTrueFather()->AdaptiveOrder++;
1701 Order = Walker->AdaptiveOrder = Walker->GetTrueFather()->AdaptiveOrder;
1702
1703 // initialise Order-dependent entries of UniqueFragments structure
[e138de]1704 InitialiseSPList(Order, FragmentSearch);
[cee0b57]1705
1706 // allocate memory for all lower level orders in this 1D-array of ptrs
1707 NumLevels = 1 << (Order-1); // (int)pow(2,Order);
[920c70]1708 FragmentLowerOrdersList[RootNr] = new Graph*[NumLevels];
1709 for (int i=0;i<NumLevels;i++)
1710 FragmentLowerOrdersList[RootNr][i] = NULL;
[cee0b57]1711
1712 // create top order where nothing is reduced
[a67d19]1713 DoLog(0) && (Log() << Verbose(0) << "==============================================================================================================" << endl);
1714 DoLog(0) && (Log() << Verbose(0) << "Creating KeySets of Bond Order " << Order << " for " << *Walker << ", " << (RootStack.size()-RootNr) << " Roots remaining." << endl); // , NumLevels is " << NumLevels << "
[cee0b57]1715
1716 // Create list of Graphs of current Bond Order (i.e. F_{ij})
1717 FragmentLowerOrdersList[RootNr][0] = new Graph;
1718 FragmentSearch.TEFactor = 1.;
1719 FragmentSearch.Leaflet = FragmentLowerOrdersList[RootNr][0]; // set to insertion graph
1720 FragmentSearch.Root = Walker;
[e138de]1721 NumMoleculesOfOrder[RootNr] = PowerSetGenerator(Walker->AdaptiveOrder, FragmentSearch, CompleteMolecule);
[407536]1722
1723 // output resulting number
[a67d19]1724 DoLog(1) && (Log() << Verbose(1) << "Number of resulting KeySets is: " << NumMoleculesOfOrder[RootNr] << "." << endl);
[cee0b57]1725 if (NumMoleculesOfOrder[RootNr] != 0) {
1726 NumMolecules = 0;
1727 } else {
1728 Walker->GetTrueFather()->MaxOrder = true;
1729 }
1730 // now, we have completely filled each cell of FragmentLowerOrdersList[] for the current Walker->AdaptiveOrder
1731 //NumMoleculesOfOrder[Walker->AdaptiveOrder-1] = NumMolecules;
1732 TotalNumMolecules += NumMoleculesOfOrder[RootNr];
[e138de]1733// Log() << Verbose(1) << "Number of resulting molecules for Order " << (int)Walker->GetTrueFather()->AdaptiveOrder << " is: " << NumMoleculesOfOrder[RootNr] << "." << endl;
[cee0b57]1734 RootStack.push_back(RootKeyNr); // put back on stack
1735 RootNr++;
1736
1737 // free Order-dependent entries of UniqueFragments structure for next loop cycle
[e138de]1738 FreeSPList(Order, FragmentSearch);
[cee0b57]1739 }
1740 }
[a67d19]1741 DoLog(0) && (Log() << Verbose(0) << "==============================================================================================================" << endl);
1742 DoLog(1) && (Log() << Verbose(1) << "Total number of resulting molecules is: " << TotalNumMolecules << "." << endl);
1743 DoLog(0) && (Log() << Verbose(0) << "==============================================================================================================" << endl);
[cee0b57]1744
1745 // cleanup FragmentSearch structure
[920c70]1746 delete[](FragmentSearch.ShortestPathList);
[cee0b57]1747 delete(FragmentSearch.FragmentSet);
1748
1749 // now, FragmentLowerOrdersList is complete, it looks - for BondOrder 5 - as this (number is the ANOVA Order of the terms therein)
1750 // 5433222211111111
1751 // 43221111
1752 // 3211
1753 // 21
1754 // 1
1755
1756 // Subsequently, we combine all into a single list (FragmentList)
[e138de]1757 CombineAllOrderListIntoOne(FragmentList, FragmentLowerOrdersList, RootStack, this);
1758 FreeAllOrdersList(FragmentLowerOrdersList, RootStack, this);
[920c70]1759 delete[](NumMoleculesOfOrder);
[cee0b57]1760
[a67d19]1761 DoLog(0) && (Log() << Verbose(0) << "End of FragmentBOSSANOVA." << endl);
[cee0b57]1762};
1763
1764/** Corrects the nuclei position if the fragment was created over the cell borders.
1765 * Scans all bonds, checks the distance, if greater than typical, we have a candidate for the correction.
1766 * We remove the bond whereafter the graph probably separates. Then, we translate the one component periodically
1767 * and re-add the bond. Looping on the distance check.
1768 * \param *out ofstream for debugging messages
1769 */
[e138de]1770void molecule::ScanForPeriodicCorrection()
[cee0b57]1771{
1772 bond *Binder = NULL;
1773 bond *OtherBinder = NULL;
1774 atom *Walker = NULL;
1775 atom *OtherWalker = NULL;
[cca9ef]1776 RealSpaceMatrix matrix = World::getInstance().getDomain().getM();
[cee0b57]1777 enum Shading *ColorList = NULL;
1778 double tmp;
1779 Vector Translationvector;
[a564be]1780 //std::deque<atom *> *CompStack = NULL;
1781 std::deque<atom *> *AtomStack = new std::deque<atom *>; // (getAtomCount());
[cee0b57]1782 bool flag = true;
1783
[a67d19]1784 DoLog(2) && (Log() << Verbose(2) << "Begin of ScanForPeriodicCorrection." << endl);
[cee0b57]1785
[1024cb]1786 ColorList = new enum Shading[getAtomCount()];
1787 for (int i=0;i<getAtomCount();i++)
[920c70]1788 ColorList[i] = (enum Shading)0;
[cee0b57]1789 while (flag) {
1790 // remove bonds that are beyond bonddistance
[d4c9ae]1791 Translationvector.Zero();
[cee0b57]1792 // scan all bonds
1793 flag = false;
[e08c46]1794 for(molecule::iterator AtomRunner = begin(); (!flag) && (AtomRunner != end()); ++AtomRunner)
1795 for(BondList::iterator BondRunner = (*AtomRunner)->ListOfBonds.begin(); (!flag) && (BondRunner != (*AtomRunner)->ListOfBonds.end()); ++BondRunner) {
1796 Binder = (*BondRunner);
1797 for (int i=NDIM;i--;) {
[d74077]1798 tmp = fabs(Binder->leftatom->at(i) - Binder->rightatom->at(i));
[e08c46]1799 //Log() << Verbose(3) << "Checking " << i << "th distance of " << *Binder->leftatom << " to " << *Binder->rightatom << ": " << tmp << "." << endl;
1800 if (tmp > BondDistance) {
1801 OtherBinder = Binder->next; // note down binding partner for later re-insertion
1802 unlink(Binder); // unlink bond
1803 DoLog(2) && (Log() << Verbose(2) << "Correcting at bond " << *Binder << "." << endl);
1804 flag = true;
1805 break;
1806 }
[cee0b57]1807 }
1808 }
1809 if (flag) {
1810 // create translation vector from their periodically modified distance
1811 for (int i=NDIM;i--;) {
[d74077]1812 tmp = Binder->leftatom->at(i) - Binder->rightatom->at(i);
[cee0b57]1813 if (fabs(tmp) > BondDistance)
[0a4f7f]1814 Translationvector[i] = (tmp < 0) ? +1. : -1.;
[cee0b57]1815 }
[5108e1]1816 Translationvector *= matrix;
[e138de]1817 //Log() << Verbose(3) << "Translation vector is ";
[0a4f7f]1818 Log() << Verbose(0) << Translationvector << endl;
[cee0b57]1819 // apply to all atoms of first component via BFS
[ea7176]1820 for (int i=getAtomCount();i--;)
[cee0b57]1821 ColorList[i] = white;
[a564be]1822 AtomStack->push_front(Binder->leftatom);
1823 while (!AtomStack->empty()) {
1824 Walker = AtomStack->front();
1825 AtomStack->pop_front();
[e138de]1826 //Log() << Verbose (3) << "Current Walker is: " << *Walker << "." << endl;
[cee0b57]1827 ColorList[Walker->nr] = black; // mark as explored
[d74077]1828 *Walker += Translationvector; // translate
[266237]1829 for (BondList::const_iterator Runner = Walker->ListOfBonds.begin(); Runner != Walker->ListOfBonds.end(); (++Runner)) {
1830 if ((*Runner) != Binder) {
1831 OtherWalker = (*Runner)->GetOtherAtom(Walker);
[cee0b57]1832 if (ColorList[OtherWalker->nr] == white) {
[a564be]1833 AtomStack->push_front(OtherWalker); // push if yet unexplored
[cee0b57]1834 }
1835 }
1836 }
1837 }
1838 // re-add bond
1839 link(Binder, OtherBinder);
1840 } else {
[a67d19]1841 DoLog(3) && (Log() << Verbose(3) << "No corrections for this fragment." << endl);
[cee0b57]1842 }
1843 //delete(CompStack);
1844 }
1845 // free allocated space from ReturnFullMatrixforSymmetric()
1846 delete(AtomStack);
[920c70]1847 delete[](ColorList);
[a67d19]1848 DoLog(2) && (Log() << Verbose(2) << "End of ScanForPeriodicCorrection." << endl);
[cee0b57]1849};
Note: See TracBrowser for help on using the repository browser.