source: src/molecule_graph.cpp@ 4f7f34e

Action_Thermostats Add_AtomRandomPerturbation Add_FitFragmentPartialChargesAction Add_RotateAroundBondAction Add_SelectAtomByNameAction Added_ParseSaveFragmentResults AddingActions_SaveParseParticleParameters Adding_Graph_to_ChangeBondActions Adding_MD_integration_tests Adding_ParticleName_to_Atom Adding_StructOpt_integration_tests AtomFragments Automaking_mpqc_open AutomationFragmentation_failures Candidate_v1.5.4 Candidate_v1.6.0 Candidate_v1.6.1 Candidate_v1.7.0 ChangeBugEmailaddress ChangingTestPorts ChemicalSpaceEvaluator CombiningParticlePotentialParsing Combining_Subpackages Debian_Package_split Debian_package_split_molecuildergui_only Disabling_MemDebug Docu_Python_wait EmpiricalPotential_contain_HomologyGraph EmpiricalPotential_contain_HomologyGraph_documentation Enable_parallel_make_install Enhance_userguide Enhanced_StructuralOptimization Enhanced_StructuralOptimization_continued Example_ManyWaysToTranslateAtom Exclude_Hydrogens_annealWithBondGraph FitPartialCharges_GlobalError Fix_BoundInBox_CenterInBox_MoleculeActions Fix_ChargeSampling_PBC Fix_ChronosMutex Fix_FitPartialCharges Fix_FitPotential_needs_atomicnumbers Fix_ForceAnnealing Fix_IndependentFragmentGrids Fix_ParseParticles Fix_ParseParticles_split_forward_backward_Actions Fix_PopActions Fix_QtFragmentList_sorted_selection Fix_Restrictedkeyset_FragmentMolecule Fix_StatusMsg Fix_StepWorldTime_single_argument Fix_Verbose_Codepatterns Fix_fitting_potentials Fixes ForceAnnealing_goodresults ForceAnnealing_oldresults ForceAnnealing_tocheck ForceAnnealing_with_BondGraph ForceAnnealing_with_BondGraph_continued ForceAnnealing_with_BondGraph_continued_betteresults ForceAnnealing_with_BondGraph_contraction-expansion FragmentAction_writes_AtomFragments FragmentMolecule_checks_bonddegrees GeometryObjects Gui_Fixes Gui_displays_atomic_force_velocity ImplicitCharges IndependentFragmentGrids IndependentFragmentGrids_IndividualZeroInstances IndependentFragmentGrids_IntegrationTest IndependentFragmentGrids_Sole_NN_Calculation JobMarket_RobustOnKillsSegFaults JobMarket_StableWorkerPool JobMarket_unresolvable_hostname_fix MoreRobust_FragmentAutomation ODR_violation_mpqc_open PartialCharges_OrthogonalSummation PdbParser_setsAtomName PythonUI_with_named_parameters QtGui_reactivate_TimeChanged_changes Recreated_GuiChecks Rewrite_FitPartialCharges RotateToPrincipalAxisSystem_UndoRedo SaturateAtoms_findBestMatching SaturateAtoms_singleDegree StoppableMakroAction Subpackage_CodePatterns Subpackage_JobMarket Subpackage_LinearAlgebra Subpackage_levmar Subpackage_mpqc_open Subpackage_vmg Switchable_LogView ThirdParty_MPQC_rebuilt_buildsystem TrajectoryDependenant_MaxOrder TremoloParser_IncreasedPrecision TremoloParser_MultipleTimesteps TremoloParser_setsAtomName Ubuntu_1604_changes stable
Last change on this file since 4f7f34e was 35b698, checked in by Frederik Heber <heber@…>, 15 years ago

BIG CHANGE: config::load and config::save in ParseCommandLineOptions() and main() replaced with FormatParser replacements.

Fragmentation:

  • FIX: MoleculeFillWithMoleculeAction: filler atoms have to be removed before the system can be stored to file.
  • FIX: PcpParser::load() - has to put the molecule also into World's MoleculeListClass (otherwise the name cannot be set right after loading)
  • new Libparser.a
  • all sources from PARSER subdir are compiled into libparser such that only ParserUnitTest is recompiled.

Testfixes:

  • testsuite-fragmentation - changes to due to different -f calling syntax.
  • most of the xyz files had to be replaced due to a single whitespace at the end of each entry: Domain/6, Simple_configuration/2, Simple_configuration/3, Simple_configuration/4, Simple_configuration/5, Simple_configuration/8
  • in many cases were the number orbitals (and thus MaxMinStopStep) wrong: Filling/1, Simple_configuration/4, Simple_configuration/5

Signed-off-by: Frederik Heber <heber@…>

  • Property mode set to 100644
File size: 65.7 KB
RevLine 
[cee0b57]1/*
2 * molecule_graph.cpp
3 *
4 * Created on: Oct 5, 2009
5 * Author: heber
6 */
7
[112b09]8#include "Helpers/MemDebug.hpp"
9
[f66195]10#include "atom.hpp"
11#include "bond.hpp"
[b70721]12#include "bondgraph.hpp"
[cee0b57]13#include "config.hpp"
[35b698]14#include "defs.hpp"
[f66195]15#include "element.hpp"
16#include "helpers.hpp"
[c68c90]17#include "info.hpp"
[b8b75d]18#include "linkedcell.hpp"
[f66195]19#include "lists.hpp"
[e138de]20#include "log.hpp"
[cee0b57]21#include "memoryallocator.hpp"
22#include "molecule.hpp"
[b34306]23#include "World.hpp"
[0a4f7f]24#include "Helpers/fast_functions.hpp"
[f2bb0f]25#include "Helpers/Assert.hpp"
[cee0b57]26
27
[9eefda]28struct BFSAccounting
29{
30 atom **PredecessorList;
31 int *ShortestPathList;
32 enum Shading *ColorList;
33 class StackClass<atom *> *BFSStack;
34 class StackClass<atom *> *TouchedStack;
35 int AtomCount;
36 int BondOrder;
37 atom *Root;
38 bool BackStepping;
39 int CurrentGraphNr;
40 int ComponentNr;
41};
[cee0b57]42
[9eefda]43/** Accounting data for Depth First Search.
44 */
45struct DFSAccounting
46{
47 class StackClass<atom *> *AtomStack;
48 class StackClass<bond *> *BackEdgeStack;
49 int CurrentGraphNr;
50 int ComponentNumber;
51 atom *Root;
52 bool BackStepping;
53};
54
55/************************************* Functions for class molecule *********************************/
[cee0b57]56
57/** Creates an adjacency list of the molecule.
58 * We obtain an outside file with the indices of atoms which are bondmembers.
59 */
[e138de]60void molecule::CreateAdjacencyListFromDbondFile(ifstream *input)
[cee0b57]61{
[c68c90]62 Info FunctionInfo(__func__);
[cee0b57]63 // 1 We will parse bonds out of the dbond file created by tremolo.
[44a59b]64 int atom1, atom2;
65 atom *Walker, *OtherWalker;
[c68c90]66 char line[MAXSTRINGSIZE];
[44a59b]67
[c68c90]68 if (input->fail()) {
69 DoeLog(0) && (eLog() << Verbose(0) << "Opening of bond file failed \n");
70 performCriticalExit();
[44a59b]71 };
[bd6bfa]72 doCountAtoms();
[44a59b]73
[c68c90]74 // skip header
75 input->getline(line,MAXSTRINGSIZE);
76 DoLog(1) && (Log() << Verbose(1) << "Scanning file ... \n");
[44a59b]77 while (!input->eof()) // Check whether we read everything already
78 {
[c68c90]79 input->getline(line,MAXSTRINGSIZE);
80 stringstream zeile(line);
81 zeile >> atom1;
82 zeile >> atom2;
[44a59b]83
[c68c90]84 DoLog(2) && (Log() << Verbose(2) << "Looking for atoms " << atom1 << " and " << atom2 << "." << endl);
[9eefda]85 if (atom2 < atom1) //Sort indices of atoms in order
[44a59b]86 flip(atom1, atom2);
[9eefda]87 Walker = FindAtom(atom1);
[05a97c]88 ASSERT(Walker,"Could not find an atom with the ID given in dbond file");
[9eefda]89 OtherWalker = FindAtom(atom2);
[05a97c]90 ASSERT(OtherWalker,"Could not find an atom with the ID given in dbond file");
[44a59b]91 AddBond(Walker, OtherWalker); //Add the bond between the two atoms with respective indices.
92 }
[9eefda]93}
94;
[cee0b57]95
96/** Creates an adjacency list of the molecule.
97 * Generally, we use the CSD approach to bond recognition, that is the the distance
98 * between two atoms A and B must be within [Rcov(A)+Rcov(B)-t,Rcov(A)+Rcov(B)+t] with
99 * a threshold t = 0.4 Angstroem.
100 * To make it O(N log N) the function uses the linked-cell technique as follows:
101 * The procedure is step-wise:
102 * -# Remove every bond in list
103 * -# Count the atoms in the molecule with CountAtoms()
104 * -# partition cell into smaller linked cells of size \a bonddistance
105 * -# put each atom into its corresponding cell
106 * -# go through every cell, check the atoms therein against all possible bond partners in the 27 adjacent cells, add bond if true
107 * -# correct the bond degree iteratively (single->double->triple bond)
108 * -# finally print the bond list to \a *out if desired
109 * \param *out out stream for printing the matrix, NULL if no output
110 * \param bonddistance length of linked cells (i.e. maximum minimal length checked)
111 * \param IsAngstroem whether coordinate system is gauged to Angstroem or Bohr radii
[b70721]112 * \param *minmaxdistance function to give upper and lower bound on whether particle is bonded to some other
113 * \param *BG BondGraph with the member function above or NULL, if just standard covalent should be used.
[cee0b57]114 */
[e138de]115void molecule::CreateAdjacencyList(double bonddistance, bool IsAngstroem, void (BondGraph::*minmaxdistance)(BondedParticle * const , BondedParticle * const , double &, double &, bool), BondGraph *BG)
[cee0b57]116{
[b8b75d]117 atom *Walker = NULL;
118 atom *OtherWalker = NULL;
119 int n[NDIM];
[b70721]120 double MinDistance, MaxDistance;
[b8b75d]121 LinkedCell *LC = NULL;
[b70721]122 bool free_BG = false;
[5f612ee]123 double * const cell_size = World::getInstance().getDomain();
[b70721]124
125 if (BG == NULL) {
126 BG = new BondGraph(IsAngstroem);
127 free_BG = true;
128 }
[cee0b57]129
130 BondDistance = bonddistance; // * ((IsAngstroem) ? 1. : 1./AtomicLengthToAngstroem);
[a67d19]131 DoLog(0) && (Log() << Verbose(0) << "Begin of CreateAdjacencyList." << endl);
[cee0b57]132 // remove every bond from the list
[e08c46]133 for(molecule::iterator AtomRunner = begin(); AtomRunner != end(); ++AtomRunner)
134 for(BondList::iterator BondRunner = (*AtomRunner)->ListOfBonds.begin(); !(*AtomRunner)->ListOfBonds.empty(); BondRunner = (*AtomRunner)->ListOfBonds.begin())
135 if ((*BondRunner)->leftatom == *AtomRunner)
136 delete((*BondRunner));
[3c349b]137 BondCount = 0;
[cee0b57]138
139 // count atoms in molecule = dimension of matrix (also give each unique name and continuous numbering)
[a7b761b]140 DoLog(1) && (Log() << Verbose(1) << "AtomCount " << getAtomCount() << " and bonddistance is " << bonddistance << "." << endl);
[cee0b57]141
[ea7176]142 if ((getAtomCount() > 1) && (bonddistance > 1.)) {
[a67d19]143 DoLog(2) && (Log() << Verbose(2) << "Creating Linked Cell structure ... " << endl);
[b8b75d]144 LC = new LinkedCell(this, bonddistance);
[cee0b57]145
[b8b75d]146 // create a list to map Tesselpoint::nr to atom *
[a67d19]147 DoLog(2) && (Log() << Verbose(2) << "Creating TesselPoint to atom map ... " << endl);
[f2bb0f]148
[53731f]149 // set numbers for atoms that can later be used
150 int i=0;
151 for(internal_iterator iter = atoms.begin();iter!= atoms.end(); ++iter){
152 (*iter)->nr = i++;
[cee0b57]153 }
154
155 // 3a. go through every cell
[a67d19]156 DoLog(2) && (Log() << Verbose(2) << "Celling ... " << endl);
[b8b75d]157 for (LC->n[0] = 0; LC->n[0] < LC->N[0]; LC->n[0]++)
158 for (LC->n[1] = 0; LC->n[1] < LC->N[1]; LC->n[1]++)
159 for (LC->n[2] = 0; LC->n[2] < LC->N[2]; LC->n[2]++) {
[734816]160 const LinkedCell::LinkedNodes *List = LC->GetCurrentCell();
[e5ad5c]161// Log() << Verbose(2) << "Current cell is " << LC->n[0] << ", " << LC->n[1] << ", " << LC->n[2] << " with No. " << LC->index << " containing " << List->size() << " points." << endl;
[b8b75d]162 if (List != NULL) {
[734816]163 for (LinkedCell::LinkedNodes::const_iterator Runner = List->begin(); Runner != List->end(); Runner++) {
[f2bb0f]164 Walker = dynamic_cast<atom*>(*Runner);
165 ASSERT(Walker,"Tesselpoint that was not an atom retrieved from LinkedNode");
[e138de]166 //Log() << Verbose(0) << "Current Atom is " << *Walker << "." << endl;
[cee0b57]167 // 3c. check for possible bond between each atom in this and every one in the 27 cells
[9eefda]168 for (n[0] = -1; n[0] <= 1; n[0]++)
169 for (n[1] = -1; n[1] <= 1; n[1]++)
170 for (n[2] = -1; n[2] <= 1; n[2]++) {
[734816]171 const LinkedCell::LinkedNodes *OtherList = LC->GetRelativeToCurrentCell(n);
[e5ad5c]172// Log() << Verbose(2) << "Current relative cell is " << LC->n[0] << ", " << LC->n[1] << ", " << LC->n[2] << " with No. " << LC->index << " containing " << List->size() << " points." << endl;
[b8b75d]173 if (OtherList != NULL) {
[734816]174 for (LinkedCell::LinkedNodes::const_iterator OtherRunner = OtherList->begin(); OtherRunner != OtherList->end(); OtherRunner++) {
[b8b75d]175 if ((*OtherRunner)->nr > Walker->nr) {
[f2bb0f]176 OtherWalker = dynamic_cast<atom*>(*OtherRunner);
177 ASSERT(OtherWalker,"TesselPoint that was not an atom retrieved from LinkedNode");
[e138de]178 //Log() << Verbose(1) << "Checking distance " << OtherWalker->x.PeriodicDistanceSquared(&(Walker->x), cell_size) << " against typical bond length of " << bonddistance*bonddistance << "." << endl;
[e5ad5c]179 (BG->*minmaxdistance)(Walker, OtherWalker, MinDistance, MaxDistance, IsAngstroem);
[a7b761b]180 const double distance = OtherWalker->x.PeriodicDistanceSquared(Walker->x,cell_size);
[b70721]181 const bool status = (distance <= MaxDistance * MaxDistance) && (distance >= MinDistance * MinDistance);
[e5ad5c]182// Log() << Verbose(1) << "MinDistance is " << MinDistance << " and MaxDistance is " << MaxDistance << "." << endl;
183 if (OtherWalker->father->nr > Walker->father->nr) {
184 if (status) { // create bond if distance is smaller
185// Log() << Verbose(1) << "Adding Bond between " << *Walker << " and " << *OtherWalker << " in distance " << sqrt(distance) << "." << endl;
186 AddBond(Walker->father, OtherWalker->father, 1); // also increases molecule::BondCount
187 } else {
188// Log() << Verbose(1) << "Not Adding: distance too great." << endl;
189 }
[b8b75d]190 } else {
[e5ad5c]191// Log() << Verbose(1) << "Not Adding: Wrong order of labels." << endl;
[b8b75d]192 }
[cee0b57]193 }
194 }
195 }
196 }
197 }
198 }
199 }
[9eefda]200 delete (LC);
[a67d19]201 DoLog(1) && (Log() << Verbose(1) << "I detected " << BondCount << " bonds in the molecule with distance " << BondDistance << "." << endl);
[cee0b57]202
[b8b75d]203 // correct bond degree by comparing valence and bond degree
[a67d19]204 DoLog(2) && (Log() << Verbose(2) << "Correcting bond degree ... " << endl);
[e138de]205 CorrectBondDegree();
[cee0b57]206
[b8b75d]207 // output bonds for debugging (if bond chain list was correctly installed)
[e138de]208 ActOnAllAtoms( &atom::OutputBondOfAtom );
[b8b75d]209 } else
[a7b761b]210 DoLog(1) && (Log() << Verbose(1) << "AtomCount is " << getAtomCount() << ", thus no bonds, no connections!." << endl);
[a67d19]211 DoLog(0) && (Log() << Verbose(0) << "End of CreateAdjacencyList." << endl);
[b70721]212 if (free_BG)
213 delete(BG);
[9eefda]214}
215;
[cee0b57]216
[e08c46]217/** Checks for presence of bonds within atom list.
218 * TODO: more sophisticated check for bond structure (e.g. connected subgraph, ...)
219 * \return true - bonds present, false - no bonds
220 */
221bool molecule::hasBondStructure()
222{
223 for(molecule::iterator AtomRunner = begin(); AtomRunner != end(); ++AtomRunner)
224 if (!(*AtomRunner)->ListOfBonds.empty())
225 return true;
226 return false;
227}
228
229/** Counts the number of present bonds.
230 * \return number of bonds
231 */
232unsigned int molecule::CountBonds() const
233{
234 unsigned int counter = 0;
235 for(molecule::const_iterator AtomRunner = begin(); AtomRunner != end(); ++AtomRunner)
236 for(BondList::const_iterator BondRunner = (*AtomRunner)->ListOfBonds.begin(); BondRunner != (*AtomRunner)->ListOfBonds.end(); ++BondRunner)
237 if ((*BondRunner)->leftatom == *AtomRunner)
238 counter++;
239 return counter;
240}
241
[b8b75d]242/** Prints a list of all bonds to \a *out.
243 * \param output stream
244 */
[e138de]245void molecule::OutputBondsList() const
[b8b75d]246{
[a67d19]247 DoLog(1) && (Log() << Verbose(1) << endl << "From contents of bond chain list:");
[e08c46]248 for(molecule::const_iterator AtomRunner = molecule::begin(); AtomRunner != molecule::end(); ++AtomRunner)
249 for(BondList::const_iterator BondRunner = (*AtomRunner)->ListOfBonds.begin(); BondRunner != (*AtomRunner)->ListOfBonds.end(); ++BondRunner)
250 if ((*BondRunner)->leftatom == *AtomRunner) {
251 DoLog(0) && (Log() << Verbose(0) << *(*BondRunner) << "\t" << endl);
252 }
[a67d19]253 DoLog(0) && (Log() << Verbose(0) << endl);
[9eefda]254}
255;
[cee0b57]256
[b8b75d]257/** correct bond degree by comparing valence and bond degree.
258 * correct Bond degree of each bond by checking both bond partners for a mismatch between valence and current sum of bond degrees,
259 * iteratively increase the one first where the other bond partner has the fewest number of bonds (i.e. in general bonds oxygene
260 * preferred over carbon bonds). Beforehand, we had picked the first mismatching partner, which lead to oxygenes with single instead of
261 * double bonds as was expected.
262 * \param *out output stream for debugging
263 * \return number of bonds that could not be corrected
264 */
[e138de]265int molecule::CorrectBondDegree() const
[b8b75d]266{
[99593f]267 int No = 0, OldNo = -1;
[b8b75d]268
269 if (BondCount != 0) {
[a67d19]270 DoLog(1) && (Log() << Verbose(1) << "Correcting Bond degree of each bond ... " << endl);
[b8b75d]271 do {
[99593f]272 OldNo = No;
[e138de]273 No = SumPerAtom( &atom::CorrectBondDegree );
[99593f]274 } while (OldNo != No);
[a67d19]275 DoLog(0) && (Log() << Verbose(0) << " done." << endl);
[b8b75d]276 } else {
[a7b761b]277 DoLog(1) && (Log() << Verbose(1) << "BondCount is " << BondCount << ", no bonds between any of the " << getAtomCount() << " atoms." << endl);
[b8b75d]278 }
[a67d19]279 DoLog(0) && (Log() << Verbose(0) << No << " bonds could not be corrected." << endl);
[cee0b57]280
[266237]281 return (No);
[9eefda]282}
283;
[cee0b57]284
285/** Counts all cyclic bonds and returns their number.
286 * \note Hydrogen bonds can never by cyclic, thus no check for that
287 * \param *out output stream for debugging
288 * \return number opf cyclic bonds
289 */
[e138de]290int molecule::CountCyclicBonds()
[cee0b57]291{
[266237]292 NoCyclicBonds = 0;
[cee0b57]293 int *MinimumRingSize = NULL;
294 MoleculeLeafClass *Subgraphs = NULL;
295 class StackClass<bond *> *BackEdgeStack = NULL;
[e08c46]296 for(molecule::iterator AtomRunner = begin(); AtomRunner != end(); ++AtomRunner)
297 if ((!(*AtomRunner)->ListOfBonds.empty()) && ((*(*AtomRunner)->ListOfBonds.begin())->Type == Undetermined)) {
298 DoLog(0) && (Log() << Verbose(0) << "No Depth-First-Search analysis performed so far, calling ..." << endl);
299 Subgraphs = DepthFirstSearchAnalysis(BackEdgeStack);
300 while (Subgraphs->next != NULL) {
301 Subgraphs = Subgraphs->next;
302 delete (Subgraphs->previous);
303 }
304 delete (Subgraphs);
305 delete[] (MinimumRingSize);
306 break;
[cee0b57]307 }
[e08c46]308 for(molecule::iterator AtomRunner = begin(); AtomRunner != end(); ++AtomRunner)
309 for(BondList::iterator BondRunner = (*AtomRunner)->ListOfBonds.begin(); BondRunner != (*AtomRunner)->ListOfBonds.end(); ++BondRunner)
310 if ((*BondRunner)->leftatom == *AtomRunner)
311 if ((*BondRunner)->Cyclic)
312 NoCyclicBonds++;
[9eefda]313 delete (BackEdgeStack);
[266237]314 return NoCyclicBonds;
[9eefda]315}
316;
[b8b75d]317
[cee0b57]318/** Returns Shading as a char string.
319 * \param color the Shading
320 * \return string of the flag
321 */
[fa649a]322string molecule::GetColor(enum Shading color) const
[cee0b57]323{
[9eefda]324 switch (color) {
[cee0b57]325 case white:
326 return "white";
327 break;
328 case lightgray:
329 return "lightgray";
330 break;
331 case darkgray:
332 return "darkgray";
333 break;
334 case black:
335 return "black";
336 break;
337 default:
338 return "uncolored";
339 break;
340 };
[9eefda]341}
342;
[cee0b57]343
[9eefda]344/** Sets atom::GraphNr and atom::LowpointNr to BFSAccounting::CurrentGraphNr.
345 * \param *out output stream for debugging
346 * \param *Walker current node
347 * \param &BFS structure with accounting data for BFS
348 */
[e138de]349void DepthFirstSearchAnalysis_SetWalkersGraphNr(atom *&Walker, struct DFSAccounting &DFS)
[174e0e]350{
[9eefda]351 if (!DFS.BackStepping) { // if we don't just return from (8)
352 Walker->GraphNr = DFS.CurrentGraphNr;
353 Walker->LowpointNr = DFS.CurrentGraphNr;
[68f03d]354 DoLog(1) && (Log() << Verbose(1) << "Setting Walker[" << Walker->getName() << "]'s number to " << Walker->GraphNr << " with Lowpoint " << Walker->LowpointNr << "." << endl);
[9eefda]355 DFS.AtomStack->Push(Walker);
356 DFS.CurrentGraphNr++;
[174e0e]357 }
[9eefda]358}
359;
[174e0e]360
[9eefda]361/** During DFS goes along unvisited bond and touches other atom.
362 * Sets bond::type, if
363 * -# BackEdge: set atom::LowpointNr and push on \a BackEdgeStack
364 * -# TreeEgde: set atom::Ancestor and continue with Walker along this edge
365 * Continue until molecule::FindNextUnused() finds no more unused bonds.
366 * \param *out output stream for debugging
367 * \param *mol molecule with atoms and finding unused bonds
368 * \param *&Binder current edge
369 * \param &DFS DFS accounting data
370 */
[e138de]371void DepthFirstSearchAnalysis_ProbeAlongUnusedBond(const molecule * const mol, atom *&Walker, bond *&Binder, struct DFSAccounting &DFS)
[174e0e]372{
373 atom *OtherAtom = NULL;
374
375 do { // (3) if Walker has no unused egdes, go to (5)
[9eefda]376 DFS.BackStepping = false; // reset backstepping flag for (8)
[174e0e]377 if (Binder == NULL) // if we don't just return from (11), Binder is already set to next unused
378 Binder = mol->FindNextUnused(Walker);
379 if (Binder == NULL)
380 break;
[a67d19]381 DoLog(2) && (Log() << Verbose(2) << "Current Unused Bond is " << *Binder << "." << endl);
[174e0e]382 // (4) Mark Binder used, ...
383 Binder->MarkUsed(black);
384 OtherAtom = Binder->GetOtherAtom(Walker);
[68f03d]385 DoLog(2) && (Log() << Verbose(2) << "(4) OtherAtom is " << OtherAtom->getName() << "." << endl);
[174e0e]386 if (OtherAtom->GraphNr != -1) {
387 // (4a) ... if "other" atom has been visited (GraphNr != 0), set lowpoint to minimum of both, go to (3)
388 Binder->Type = BackEdge;
[9eefda]389 DFS.BackEdgeStack->Push(Binder);
390 Walker->LowpointNr = (Walker->LowpointNr < OtherAtom->GraphNr) ? Walker->LowpointNr : OtherAtom->GraphNr;
[68f03d]391 DoLog(3) && (Log() << Verbose(3) << "(4a) Visited: Setting Lowpoint of Walker[" << Walker->getName() << "] to " << Walker->LowpointNr << "." << endl);
[174e0e]392 } else {
393 // (4b) ... otherwise set OtherAtom as Ancestor of Walker and Walker as OtherAtom, go to (2)
394 Binder->Type = TreeEdge;
395 OtherAtom->Ancestor = Walker;
396 Walker = OtherAtom;
[68f03d]397 DoLog(3) && (Log() << Verbose(3) << "(4b) Not Visited: OtherAtom[" << OtherAtom->getName() << "]'s Ancestor is now " << OtherAtom->Ancestor->getName() << ", Walker is OtherAtom " << OtherAtom->getName() << "." << endl);
[174e0e]398 break;
399 }
400 Binder = NULL;
[9eefda]401 } while (1); // (3)
402}
403;
[174e0e]404
[9eefda]405/** Checks whether we have a new component.
406 * if atom::LowpointNr of \a *&Walker is greater than atom::GraphNr of its atom::Ancestor, we have a new component.
407 * Meaning that if we touch upon a node who suddenly has a smaller atom::LowpointNr than its ancestor, then we
408 * have a found a new branch in the graph tree.
409 * \param *out output stream for debugging
410 * \param *mol molecule with atoms and finding unused bonds
411 * \param *&Walker current node
412 * \param &DFS DFS accounting data
413 */
[e138de]414void DepthFirstSearchAnalysis_CheckForaNewComponent(const molecule * const mol, atom *&Walker, struct DFSAccounting &DFS, MoleculeLeafClass *&LeafWalker)
[174e0e]415{
416 atom *OtherAtom = NULL;
417
418 // (5) if Ancestor of Walker is ...
[68f03d]419 DoLog(1) && (Log() << Verbose(1) << "(5) Number of Walker[" << Walker->getName() << "]'s Ancestor[" << Walker->Ancestor->getName() << "] is " << Walker->Ancestor->GraphNr << "." << endl);
[174e0e]420
[9eefda]421 if (Walker->Ancestor->GraphNr != DFS.Root->GraphNr) {
[174e0e]422 // (6) (Ancestor of Walker is not Root)
423 if (Walker->LowpointNr < Walker->Ancestor->GraphNr) {
424 // (6a) set Ancestor's Lowpoint number to minimum of of its Ancestor and itself, go to Step(8)
425 Walker->Ancestor->LowpointNr = (Walker->Ancestor->LowpointNr < Walker->LowpointNr) ? Walker->Ancestor->LowpointNr : Walker->LowpointNr;
[68f03d]426 DoLog(2) && (Log() << Verbose(2) << "(6) Setting Walker[" << Walker->getName() << "]'s Ancestor[" << Walker->Ancestor->getName() << "]'s Lowpoint to " << Walker->Ancestor->LowpointNr << "." << endl);
[174e0e]427 } else {
428 // (7) (Ancestor of Walker is a separating vertex, remove all from stack till Walker (including), these and Ancestor form a component
429 Walker->Ancestor->SeparationVertex = true;
[68f03d]430 DoLog(2) && (Log() << Verbose(2) << "(7) Walker[" << Walker->getName() << "]'s Ancestor[" << Walker->Ancestor->getName() << "]'s is a separating vertex, creating component." << endl);
[9eefda]431 mol->SetNextComponentNumber(Walker->Ancestor, DFS.ComponentNumber);
[68f03d]432 DoLog(3) && (Log() << Verbose(3) << "(7) Walker[" << Walker->getName() << "]'s Ancestor's Compont is " << DFS.ComponentNumber << "." << endl);
[9eefda]433 mol->SetNextComponentNumber(Walker, DFS.ComponentNumber);
[68f03d]434 DoLog(3) && (Log() << Verbose(3) << "(7) Walker[" << Walker->getName() << "]'s Compont is " << DFS.ComponentNumber << "." << endl);
[174e0e]435 do {
[9eefda]436 OtherAtom = DFS.AtomStack->PopLast();
[174e0e]437 LeafWalker->Leaf->AddCopyAtom(OtherAtom);
[9eefda]438 mol->SetNextComponentNumber(OtherAtom, DFS.ComponentNumber);
[68f03d]439 DoLog(3) && (Log() << Verbose(3) << "(7) Other[" << OtherAtom->getName() << "]'s Compont is " << DFS.ComponentNumber << "." << endl);
[174e0e]440 } while (OtherAtom != Walker);
[9eefda]441 DFS.ComponentNumber++;
[174e0e]442 }
443 // (8) Walker becomes its Ancestor, go to (3)
[68f03d]444 DoLog(2) && (Log() << Verbose(2) << "(8) Walker[" << Walker->getName() << "] is now its Ancestor " << Walker->Ancestor->getName() << ", backstepping. " << endl);
[174e0e]445 Walker = Walker->Ancestor;
[9eefda]446 DFS.BackStepping = true;
[174e0e]447 }
[9eefda]448}
449;
[174e0e]450
[9eefda]451/** Cleans the root stack when we have found a component.
452 * If we are not DFSAccounting::BackStepping, then we clear the root stack by putting everything into a
453 * component down till we meet DFSAccounting::Root.
454 * \param *out output stream for debugging
455 * \param *mol molecule with atoms and finding unused bonds
456 * \param *&Walker current node
457 * \param *&Binder current edge
458 * \param &DFS DFS accounting data
459 */
[e138de]460void DepthFirstSearchAnalysis_CleanRootStackDownTillWalker(const molecule * const mol, atom *&Walker, bond *&Binder, struct DFSAccounting &DFS, MoleculeLeafClass *&LeafWalker)
[174e0e]461{
462 atom *OtherAtom = NULL;
463
[9eefda]464 if (!DFS.BackStepping) { // coming from (8) want to go to (3)
[174e0e]465 // (9) remove all from stack till Walker (including), these and Root form a component
[99593f]466 //DFS.AtomStack->Output(out);
[9eefda]467 mol->SetNextComponentNumber(DFS.Root, DFS.ComponentNumber);
[68f03d]468 DoLog(3) && (Log() << Verbose(3) << "(9) Root[" << DFS.Root->getName() << "]'s Component is " << DFS.ComponentNumber << "." << endl);
[9eefda]469 mol->SetNextComponentNumber(Walker, DFS.ComponentNumber);
[68f03d]470 DoLog(3) && (Log() << Verbose(3) << "(9) Walker[" << Walker->getName() << "]'s Component is " << DFS.ComponentNumber << "." << endl);
[174e0e]471 do {
[9eefda]472 OtherAtom = DFS.AtomStack->PopLast();
[174e0e]473 LeafWalker->Leaf->AddCopyAtom(OtherAtom);
[9eefda]474 mol->SetNextComponentNumber(OtherAtom, DFS.ComponentNumber);
[68f03d]475 DoLog(3) && (Log() << Verbose(3) << "(7) Other[" << OtherAtom->getName() << "]'s Compont is " << DFS.ComponentNumber << "." << endl);
[174e0e]476 } while (OtherAtom != Walker);
[9eefda]477 DFS.ComponentNumber++;
[174e0e]478
479 // (11) Root is separation vertex, set Walker to Root and go to (4)
[9eefda]480 Walker = DFS.Root;
[174e0e]481 Binder = mol->FindNextUnused(Walker);
[68f03d]482 DoLog(1) && (Log() << Verbose(1) << "(10) Walker is Root[" << DFS.Root->getName() << "], next Unused Bond is " << Binder << "." << endl);
[174e0e]483 if (Binder != NULL) { // Root is separation vertex
[a67d19]484 DoLog(1) && (Log() << Verbose(1) << "(11) Root is a separation vertex." << endl);
[174e0e]485 Walker->SeparationVertex = true;
486 }
487 }
[9eefda]488}
489;
490
491/** Initializes DFSAccounting structure.
492 * \param *out output stream for debugging
493 * \param &DFS accounting structure to allocate
[7218f8]494 * \param *mol molecule with AtomCount, BondCount and all atoms
[9eefda]495 */
[e138de]496void DepthFirstSearchAnalysis_Init(struct DFSAccounting &DFS, const molecule * const mol)
[9eefda]497{
[ea7176]498 DFS.AtomStack = new StackClass<atom *> (mol->getAtomCount());
[9eefda]499 DFS.CurrentGraphNr = 0;
500 DFS.ComponentNumber = 0;
501 DFS.BackStepping = false;
[7218f8]502 mol->ResetAllBondsToUnused();
503 mol->SetAtomValueToValue(-1, &atom::GraphNr);
504 mol->ActOnAllAtoms(&atom::InitComponentNr);
505 DFS.BackEdgeStack->ClearStack();
[9eefda]506}
507;
[174e0e]508
[9eefda]509/** Free's DFSAccounting structure.
510 * \param *out output stream for debugging
511 * \param &DFS accounting structure to free
512 */
[e138de]513void DepthFirstSearchAnalysis_Finalize(struct DFSAccounting &DFS)
[9eefda]514{
515 delete (DFS.AtomStack);
[7218f8]516 // delete (DFS.BackEdgeStack); // DON'T free, see DepthFirstSearchAnalysis(), is returned as allocated
[9eefda]517}
518;
[174e0e]519
[cee0b57]520/** Performs a Depth-First search on this molecule.
521 * Marks bonds in molecule as cyclic, bridge, ... and atoms as
522 * articulations points, ...
523 * We use the algorithm from [Even, Graph Algorithms, p.62].
524 * \param *out output stream for debugging
525 * \param *&BackEdgeStack NULL pointer to StackClass with all the found back edges, allocated and filled on return
526 * \return list of each disconnected subgraph as an individual molecule class structure
527 */
[e138de]528MoleculeLeafClass * molecule::DepthFirstSearchAnalysis(class StackClass<bond *> *&BackEdgeStack) const
[cee0b57]529{
[9eefda]530 struct DFSAccounting DFS;
[cee0b57]531 BackEdgeStack = new StackClass<bond *> (BondCount);
[9eefda]532 DFS.BackEdgeStack = BackEdgeStack;
[cee0b57]533 MoleculeLeafClass *SubGraphs = new MoleculeLeafClass(NULL);
534 MoleculeLeafClass *LeafWalker = SubGraphs;
[9eefda]535 int OldGraphNr = 0;
[174e0e]536 atom *Walker = NULL;
[cee0b57]537 bond *Binder = NULL;
538
[a7b761b]539 if (getAtomCount() == 0)
[046783]540 return SubGraphs;
[a67d19]541 DoLog(0) && (Log() << Verbose(0) << "Begin of DepthFirstSearchAnalysis" << endl);
[e138de]542 DepthFirstSearchAnalysis_Init(DFS, this);
[cee0b57]543
[9879f6]544 for (molecule::const_iterator iter = begin(); iter != end();) {
545 DFS.Root = *iter;
[7218f8]546 // (1) mark all edges unused, empty stack, set atom->GraphNr = -1 for all
[9eefda]547 DFS.AtomStack->ClearStack();
[cee0b57]548
549 // put into new subgraph molecule and add this to list of subgraphs
550 LeafWalker = new MoleculeLeafClass(LeafWalker);
[5f612ee]551 LeafWalker->Leaf = World::getInstance().createMolecule();
[9eefda]552 LeafWalker->Leaf->AddCopyAtom(DFS.Root);
[cee0b57]553
[9eefda]554 OldGraphNr = DFS.CurrentGraphNr;
555 Walker = DFS.Root;
[cee0b57]556 do { // (10)
557 do { // (2) set number and Lowpoint of Atom to i, increase i, push current atom
[e138de]558 DepthFirstSearchAnalysis_SetWalkersGraphNr(Walker, DFS);
[174e0e]559
[e138de]560 DepthFirstSearchAnalysis_ProbeAlongUnusedBond(this, Walker, Binder, DFS);
[174e0e]561
[cee0b57]562 if (Binder == NULL) {
[a67d19]563 DoLog(2) && (Log() << Verbose(2) << "No more Unused Bonds." << endl);
[cee0b57]564 break;
565 } else
566 Binder = NULL;
[9eefda]567 } while (1); // (2)
[cee0b57]568
569 // if we came from backstepping, yet there were no more unused bonds, we end up here with no Ancestor, because Walker is Root! Then we are finished!
[9eefda]570 if ((Walker == DFS.Root) && (Binder == NULL))
[cee0b57]571 break;
572
[e138de]573 DepthFirstSearchAnalysis_CheckForaNewComponent(this, Walker, DFS, LeafWalker);
[174e0e]574
[e138de]575 DepthFirstSearchAnalysis_CleanRootStackDownTillWalker(this, Walker, Binder, DFS, LeafWalker);
[174e0e]576
[9eefda]577 } while ((DFS.BackStepping) || (Binder != NULL)); // (10) halt only if Root has no unused edges
[cee0b57]578
579 // From OldGraphNr to CurrentGraphNr ranges an disconnected subgraph
[a67d19]580 DoLog(0) && (Log() << Verbose(0) << "Disconnected subgraph ranges from " << OldGraphNr << " to " << DFS.CurrentGraphNr << "." << endl);
[e138de]581 LeafWalker->Leaf->Output((ofstream *)&cout);
[a67d19]582 DoLog(0) && (Log() << Verbose(0) << endl);
[cee0b57]583
584 // step on to next root
[9879f6]585 while ((iter != end()) && ((*iter)->GraphNr != -1)) {
586 //Log() << Verbose(1) << "Current next subgraph root candidate is " << (*iter)->Name << "." << endl;
587 if ((*iter)->GraphNr != -1) // if already discovered, step on
588 iter++;
[cee0b57]589 }
590 }
591 // set cyclic bond criterium on "same LP" basis
[266237]592 CyclicBondAnalysis();
593
[e138de]594 OutputGraphInfoPerAtom();
[266237]595
[e138de]596 OutputGraphInfoPerBond();
[266237]597
598 // free all and exit
[e138de]599 DepthFirstSearchAnalysis_Finalize(DFS);
[a67d19]600 DoLog(0) && (Log() << Verbose(0) << "End of DepthFirstSearchAnalysis" << endl);
[266237]601 return SubGraphs;
[9eefda]602}
603;
[266237]604
605/** Scans through all bonds and set bond::Cyclic to true where atom::LowpointNr of both ends is equal: LP criterion.
606 */
[fa649a]607void molecule::CyclicBondAnalysis() const
[266237]608{
609 NoCyclicBonds = 0;
[e08c46]610 for(molecule::const_iterator AtomRunner = begin(); AtomRunner != end(); ++AtomRunner)
611 for(BondList::const_iterator BondRunner = (*AtomRunner)->ListOfBonds.begin(); BondRunner != (*AtomRunner)->ListOfBonds.end(); ++BondRunner)
612 if ((*BondRunner)->leftatom == *AtomRunner)
613 if ((*BondRunner)->rightatom->LowpointNr == (*BondRunner)->leftatom->LowpointNr) { // cyclic ??
614 (*BondRunner)->Cyclic = true;
615 NoCyclicBonds++;
616 }
[9eefda]617}
618;
[cee0b57]619
[266237]620/** Output graph information per atom.
621 * \param *out output stream
622 */
[e138de]623void molecule::OutputGraphInfoPerAtom() const
[266237]624{
[a67d19]625 DoLog(1) && (Log() << Verbose(1) << "Final graph info for each atom is:" << endl);
[e138de]626 ActOnAllAtoms( &atom::OutputGraphInfo );
[9eefda]627}
628;
[cee0b57]629
[266237]630/** Output graph information per bond.
631 * \param *out output stream
632 */
[e138de]633void molecule::OutputGraphInfoPerBond() const
[266237]634{
[e08c46]635 bond *Binder = NULL;
[a67d19]636 DoLog(1) && (Log() << Verbose(1) << "Final graph info for each bond is:" << endl);
[e08c46]637 for(molecule::const_iterator AtomRunner = begin(); AtomRunner != end(); ++AtomRunner)
[bd6bfa]638 for(BondList::const_iterator BondRunner = (*AtomRunner)->ListOfBonds.begin(); BondRunner != (*AtomRunner)->ListOfBonds.end(); ++BondRunner)
[e08c46]639 if ((*BondRunner)->leftatom == *AtomRunner) {
640 Binder = *BondRunner;
641 DoLog(2) && (Log() << Verbose(2) << ((Binder->Type == TreeEdge) ? "TreeEdge " : "BackEdge ") << *Binder << ": <");
642 DoLog(0) && (Log() << Verbose(0) << ((Binder->leftatom->SeparationVertex) ? "SP," : "") << "L" << Binder->leftatom->LowpointNr << " G" << Binder->leftatom->GraphNr << " Comp.");
643 Binder->leftatom->OutputComponentNumber();
644 DoLog(0) && (Log() << Verbose(0) << " === ");
645 DoLog(0) && (Log() << Verbose(0) << ((Binder->rightatom->SeparationVertex) ? "SP," : "") << "L" << Binder->rightatom->LowpointNr << " G" << Binder->rightatom->GraphNr << " Comp.");
646 Binder->rightatom->OutputComponentNumber();
647 DoLog(0) && (Log() << Verbose(0) << ">." << endl);
648 if (Binder->Cyclic) // cyclic ??
649 DoLog(3) && (Log() << Verbose(3) << "Lowpoint at each side are equal: CYCLIC!" << endl);
650 }
[9eefda]651}
652;
653
654/** Initialise each vertex as white with no predecessor, empty queue, color Root lightgray.
655 * \param *out output stream for debugging
656 * \param &BFS accounting structure
657 * \param AtomCount number of entries in the array to allocate
658 */
[e138de]659void InitializeBFSAccounting(struct BFSAccounting &BFS, int AtomCount)
[9eefda]660{
661 BFS.AtomCount = AtomCount;
[920c70]662 BFS.PredecessorList = new atom*[AtomCount];
663 BFS.ShortestPathList = new int[AtomCount];
664 BFS.ColorList = new enum Shading[AtomCount];
[9eefda]665 BFS.BFSStack = new StackClass<atom *> (AtomCount);
666
[920c70]667 for (int i = AtomCount; i--;) {
[9eefda]668 BFS.ShortestPathList[i] = -1;
[920c70]669 BFS.PredecessorList[i] = 0;
670 }
[cee0b57]671};
672
[9eefda]673/** Free's accounting structure.
674 * \param *out output stream for debugging
675 * \param &BFS accounting structure
676 */
[e138de]677void FinalizeBFSAccounting(struct BFSAccounting &BFS)
[9eefda]678{
[920c70]679 delete[](BFS.PredecessorList);
680 delete[](BFS.ShortestPathList);
681 delete[](BFS.ColorList);
[9eefda]682 delete (BFS.BFSStack);
683 BFS.AtomCount = 0;
684};
685
686/** Clean the accounting structure.
687 * \param *out output stream for debugging
688 * \param &BFS accounting structure
[ef9aae]689 */
[e138de]690void CleanBFSAccounting(struct BFSAccounting &BFS)
[ef9aae]691{
[9eefda]692 atom *Walker = NULL;
693 while (!BFS.TouchedStack->IsEmpty()) {
694 Walker = BFS.TouchedStack->PopFirst();
695 BFS.PredecessorList[Walker->nr] = NULL;
696 BFS.ShortestPathList[Walker->nr] = -1;
697 BFS.ColorList[Walker->nr] = white;
[ef9aae]698 }
699};
700
[9eefda]701/** Resets shortest path list and BFSStack.
702 * \param *out output stream for debugging
703 * \param *&Walker current node, pushed onto BFSAccounting::BFSStack and BFSAccounting::TouchedStack
704 * \param &BFS accounting structure
705 */
[e138de]706void ResetBFSAccounting(atom *&Walker, struct BFSAccounting &BFS)
[ef9aae]707{
[9eefda]708 BFS.ShortestPathList[Walker->nr] = 0;
709 BFS.BFSStack->ClearStack(); // start with empty BFS stack
710 BFS.BFSStack->Push(Walker);
711 BFS.TouchedStack->Push(Walker);
[ef9aae]712};
713
[9eefda]714/** Performs a BFS from \a *Root, trying to find the same node and hence a cycle.
715 * \param *out output stream for debugging
716 * \param *&BackEdge the edge from root that we don't want to move along
717 * \param &BFS accounting structure
718 */
[e138de]719void CyclicStructureAnalysis_CyclicBFSFromRootToRoot(bond *&BackEdge, struct BFSAccounting &BFS)
[ef9aae]720{
721 atom *Walker = NULL;
722 atom *OtherAtom = NULL;
[9eefda]723 do { // look for Root
724 Walker = BFS.BFSStack->PopFirst();
[a67d19]725 DoLog(2) && (Log() << Verbose(2) << "Current Walker is " << *Walker << ", we look for SP to Root " << *BFS.Root << "." << endl);
[ef9aae]726 for (BondList::const_iterator Runner = Walker->ListOfBonds.begin(); Runner != Walker->ListOfBonds.end(); (++Runner)) {
727 if ((*Runner) != BackEdge) { // only walk along DFS spanning tree (otherwise we always find SP of one being backedge Binder)
728 OtherAtom = (*Runner)->GetOtherAtom(Walker);
[9eefda]729#ifdef ADDHYDROGEN
[ef9aae]730 if (OtherAtom->type->Z != 1) {
[9eefda]731#endif
[68f03d]732 DoLog(2) && (Log() << Verbose(2) << "Current OtherAtom is: " << OtherAtom->getName() << " for bond " << *(*Runner) << "." << endl);
[9eefda]733 if (BFS.ColorList[OtherAtom->nr] == white) {
734 BFS.TouchedStack->Push(OtherAtom);
735 BFS.ColorList[OtherAtom->nr] = lightgray;
736 BFS.PredecessorList[OtherAtom->nr] = Walker; // Walker is the predecessor
737 BFS.ShortestPathList[OtherAtom->nr] = BFS.ShortestPathList[Walker->nr] + 1;
[68f03d]738 DoLog(2) && (Log() << Verbose(2) << "Coloring OtherAtom " << OtherAtom->getName() << " lightgray, its predecessor is " << Walker->getName() << " and its Shortest Path is " << BFS.ShortestPathList[OtherAtom->nr] << " egde(s) long." << endl);
[9eefda]739 //if (BFS.ShortestPathList[OtherAtom->nr] < MinimumRingSize[Walker->GetTrueFather()->nr]) { // Check for maximum distance
[a67d19]740 DoLog(3) && (Log() << Verbose(3) << "Putting OtherAtom into queue." << endl);
[9eefda]741 BFS.BFSStack->Push(OtherAtom);
742 //}
[ef9aae]743 } else {
[a67d19]744 DoLog(3) && (Log() << Verbose(3) << "Not Adding, has already been visited." << endl);
[ef9aae]745 }
[9eefda]746 if (OtherAtom == BFS.Root)
747 break;
748#ifdef ADDHYDROGEN
749 } else {
[a67d19]750 DoLog(2) && (Log() << Verbose(2) << "Skipping hydrogen atom " << *OtherAtom << "." << endl);
[9eefda]751 BFS.ColorList[OtherAtom->nr] = black;
752 }
753#endif
[ef9aae]754 } else {
[a67d19]755 DoLog(2) && (Log() << Verbose(2) << "Bond " << *(*Runner) << " not Visiting, is the back edge." << endl);
[ef9aae]756 }
757 }
[9eefda]758 BFS.ColorList[Walker->nr] = black;
[68f03d]759 DoLog(1) && (Log() << Verbose(1) << "Coloring Walker " << Walker->getName() << " black." << endl);
[9eefda]760 if (OtherAtom == BFS.Root) { // if we have found the root, check whether this cycle wasn't already found beforehand
[ef9aae]761 // step through predecessor list
762 while (OtherAtom != BackEdge->rightatom) {
[9eefda]763 if (!OtherAtom->GetTrueFather()->IsCyclic) // if one bond in the loop is not marked as cyclic, we haven't found this cycle yet
[ef9aae]764 break;
765 else
[9eefda]766 OtherAtom = BFS.PredecessorList[OtherAtom->nr];
[ef9aae]767 }
768 if (OtherAtom == BackEdge->rightatom) { // if each atom in found cycle is cyclic, loop's been found before already
[a67d19]769 DoLog(3) && (Log() << Verbose(3) << "This cycle was already found before, skipping and removing seeker from search." << endl);
[ef9aae]770 do {
[9eefda]771 OtherAtom = BFS.TouchedStack->PopLast();
772 if (BFS.PredecessorList[OtherAtom->nr] == Walker) {
[a67d19]773 DoLog(4) && (Log() << Verbose(4) << "Removing " << *OtherAtom << " from lists and stacks." << endl);
[9eefda]774 BFS.PredecessorList[OtherAtom->nr] = NULL;
775 BFS.ShortestPathList[OtherAtom->nr] = -1;
776 BFS.ColorList[OtherAtom->nr] = white;
777 BFS.BFSStack->RemoveItem(OtherAtom);
[ef9aae]778 }
[9eefda]779 } while ((!BFS.TouchedStack->IsEmpty()) && (BFS.PredecessorList[OtherAtom->nr] == NULL));
780 BFS.TouchedStack->Push(OtherAtom); // last was wrongly popped
[ef9aae]781 OtherAtom = BackEdge->rightatom; // set to not Root
782 } else
[9eefda]783 OtherAtom = BFS.Root;
[ef9aae]784 }
[9eefda]785 } while ((!BFS.BFSStack->IsEmpty()) && (OtherAtom != BFS.Root) && (OtherAtom != NULL)); // || (ShortestPathList[OtherAtom->nr] < MinimumRingSize[Walker->GetTrueFather()->nr])));
[ef9aae]786};
787
[9eefda]788/** Climb back the BFSAccounting::PredecessorList and find cycle members.
789 * \param *out output stream for debugging
790 * \param *&OtherAtom
791 * \param *&BackEdge denotes the edge we did not want to travel along when doing CyclicBFSFromRootToRoot()
792 * \param &BFS accounting structure
793 * \param *&MinimumRingSize minimum distance from this node possible without encountering oneself, set on return for each atom
794 * \param &MinRingSize global minimum distance from one node without encountering oneself, set on return
795 */
[e138de]796void CyclicStructureAnalysis_RetrieveCycleMembers(atom *&OtherAtom, bond *&BackEdge, struct BFSAccounting &BFS, int *&MinimumRingSize, int &MinRingSize)
[ef9aae]797{
798 atom *Walker = NULL;
799 int NumCycles = 0;
800 int RingSize = -1;
801
[9eefda]802 if (OtherAtom == BFS.Root) {
[ef9aae]803 // now climb back the predecessor list and thus find the cycle members
804 NumCycles++;
805 RingSize = 1;
[9eefda]806 BFS.Root->GetTrueFather()->IsCyclic = true;
[a67d19]807 DoLog(1) && (Log() << Verbose(1) << "Found ring contains: ");
[9eefda]808 Walker = BFS.Root;
[ef9aae]809 while (Walker != BackEdge->rightatom) {
[68f03d]810 DoLog(0) && (Log() << Verbose(0) << Walker->getName() << " <-> ");
[9eefda]811 Walker = BFS.PredecessorList[Walker->nr];
[ef9aae]812 Walker->GetTrueFather()->IsCyclic = true;
813 RingSize++;
814 }
[68f03d]815 DoLog(0) && (Log() << Verbose(0) << Walker->getName() << " with a length of " << RingSize << "." << endl << endl);
[ef9aae]816 // walk through all and set MinimumRingSize
[9eefda]817 Walker = BFS.Root;
[ef9aae]818 MinimumRingSize[Walker->GetTrueFather()->nr] = RingSize;
819 while (Walker != BackEdge->rightatom) {
[9eefda]820 Walker = BFS.PredecessorList[Walker->nr];
[ef9aae]821 if (RingSize < MinimumRingSize[Walker->GetTrueFather()->nr])
822 MinimumRingSize[Walker->GetTrueFather()->nr] = RingSize;
823 }
824 if ((RingSize < MinRingSize) || (MinRingSize == -1))
825 MinRingSize = RingSize;
826 } else {
[a67d19]827 DoLog(1) && (Log() << Verbose(1) << "No ring containing " << *BFS.Root << " with length equal to or smaller than " << MinimumRingSize[Walker->GetTrueFather()->nr] << " found." << endl);
[ef9aae]828 }
829};
830
[9eefda]831/** From a given node performs a BFS to touch the next cycle, for whose nodes \a *&MinimumRingSize is set and set it accordingly.
832 * \param *out output stream for debugging
833 * \param *&Root node to look for closest cycle from, i.e. \a *&MinimumRingSize is set for this node
834 * \param *&MinimumRingSize minimum distance from this node possible without encountering oneself, set on return for each atom
835 * \param AtomCount number of nodes in graph
836 */
[e138de]837void CyclicStructureAnalysis_BFSToNextCycle(atom *&Root, atom *&Walker, int *&MinimumRingSize, int AtomCount)
[ef9aae]838{
[9eefda]839 struct BFSAccounting BFS;
[ef9aae]840 atom *OtherAtom = Walker;
841
[e138de]842 InitializeBFSAccounting(BFS, AtomCount);
[ef9aae]843
[e138de]844 ResetBFSAccounting(Walker, BFS);
[9eefda]845 while (OtherAtom != NULL) { // look for Root
846 Walker = BFS.BFSStack->PopFirst();
[e138de]847 //Log() << Verbose(2) << "Current Walker is " << *Walker << ", we look for SP to Root " << *Root << "." << endl;
[ef9aae]848 for (BondList::const_iterator Runner = Walker->ListOfBonds.begin(); Runner != Walker->ListOfBonds.end(); (++Runner)) {
[9eefda]849 // "removed (*Runner) != BackEdge) || " from next if, is u
850 if ((Walker->ListOfBonds.size() == 1)) { // only walk along DFS spanning tree (otherwise we always find SP of 1 being backedge Binder), but terminal hydrogens may be connected via backedge, hence extra check
[ef9aae]851 OtherAtom = (*Runner)->GetOtherAtom(Walker);
[e138de]852 //Log() << Verbose(2) << "Current OtherAtom is: " << OtherAtom->Name << " for bond " << *Binder << "." << endl;
[9eefda]853 if (BFS.ColorList[OtherAtom->nr] == white) {
854 BFS.TouchedStack->Push(OtherAtom);
855 BFS.ColorList[OtherAtom->nr] = lightgray;
856 BFS.PredecessorList[OtherAtom->nr] = Walker; // Walker is the predecessor
857 BFS.ShortestPathList[OtherAtom->nr] = BFS.ShortestPathList[Walker->nr] + 1;
[e138de]858 //Log() << Verbose(2) << "Coloring OtherAtom " << OtherAtom->Name << " lightgray, its predecessor is " << Walker->Name << " and its Shortest Path is " << ShortestPathList[OtherAtom->nr] << " egde(s) long." << endl;
[ef9aae]859 if (OtherAtom->GetTrueFather()->IsCyclic) { // if the other atom is connected to a ring
[9eefda]860 MinimumRingSize[Root->GetTrueFather()->nr] = BFS.ShortestPathList[OtherAtom->nr] + MinimumRingSize[OtherAtom->GetTrueFather()->nr];
[ef9aae]861 OtherAtom = NULL; //break;
862 break;
863 } else
[9eefda]864 BFS.BFSStack->Push(OtherAtom);
[ef9aae]865 } else {
[e138de]866 //Log() << Verbose(3) << "Not Adding, has already been visited." << endl;
[ef9aae]867 }
868 } else {
[e138de]869 //Log() << Verbose(3) << "Not Visiting, is a back edge." << endl;
[ef9aae]870 }
871 }
[9eefda]872 BFS.ColorList[Walker->nr] = black;
[e138de]873 //Log() << Verbose(1) << "Coloring Walker " << Walker->Name << " black." << endl;
[ef9aae]874 }
875 //CleanAccountingLists(TouchedStack, PredecessorList, ShortestPathList, ColorList);
876
[e138de]877 FinalizeBFSAccounting(BFS);
[9eefda]878}
879;
[ef9aae]880
[9eefda]881/** All nodes that are not in cycles get assigned a \a *&MinimumRingSizeby BFS to next cycle.
882 * \param *out output stream for debugging
883 * \param *&MinimumRingSize array with minimum distance without encountering onself for each atom
884 * \param &MinRingSize global minium distance
885 * \param &NumCyles number of cycles in graph
886 * \param *mol molecule with atoms
887 */
[e138de]888void CyclicStructureAnalysis_AssignRingSizetoNonCycleMembers(int *&MinimumRingSize, int &MinRingSize, int &NumCycles, const molecule * const mol)
[ef9aae]889{
[9eefda]890 atom *Root = NULL;
[ef9aae]891 atom *Walker = NULL;
892 if (MinRingSize != -1) { // if rings are present
893 // go over all atoms
[9879f6]894 for (molecule::const_iterator iter = mol->begin(); iter != mol->end(); ++iter) {
895 Root = *iter;
[ef9aae]896
[ea7176]897 if (MinimumRingSize[Root->GetTrueFather()->nr] == mol->getAtomCount()) { // check whether MinimumRingSize is set, if not BFS to next where it is
[ef9aae]898 Walker = Root;
899
[e138de]900 //Log() << Verbose(1) << "---------------------------------------------------------------------------------------------------------" << endl;
[ea7176]901 CyclicStructureAnalysis_BFSToNextCycle(Root, Walker, MinimumRingSize, mol->getAtomCount());
[ef9aae]902
903 }
[a67d19]904 DoLog(1) && (Log() << Verbose(1) << "Minimum ring size of " << *Root << " is " << MinimumRingSize[Root->GetTrueFather()->nr] << "." << endl);
[ef9aae]905 }
[a67d19]906 DoLog(1) && (Log() << Verbose(1) << "Minimum ring size is " << MinRingSize << ", over " << NumCycles << " cycles total." << endl);
[ef9aae]907 } else
[a67d19]908 DoLog(1) && (Log() << Verbose(1) << "No rings were detected in the molecular structure." << endl);
[9eefda]909}
910;
[ef9aae]911
[cee0b57]912/** Analyses the cycles found and returns minimum of all cycle lengths.
913 * We begin with a list of Back edges found during DepthFirstSearchAnalysis(). We go through this list - one end is the Root,
914 * the other our initial Walker - and do a Breadth First Search for the Root. We mark down each Predecessor and as soon as
915 * we have found the Root via BFS, we may climb back the closed cycle via the Predecessors. Thereby we mark atoms and bonds
916 * as cyclic and print out the cycles.
917 * \param *out output stream for debugging
918 * \param *BackEdgeStack stack with all back edges found during DFS scan. Beware: This stack contains the bonds from the total molecule, not from the subgraph!
919 * \param *&MinimumRingSize contains smallest ring size in molecular structure on return or -1 if no rings were found, if set is maximum search distance
920 * \todo BFS from the not-same-LP to find back to starting point of tributary cycle over more than one bond
921 */
[e138de]922void molecule::CyclicStructureAnalysis(class StackClass<bond *> * BackEdgeStack, int *&MinimumRingSize) const
[cee0b57]923{
[9eefda]924 struct BFSAccounting BFS;
[ef9aae]925 atom *Walker = NULL;
926 atom *OtherAtom = NULL;
927 bond *BackEdge = NULL;
928 int NumCycles = 0;
929 int MinRingSize = -1;
[cee0b57]930
[ea7176]931 InitializeBFSAccounting(BFS, getAtomCount());
[cee0b57]932
[e138de]933 //Log() << Verbose(1) << "Back edge list - ";
[99593f]934 //BackEdgeStack->Output(out);
[cee0b57]935
[a67d19]936 DoLog(1) && (Log() << Verbose(1) << "Analysing cycles ... " << endl);
[cee0b57]937 NumCycles = 0;
938 while (!BackEdgeStack->IsEmpty()) {
939 BackEdge = BackEdgeStack->PopFirst();
940 // this is the target
[9eefda]941 BFS.Root = BackEdge->leftatom;
[cee0b57]942 // this is the source point
943 Walker = BackEdge->rightatom;
944
[e138de]945 ResetBFSAccounting(Walker, BFS);
[cee0b57]946
[a67d19]947 DoLog(1) && (Log() << Verbose(1) << "---------------------------------------------------------------------------------------------------------" << endl);
[ef9aae]948 OtherAtom = NULL;
[e138de]949 CyclicStructureAnalysis_CyclicBFSFromRootToRoot(BackEdge, BFS);
[cee0b57]950
[e138de]951 CyclicStructureAnalysis_RetrieveCycleMembers(OtherAtom, BackEdge, BFS, MinimumRingSize, MinRingSize);
[cee0b57]952
[e138de]953 CleanBFSAccounting(BFS);
[ef9aae]954 }
[e138de]955 FinalizeBFSAccounting(BFS);
[ef9aae]956
[e138de]957 CyclicStructureAnalysis_AssignRingSizetoNonCycleMembers(MinimumRingSize, MinRingSize, NumCycles, this);
[fa649a]958};
[cee0b57]959
960/** Sets the next component number.
961 * This is O(N) as the number of bonds per atom is bound.
962 * \param *vertex atom whose next atom::*ComponentNr is to be set
963 * \param nr number to use
964 */
[fa649a]965void molecule::SetNextComponentNumber(atom *vertex, int nr) const
[cee0b57]966{
[9eefda]967 size_t i = 0;
[cee0b57]968 if (vertex != NULL) {
[9eefda]969 for (; i < vertex->ListOfBonds.size(); i++) {
970 if (vertex->ComponentNr[i] == -1) { // check if not yet used
[cee0b57]971 vertex->ComponentNr[i] = nr;
972 break;
[9eefda]973 } else if (vertex->ComponentNr[i] == nr) // if number is already present, don't add another time
974 break; // breaking here will not cause error!
[cee0b57]975 }
[e359a8]976 if (i == vertex->ListOfBonds.size()) {
[58ed4a]977 DoeLog(0) && (eLog()<< Verbose(0) << "Error: All Component entries are already occupied!" << endl);
[e359a8]978 performCriticalExit();
979 }
980 } else {
[58ed4a]981 DoeLog(0) && (eLog()<< Verbose(0) << "Error: Given vertex is NULL!" << endl);
[e359a8]982 performCriticalExit();
983 }
[9eefda]984}
985;
[cee0b57]986
987/** Returns next unused bond for this atom \a *vertex or NULL of none exists.
988 * \param *vertex atom to regard
989 * \return bond class or NULL
990 */
[fa649a]991bond * molecule::FindNextUnused(atom *vertex) const
[cee0b57]992{
[266237]993 for (BondList::const_iterator Runner = vertex->ListOfBonds.begin(); Runner != vertex->ListOfBonds.end(); (++Runner))
994 if ((*Runner)->IsUsed() == white)
[9eefda]995 return ((*Runner));
[cee0b57]996 return NULL;
[9eefda]997}
998;
[cee0b57]999
1000/** Resets bond::Used flag of all bonds in this molecule.
1001 * \return true - success, false - -failure
1002 */
[fa649a]1003void molecule::ResetAllBondsToUnused() const
[cee0b57]1004{
[e08c46]1005 for(molecule::const_iterator AtomRunner = begin(); AtomRunner != end(); ++AtomRunner)
1006 for(BondList::const_iterator BondRunner = (*AtomRunner)->ListOfBonds.begin(); BondRunner != (*AtomRunner)->ListOfBonds.end(); ++BondRunner)
1007 if ((*BondRunner)->leftatom == *AtomRunner)
1008 (*BondRunner)->ResetUsed();
[9eefda]1009}
1010;
[cee0b57]1011
1012/** Output a list of flags, stating whether the bond was visited or not.
1013 * \param *out output stream for debugging
1014 * \param *list
1015 */
[e138de]1016void OutputAlreadyVisited(int *list)
[cee0b57]1017{
[a67d19]1018 DoLog(4) && (Log() << Verbose(4) << "Already Visited Bonds:\t");
[9eefda]1019 for (int i = 1; i <= list[0]; i++)
[a67d19]1020 DoLog(0) && (Log() << Verbose(0) << list[i] << " ");
1021 DoLog(0) && (Log() << Verbose(0) << endl);
[9eefda]1022}
1023;
[cee0b57]1024
1025/** Storing the bond structure of a molecule to file.
1026 * Simply stores Atom::nr and then the Atom::nr of all bond partners per line.
[35b698]1027 * \param &filename name of file
1028 * \param path path to file, defaults to empty
[cee0b57]1029 * \return true - file written successfully, false - writing failed
1030 */
[35b698]1031bool molecule::StoreAdjacencyToFile(std::string &filename, std::string path)
[cee0b57]1032{
1033 ofstream AdjacencyFile;
[35b698]1034 string line;
[cee0b57]1035 bool status = true;
1036
[35b698]1037 if (path != "")
1038 line = path + "/" + filename;
[8ab0407]1039 else
[35b698]1040 line = filename;
1041 AdjacencyFile.open(line.c_str(), ios::out);
[acf800]1042 DoLog(1) && (Log() << Verbose(1) << "Saving adjacency list ... " << endl);
[35b698]1043 if (AdjacencyFile.good()) {
[1f1b23]1044 AdjacencyFile << "m\tn" << endl;
[9eefda]1045 ActOnAllAtoms(&atom::OutputAdjacency, &AdjacencyFile);
[cee0b57]1046 AdjacencyFile.close();
[acf800]1047 DoLog(1) && (Log() << Verbose(1) << "\t... done." << endl);
[cee0b57]1048 } else {
[35b698]1049 DoLog(1) && (Log() << Verbose(1) << "\t... failed to open file " << line << "." << endl);
[cee0b57]1050 status = false;
1051 }
1052
1053 return status;
[9eefda]1054}
1055;
[cee0b57]1056
[1f1b23]1057/** Storing the bond structure of a molecule to file.
1058 * Simply stores Atom::nr and then the Atom::nr of all bond partners, one per line.
[35b698]1059 * \param &filename name of file
1060 * \param path path to file, defaults to empty
[1f1b23]1061 * \return true - file written successfully, false - writing failed
1062 */
[35b698]1063bool molecule::StoreBondsToFile(std::string &filename, std::string path)
[1f1b23]1064{
1065 ofstream BondFile;
[35b698]1066 string line;
[1f1b23]1067 bool status = true;
1068
[35b698]1069 if (path != "")
1070 line = path + "/" + filename;
[8ab0407]1071 else
[35b698]1072 line = filename;
1073 BondFile.open(line.c_str(), ios::out);
[acf800]1074 DoLog(1) && (Log() << Verbose(1) << "Saving adjacency list ... " << endl);
[35b698]1075 if (BondFile.good()) {
[1f1b23]1076 BondFile << "m\tn" << endl;
1077 ActOnAllAtoms(&atom::OutputBonds, &BondFile);
1078 BondFile.close();
[acf800]1079 DoLog(1) && (Log() << Verbose(1) << "\t... done." << endl);
[1f1b23]1080 } else {
[35b698]1081 DoLog(1) && (Log() << Verbose(1) << "\t... failed to open file " << line << "." << endl);
[1f1b23]1082 status = false;
1083 }
1084
1085 return status;
1086}
1087;
1088
[35b698]1089bool CheckAdjacencyFileAgainstMolecule_Init(std::string &path, ifstream &File, int *&CurrentBonds)
[ba4170]1090{
[35b698]1091 string filename;
1092 filename = path + ADJACENCYFILE;
1093 File.open(filename.c_str(), ios::out);
[0de7e8]1094 DoLog(1) && (Log() << Verbose(1) << "Looking at bond structure stored in adjacency file and comparing to present one ... " << endl);
[35b698]1095 if (File.fail())
[ba4170]1096 return false;
1097
1098 // allocate storage structure
[920c70]1099 CurrentBonds = new int[8]; // contains parsed bonds of current atom
1100 for(int i=0;i<8;i++)
1101 CurrentBonds[i] = 0;
[ba4170]1102 return true;
[9eefda]1103}
1104;
[ba4170]1105
[e138de]1106void CheckAdjacencyFileAgainstMolecule_Finalize(ifstream &File, int *&CurrentBonds)
[ba4170]1107{
1108 File.close();
1109 File.clear();
[920c70]1110 delete[](CurrentBonds);
[9eefda]1111}
1112;
[ba4170]1113
[e138de]1114void CheckAdjacencyFileAgainstMolecule_CompareBonds(bool &status, int &NonMatchNumber, atom *&Walker, size_t &CurrentBondsOfAtom, int AtomNr, int *&CurrentBonds, atom **ListOfAtoms)
[ba4170]1115{
1116 size_t j = 0;
1117 int id = -1;
1118
[e138de]1119 //Log() << Verbose(2) << "Walker is " << *Walker << ", bond partners: ";
[ba4170]1120 if (CurrentBondsOfAtom == Walker->ListOfBonds.size()) {
1121 for (BondList::const_iterator Runner = Walker->ListOfBonds.begin(); Runner != Walker->ListOfBonds.end(); (++Runner)) {
1122 id = (*Runner)->GetOtherAtom(Walker)->nr;
1123 j = 0;
[9eefda]1124 for (; (j < CurrentBondsOfAtom) && (CurrentBonds[j++] != id);)
[ba4170]1125 ; // check against all parsed bonds
[9eefda]1126 if (CurrentBonds[j - 1] != id) { // no match ? Then mark in ListOfAtoms
[ba4170]1127 ListOfAtoms[AtomNr] = NULL;
1128 NonMatchNumber++;
1129 status = false;
[0de7e8]1130 DoeLog(2) && (eLog() << Verbose(2) << id << " can not be found in list." << endl);
[ba4170]1131 } else {
[0de7e8]1132 //Log() << Verbose(0) << "[" << id << "]\t";
[ba4170]1133 }
1134 }
[e138de]1135 //Log() << Verbose(0) << endl;
[ba4170]1136 } else {
[a67d19]1137 DoLog(0) && (Log() << Verbose(0) << "Number of bonds for Atom " << *Walker << " does not match, parsed " << CurrentBondsOfAtom << " against " << Walker->ListOfBonds.size() << "." << endl);
[ba4170]1138 status = false;
1139 }
[9eefda]1140}
1141;
[ba4170]1142
[cee0b57]1143/** Checks contents of adjacency file against bond structure in structure molecule.
1144 * \param *out output stream for debugging
1145 * \param *path path to file
1146 * \param **ListOfAtoms allocated (molecule::AtomCount) and filled lookup table for ids (Atom::nr) to *Atom
1147 * \return true - structure is equal, false - not equivalence
1148 */
[35b698]1149bool molecule::CheckAdjacencyFileAgainstMolecule(std::string &path, atom **ListOfAtoms)
[cee0b57]1150{
1151 ifstream File;
1152 bool status = true;
[266237]1153 atom *Walker = NULL;
[ba4170]1154 int *CurrentBonds = NULL;
[9eefda]1155 int NonMatchNumber = 0; // will number of atoms with differing bond structure
[ba4170]1156 size_t CurrentBondsOfAtom = -1;
[0de7e8]1157 const int AtomCount = getAtomCount();
[cee0b57]1158
[e138de]1159 if (!CheckAdjacencyFileAgainstMolecule_Init(path, File, CurrentBonds)) {
[a67d19]1160 DoLog(1) && (Log() << Verbose(1) << "Adjacency file not found." << endl);
[ba4170]1161 return true;
1162 }
1163
[920c70]1164 char buffer[MAXSTRINGSIZE];
[ba4170]1165 // Parse the file line by line and count the bonds
1166 while (!File.eof()) {
1167 File.getline(buffer, MAXSTRINGSIZE);
1168 stringstream line;
1169 line.str(buffer);
1170 int AtomNr = -1;
1171 line >> AtomNr;
1172 CurrentBondsOfAtom = -1; // we count one too far due to line end
1173 // parse into structure
[0de7e8]1174 if ((AtomNr >= 0) && (AtomNr < AtomCount)) {
[ba4170]1175 Walker = ListOfAtoms[AtomNr];
1176 while (!line.eof())
[9eefda]1177 line >> CurrentBonds[++CurrentBondsOfAtom];
[ba4170]1178 // compare against present bonds
[e138de]1179 CheckAdjacencyFileAgainstMolecule_CompareBonds(status, NonMatchNumber, Walker, CurrentBondsOfAtom, AtomNr, CurrentBonds, ListOfAtoms);
[0de7e8]1180 } else {
1181 if (AtomNr != -1)
1182 DoeLog(2) && (eLog() << Verbose(2) << AtomNr << " is not valid in the range of ids [" << 0 << "," << AtomCount << ")." << endl);
[ba4170]1183 }
[cee0b57]1184 }
[e138de]1185 CheckAdjacencyFileAgainstMolecule_Finalize(File, CurrentBonds);
[cee0b57]1186
[ba4170]1187 if (status) { // if equal we parse the KeySetFile
[a67d19]1188 DoLog(1) && (Log() << Verbose(1) << "done: Equal." << endl);
[ba4170]1189 } else
[a67d19]1190 DoLog(1) && (Log() << Verbose(1) << "done: Not equal by " << NonMatchNumber << " atoms." << endl);
[cee0b57]1191 return status;
[9eefda]1192}
1193;
[cee0b57]1194
1195/** Picks from a global stack with all back edges the ones in the fragment.
1196 * \param *out output stream for debugging
1197 * \param **ListOfLocalAtoms array of father atom::nr to local atom::nr (reverse of atom::father)
1198 * \param *ReferenceStack stack with all the back egdes
1199 * \param *LocalStack stack to be filled
1200 * \return true - everything ok, false - ReferenceStack was empty
1201 */
[e138de]1202bool molecule::PickLocalBackEdges(atom **ListOfLocalAtoms, class StackClass<bond *> *&ReferenceStack, class StackClass<bond *> *&LocalStack) const
[cee0b57]1203{
1204 bool status = true;
1205 if (ReferenceStack->IsEmpty()) {
[a67d19]1206 DoLog(1) && (Log() << Verbose(1) << "ReferenceStack is empty!" << endl);
[cee0b57]1207 return false;
1208 }
1209 bond *Binder = ReferenceStack->PopFirst();
[9eefda]1210 bond *FirstBond = Binder; // mark the first bond, so that we don't loop through the stack indefinitely
[cee0b57]1211 atom *Walker = NULL, *OtherAtom = NULL;
1212 ReferenceStack->Push(Binder);
1213
[9eefda]1214 do { // go through all bonds and push local ones
1215 Walker = ListOfLocalAtoms[Binder->leftatom->nr]; // get one atom in the reference molecule
[cee0b57]1216 if (Walker != NULL) // if this Walker exists in the subgraph ...
[266237]1217 for (BondList::const_iterator Runner = Walker->ListOfBonds.begin(); Runner != Walker->ListOfBonds.end(); (++Runner)) {
1218 OtherAtom = (*Runner)->GetOtherAtom(Walker);
1219 if (OtherAtom == ListOfLocalAtoms[(*Runner)->rightatom->nr]) { // found the bond
1220 LocalStack->Push((*Runner));
[a67d19]1221 DoLog(3) && (Log() << Verbose(3) << "Found local edge " << *(*Runner) << "." << endl);
[cee0b57]1222 break;
1223 }
1224 }
[9eefda]1225 Binder = ReferenceStack->PopFirst(); // loop the stack for next item
[a67d19]1226 DoLog(3) && (Log() << Verbose(3) << "Current candidate edge " << Binder << "." << endl);
[cee0b57]1227 ReferenceStack->Push(Binder);
1228 } while (FirstBond != Binder);
1229
1230 return status;
[9eefda]1231}
1232;
[ce7cc5]1233
1234void BreadthFirstSearchAdd_Init(struct BFSAccounting &BFS, atom *&Root, int AtomCount, int BondOrder, atom **AddedAtomList = NULL)
1235{
1236 BFS.AtomCount = AtomCount;
1237 BFS.BondOrder = BondOrder;
[920c70]1238 BFS.PredecessorList = new atom*[AtomCount];
1239 BFS.ShortestPathList = new int[AtomCount];
1240 BFS.ColorList = new enum Shading[AtomCount];
[9eefda]1241 BFS.BFSStack = new StackClass<atom *> (AtomCount);
[ce7cc5]1242
1243 BFS.Root = Root;
[9eefda]1244 BFS.BFSStack->ClearStack();
1245 BFS.BFSStack->Push(Root);
[ce7cc5]1246
1247 // initialise each vertex as white with no predecessor, empty queue, color Root lightgray
[9eefda]1248 for (int i = AtomCount; i--;) {
[920c70]1249 BFS.PredecessorList[i] = NULL;
[ce7cc5]1250 BFS.ShortestPathList[i] = -1;
1251 if ((AddedAtomList != NULL) && (AddedAtomList[i] != NULL)) // mark already present atoms (i.e. Root and maybe others) as visited
1252 BFS.ColorList[i] = lightgray;
1253 else
1254 BFS.ColorList[i] = white;
1255 }
[920c70]1256 //BFS.ShortestPathList[Root->nr] = 0; // done by Calloc
[9eefda]1257}
1258;
[ce7cc5]1259
1260void BreadthFirstSearchAdd_Free(struct BFSAccounting &BFS)
1261{
[920c70]1262 delete[](BFS.PredecessorList);
1263 delete[](BFS.ShortestPathList);
1264 delete[](BFS.ColorList);
[9eefda]1265 delete (BFS.BFSStack);
[ce7cc5]1266 BFS.AtomCount = 0;
[9eefda]1267}
1268;
[ce7cc5]1269
[e138de]1270void BreadthFirstSearchAdd_UnvisitedNode(molecule *Mol, struct BFSAccounting &BFS, atom *&Walker, atom *&OtherAtom, bond *&Binder, bond *&Bond, atom **&AddedAtomList, bond **&AddedBondList, bool IsAngstroem)
[ce7cc5]1271{
1272 if (Binder != Bond) // let other atom white if it's via Root bond. In case it's cyclic it has to be reached again (yet Root is from OtherAtom already black, thus no problem)
1273 BFS.ColorList[OtherAtom->nr] = lightgray;
[9eefda]1274 BFS.PredecessorList[OtherAtom->nr] = Walker; // Walker is the predecessor
1275 BFS.ShortestPathList[OtherAtom->nr] = BFS.ShortestPathList[Walker->nr] + 1;
[68f03d]1276 DoLog(2) && (Log() << Verbose(2) << "Coloring OtherAtom " << OtherAtom->getName() << " " << ((BFS.ColorList[OtherAtom->nr] == white) ? "white" : "lightgray") << ", its predecessor is " << Walker->getName() << " and its Shortest Path is " << BFS.ShortestPathList[OtherAtom->nr] << " egde(s) long." << endl);
[9eefda]1277 if ((((BFS.ShortestPathList[OtherAtom->nr] < BFS.BondOrder) && (Binder != Bond)))) { // Check for maximum distance
[a67d19]1278 DoLog(3) && (Log() << Verbose(3));
[ce7cc5]1279 if (AddedAtomList[OtherAtom->nr] == NULL) { // add if it's not been so far
1280 AddedAtomList[OtherAtom->nr] = Mol->AddCopyAtom(OtherAtom);
[68f03d]1281 DoLog(0) && (Log() << Verbose(0) << "Added OtherAtom " << OtherAtom->getName());
[ce7cc5]1282 AddedBondList[Binder->nr] = Mol->CopyBond(AddedAtomList[Walker->nr], AddedAtomList[OtherAtom->nr], Binder);
[a67d19]1283 DoLog(0) && (Log() << Verbose(0) << " and bond " << *(AddedBondList[Binder->nr]) << ", ");
[9eefda]1284 } else { // this code should actually never come into play (all white atoms are not yet present in BondMolecule, that's why they are white in the first place)
[68f03d]1285 DoLog(0) && (Log() << Verbose(0) << "Not adding OtherAtom " << OtherAtom->getName());
[ce7cc5]1286 if (AddedBondList[Binder->nr] == NULL) {
1287 AddedBondList[Binder->nr] = Mol->CopyBond(AddedAtomList[Walker->nr], AddedAtomList[OtherAtom->nr], Binder);
[a67d19]1288 DoLog(0) && (Log() << Verbose(0) << ", added Bond " << *(AddedBondList[Binder->nr]));
[ce7cc5]1289 } else
[a67d19]1290 DoLog(0) && (Log() << Verbose(0) << ", not added Bond ");
[ce7cc5]1291 }
[a67d19]1292 DoLog(0) && (Log() << Verbose(0) << ", putting OtherAtom into queue." << endl);
[9eefda]1293 BFS.BFSStack->Push(OtherAtom);
[ce7cc5]1294 } else { // out of bond order, then replace
1295 if ((AddedAtomList[OtherAtom->nr] == NULL) && (Binder->Cyclic))
1296 BFS.ColorList[OtherAtom->nr] = white; // unmark if it has not been queued/added, to make it available via its other bonds (cyclic)
1297 if (Binder == Bond)
[a67d19]1298 DoLog(3) && (Log() << Verbose(3) << "Not Queueing, is the Root bond");
[ce7cc5]1299 else if (BFS.ShortestPathList[OtherAtom->nr] >= BFS.BondOrder)
[a67d19]1300 DoLog(3) && (Log() << Verbose(3) << "Not Queueing, is out of Bond Count of " << BFS.BondOrder);
[ce7cc5]1301 if (!Binder->Cyclic)
[a67d19]1302 DoLog(0) && (Log() << Verbose(0) << ", is not part of a cyclic bond, saturating bond with Hydrogen." << endl);
[ce7cc5]1303 if (AddedBondList[Binder->nr] == NULL) {
1304 if ((AddedAtomList[OtherAtom->nr] != NULL)) { // .. whether we add or saturate
1305 AddedBondList[Binder->nr] = Mol->CopyBond(AddedAtomList[Walker->nr], AddedAtomList[OtherAtom->nr], Binder);
1306 } else {
[9eefda]1307#ifdef ADDHYDROGEN
[e138de]1308 if (!Mol->AddHydrogenReplacementAtom(Binder, AddedAtomList[Walker->nr], Walker, OtherAtom, IsAngstroem))
[9eefda]1309 exit(1);
1310#endif
[ce7cc5]1311 }
1312 }
1313 }
[9eefda]1314}
1315;
[ce7cc5]1316
[e138de]1317void BreadthFirstSearchAdd_VisitedNode(molecule *Mol, struct BFSAccounting &BFS, atom *&Walker, atom *&OtherAtom, bond *&Binder, bond *&Bond, atom **&AddedAtomList, bond **&AddedBondList, bool IsAngstroem)
[ce7cc5]1318{
[a67d19]1319 DoLog(3) && (Log() << Verbose(3) << "Not Adding, has already been visited." << endl);
[ce7cc5]1320 // This has to be a cyclic bond, check whether it's present ...
1321 if (AddedBondList[Binder->nr] == NULL) {
[9eefda]1322 if ((Binder != Bond) && (Binder->Cyclic) && (((BFS.ShortestPathList[Walker->nr] + 1) < BFS.BondOrder))) {
[ce7cc5]1323 AddedBondList[Binder->nr] = Mol->CopyBond(AddedAtomList[Walker->nr], AddedAtomList[OtherAtom->nr], Binder);
1324 } else { // if it's root bond it has to broken (otherwise we would not create the fragments)
[9eefda]1325#ifdef ADDHYDROGEN
[e138de]1326 if(!Mol->AddHydrogenReplacementAtom(Binder, AddedAtomList[Walker->nr], Walker, OtherAtom, IsAngstroem))
[9eefda]1327 exit(1);
1328#endif
[ce7cc5]1329 }
1330 }
[9eefda]1331}
1332;
[cee0b57]1333
1334/** Adds atoms up to \a BondCount distance from \a *Root and notes them down in \a **AddedAtomList.
1335 * Gray vertices are always enqueued in an StackClass<atom *> FIFO queue, the rest is usual BFS with adding vertices found was
1336 * white and putting into queue.
1337 * \param *out output stream for debugging
1338 * \param *Mol Molecule class to add atoms to
1339 * \param **AddedAtomList list with added atom pointers, index is atom father's number
1340 * \param **AddedBondList list with added bond pointers, index is bond father's number
1341 * \param *Root root vertex for BFS
1342 * \param *Bond bond not to look beyond
1343 * \param BondOrder maximum distance for vertices to add
1344 * \param IsAngstroem lengths are in angstroem or bohrradii
1345 */
[e138de]1346void molecule::BreadthFirstSearchAdd(molecule *Mol, atom **&AddedAtomList, bond **&AddedBondList, atom *Root, bond *Bond, int BondOrder, bool IsAngstroem)
[cee0b57]1347{
[ce7cc5]1348 struct BFSAccounting BFS;
[cee0b57]1349 atom *Walker = NULL, *OtherAtom = NULL;
[ce7cc5]1350 bond *Binder = NULL;
[cee0b57]1351
1352 // add Root if not done yet
[9eefda]1353 if (AddedAtomList[Root->nr] == NULL) // add Root if not yet present
[cee0b57]1354 AddedAtomList[Root->nr] = Mol->AddCopyAtom(Root);
1355
[ea7176]1356 BreadthFirstSearchAdd_Init(BFS, Root, BondOrder, getAtomCount(), AddedAtomList);
[cee0b57]1357
1358 // and go on ... Queue always contains all lightgray vertices
[9eefda]1359 while (!BFS.BFSStack->IsEmpty()) {
[cee0b57]1360 // we have to pop the oldest atom from stack. This keeps the atoms on the stack always of the same ShortestPath distance.
1361 // e.g. if current atom is 2, push to end of stack are of length 3, but first all of length 2 would be popped. They again
1362 // append length of 3 (their neighbours). Thus on stack we have always atoms of a certain length n at bottom of stack and
1363 // followed by n+1 till top of stack.
[9eefda]1364 Walker = BFS.BFSStack->PopFirst(); // pop oldest added
[68f03d]1365 DoLog(1) && (Log() << Verbose(1) << "Current Walker is: " << Walker->getName() << ", and has " << Walker->ListOfBonds.size() << " bonds." << endl);
[266237]1366 for (BondList::const_iterator Runner = Walker->ListOfBonds.begin(); Runner != Walker->ListOfBonds.end(); (++Runner)) {
1367 if ((*Runner) != NULL) { // don't look at bond equal NULL
[ce7cc5]1368 Binder = (*Runner);
[266237]1369 OtherAtom = (*Runner)->GetOtherAtom(Walker);
[68f03d]1370 DoLog(2) && (Log() << Verbose(2) << "Current OtherAtom is: " << OtherAtom->getName() << " for bond " << *(*Runner) << "." << endl);
[ce7cc5]1371 if (BFS.ColorList[OtherAtom->nr] == white) {
[e138de]1372 BreadthFirstSearchAdd_UnvisitedNode(Mol, BFS, Walker, OtherAtom, Binder, Bond, AddedAtomList, AddedBondList, IsAngstroem);
[cee0b57]1373 } else {
[e138de]1374 BreadthFirstSearchAdd_VisitedNode(Mol, BFS, Walker, OtherAtom, Binder, Bond, AddedAtomList, AddedBondList, IsAngstroem);
[cee0b57]1375 }
1376 }
1377 }
[ce7cc5]1378 BFS.ColorList[Walker->nr] = black;
[68f03d]1379 DoLog(1) && (Log() << Verbose(1) << "Coloring Walker " << Walker->getName() << " black." << endl);
[cee0b57]1380 }
[ce7cc5]1381 BreadthFirstSearchAdd_Free(BFS);
[9eefda]1382}
1383;
[cee0b57]1384
[266237]1385/** Adds a bond as a copy to a given one
1386 * \param *left leftatom of new bond
1387 * \param *right rightatom of new bond
1388 * \param *CopyBond rest of fields in bond are copied from this
1389 * \return pointer to new bond
1390 */
1391bond * molecule::CopyBond(atom *left, atom *right, bond *CopyBond)
1392{
1393 bond *Binder = AddBond(left, right, CopyBond->BondDegree);
1394 Binder->Cyclic = CopyBond->Cyclic;
1395 Binder->Type = CopyBond->Type;
1396 return Binder;
[9eefda]1397}
1398;
[266237]1399
[e138de]1400void BuildInducedSubgraph_Init(atom **&ParentList, int AtomCount)
[cee0b57]1401{
1402 // reset parent list
[920c70]1403 ParentList = new atom*[AtomCount];
1404 for (int i=0;i<AtomCount;i++)
1405 ParentList[i] = NULL;
[a67d19]1406 DoLog(3) && (Log() << Verbose(3) << "Resetting ParentList." << endl);
[9eefda]1407}
1408;
[cee0b57]1409
[e138de]1410void BuildInducedSubgraph_FillParentList(const molecule *mol, const molecule *Father, atom **&ParentList)
[43587e]1411{
[cee0b57]1412 // fill parent list with sons
[a67d19]1413 DoLog(3) && (Log() << Verbose(3) << "Filling Parent List." << endl);
[9879f6]1414 for (molecule::const_iterator iter = mol->begin(); iter != mol->end(); ++iter) {
1415 ParentList[(*iter)->father->nr] = (*iter);
[cee0b57]1416 // Outputting List for debugging
[a7b761b]1417 DoLog(4) && (Log() << Verbose(4) << "Son[" << (*iter)->father->nr << "] of " << (*iter)->father << " is " << ParentList[(*iter)->father->nr] << "." << endl);
[cee0b57]1418 }
[a7b761b]1419};
[43587e]1420
[e138de]1421void BuildInducedSubgraph_Finalize(atom **&ParentList)
[43587e]1422{
[920c70]1423 delete[](ParentList);
[9eefda]1424}
1425;
[43587e]1426
[e138de]1427bool BuildInducedSubgraph_CreateBondsFromParent(molecule *mol, const molecule *Father, atom **&ParentList)
[43587e]1428{
1429 bool status = true;
1430 atom *OtherAtom = NULL;
[cee0b57]1431 // check each entry of parent list and if ok (one-to-and-onto matching) create bonds
[a67d19]1432 DoLog(3) && (Log() << Verbose(3) << "Creating bonds." << endl);
[9879f6]1433 for (molecule::const_iterator iter = Father->begin(); iter != Father->end(); ++iter) {
1434 if (ParentList[(*iter)->nr] != NULL) {
1435 if (ParentList[(*iter)->nr]->father != (*iter)) {
[cee0b57]1436 status = false;
1437 } else {
[9879f6]1438 for (BondList::const_iterator Runner = (*iter)->ListOfBonds.begin(); Runner != (*iter)->ListOfBonds.end(); (++Runner)) {
1439 OtherAtom = (*Runner)->GetOtherAtom((*iter));
[cee0b57]1440 if (ParentList[OtherAtom->nr] != NULL) { // if otheratom is also a father of an atom on this molecule, create the bond
[a7b761b]1441 DoLog(4) && (Log() << Verbose(4) << "Endpoints of Bond " << (*Runner) << " are both present: " << ParentList[(*iter)->nr]->getName() << " and " << ParentList[OtherAtom->nr]->getName() << "." << endl);
[9879f6]1442 mol->AddBond(ParentList[(*iter)->nr], ParentList[OtherAtom->nr], (*Runner)->BondDegree);
[cee0b57]1443 }
1444 }
1445 }
1446 }
1447 }
[43587e]1448 return status;
[9eefda]1449}
1450;
[cee0b57]1451
[43587e]1452/** Adds bond structure to this molecule from \a Father molecule.
1453 * This basically causes this molecule to become an induced subgraph of the \a Father, i.e. for every bond in Father
1454 * with end points present in this molecule, bond is created in this molecule.
1455 * Special care was taken to ensure that this is of complexity O(N), where N is the \a Father's molecule::AtomCount.
1456 * \param *out output stream for debugging
1457 * \param *Father father molecule
1458 * \return true - is induced subgraph, false - there are atoms with fathers not in \a Father
1459 * \todo not checked, not fully working probably
1460 */
[e138de]1461bool molecule::BuildInducedSubgraph(const molecule *Father)
[43587e]1462{
1463 bool status = true;
1464 atom **ParentList = NULL;
[a67d19]1465 DoLog(2) && (Log() << Verbose(2) << "Begin of BuildInducedSubgraph." << endl);
[ea7176]1466 BuildInducedSubgraph_Init(ParentList, Father->getAtomCount());
[e138de]1467 BuildInducedSubgraph_FillParentList(this, Father, ParentList);
1468 status = BuildInducedSubgraph_CreateBondsFromParent(this, Father, ParentList);
1469 BuildInducedSubgraph_Finalize(ParentList);
[a67d19]1470 DoLog(2) && (Log() << Verbose(2) << "End of BuildInducedSubgraph." << endl);
[cee0b57]1471 return status;
[9eefda]1472}
1473;
[cee0b57]1474
1475/** For a given keyset \a *Fragment, checks whether it is connected in the current molecule.
1476 * \param *out output stream for debugging
1477 * \param *Fragment Keyset of fragment's vertices
1478 * \return true - connected, false - disconnected
1479 * \note this is O(n^2) for it's just a bug checker not meant for permanent use!
1480 */
[e138de]1481bool molecule::CheckForConnectedSubgraph(KeySet *Fragment)
[cee0b57]1482{
1483 atom *Walker = NULL, *Walker2 = NULL;
1484 bool BondStatus = false;
1485 int size;
1486
[a67d19]1487 DoLog(1) && (Log() << Verbose(1) << "Begin of CheckForConnectedSubgraph" << endl);
1488 DoLog(2) && (Log() << Verbose(2) << "Disconnected atom: ");
[cee0b57]1489
1490 // count number of atoms in graph
1491 size = 0;
[9eefda]1492 for (KeySet::iterator runner = Fragment->begin(); runner != Fragment->end(); runner++)
[cee0b57]1493 size++;
1494 if (size > 1)
[9eefda]1495 for (KeySet::iterator runner = Fragment->begin(); runner != Fragment->end(); runner++) {
[cee0b57]1496 Walker = FindAtom(*runner);
1497 BondStatus = false;
[9eefda]1498 for (KeySet::iterator runners = Fragment->begin(); runners != Fragment->end(); runners++) {
[cee0b57]1499 Walker2 = FindAtom(*runners);
[266237]1500 for (BondList::const_iterator Runner = Walker->ListOfBonds.begin(); Runner != Walker->ListOfBonds.end(); (++Runner)) {
1501 if ((*Runner)->GetOtherAtom(Walker) == Walker2) {
[cee0b57]1502 BondStatus = true;
1503 break;
1504 }
1505 if (BondStatus)
1506 break;
1507 }
1508 }
1509 if (!BondStatus) {
[a67d19]1510 DoLog(0) && (Log() << Verbose(0) << (*Walker) << endl);
[cee0b57]1511 return false;
1512 }
1513 }
1514 else {
[a67d19]1515 DoLog(0) && (Log() << Verbose(0) << "none." << endl);
[cee0b57]1516 return true;
1517 }
[a67d19]1518 DoLog(0) && (Log() << Verbose(0) << "none." << endl);
[cee0b57]1519
[a67d19]1520 DoLog(1) && (Log() << Verbose(1) << "End of CheckForConnectedSubgraph" << endl);
[cee0b57]1521
1522 return true;
1523}
Note: See TracBrowser for help on using the repository browser.