[bcf653] | 1 | /*
|
---|
| 2 | * Project: MoleCuilder
|
---|
| 3 | * Description: creates and alters molecular systems
|
---|
| 4 | * Copyright (C) 2010 University of Bonn. All rights reserved.
|
---|
| 5 | * Please see the LICENSE file or "Copyright notice" in builder.cpp for details.
|
---|
| 6 | */
|
---|
| 7 |
|
---|
[cee0b57] | 8 | /*
|
---|
| 9 | * molecule_graph.cpp
|
---|
| 10 | *
|
---|
| 11 | * Created on: Oct 5, 2009
|
---|
| 12 | * Author: heber
|
---|
| 13 | */
|
---|
| 14 |
|
---|
[bf3817] | 15 | // include config.h
|
---|
[aafd77] | 16 | #ifdef HAVE_CONFIG_H
|
---|
| 17 | #include <config.h>
|
---|
| 18 | #endif
|
---|
| 19 |
|
---|
[112b09] | 20 | #include "Helpers/MemDebug.hpp"
|
---|
| 21 |
|
---|
[f66195] | 22 | #include "atom.hpp"
|
---|
| 23 | #include "bond.hpp"
|
---|
[b70721] | 24 | #include "bondgraph.hpp"
|
---|
[cee0b57] | 25 | #include "config.hpp"
|
---|
[35b698] | 26 | #include "defs.hpp"
|
---|
[f66195] | 27 | #include "element.hpp"
|
---|
[952f38] | 28 | #include "Helpers/helpers.hpp"
|
---|
| 29 | #include "Helpers/Info.hpp"
|
---|
[b8b75d] | 30 | #include "linkedcell.hpp"
|
---|
[f66195] | 31 | #include "lists.hpp"
|
---|
[952f38] | 32 | #include "Helpers/Verbose.hpp"
|
---|
| 33 | #include "Helpers/Log.hpp"
|
---|
[cee0b57] | 34 | #include "molecule.hpp"
|
---|
[b34306] | 35 | #include "World.hpp"
|
---|
[0a4f7f] | 36 | #include "Helpers/fast_functions.hpp"
|
---|
[f2bb0f] | 37 | #include "Helpers/Assert.hpp"
|
---|
[57f243] | 38 | #include "LinearAlgebra/Matrix.hpp"
|
---|
[84c494] | 39 | #include "Box.hpp"
|
---|
[36166d] | 40 | #include "stackclass.hpp"
|
---|
[cee0b57] | 41 |
|
---|
[9eefda] | 42 | struct BFSAccounting
|
---|
| 43 | {
|
---|
| 44 | atom **PredecessorList;
|
---|
| 45 | int *ShortestPathList;
|
---|
| 46 | enum Shading *ColorList;
|
---|
| 47 | class StackClass<atom *> *BFSStack;
|
---|
| 48 | class StackClass<atom *> *TouchedStack;
|
---|
| 49 | int AtomCount;
|
---|
| 50 | int BondOrder;
|
---|
| 51 | atom *Root;
|
---|
| 52 | bool BackStepping;
|
---|
| 53 | int CurrentGraphNr;
|
---|
| 54 | int ComponentNr;
|
---|
| 55 | };
|
---|
[cee0b57] | 56 |
|
---|
[9eefda] | 57 | /** Accounting data for Depth First Search.
|
---|
| 58 | */
|
---|
| 59 | struct DFSAccounting
|
---|
| 60 | {
|
---|
| 61 | class StackClass<atom *> *AtomStack;
|
---|
| 62 | class StackClass<bond *> *BackEdgeStack;
|
---|
| 63 | int CurrentGraphNr;
|
---|
| 64 | int ComponentNumber;
|
---|
| 65 | atom *Root;
|
---|
| 66 | bool BackStepping;
|
---|
| 67 | };
|
---|
| 68 |
|
---|
| 69 | /************************************* Functions for class molecule *********************************/
|
---|
[cee0b57] | 70 |
|
---|
| 71 | /** Creates an adjacency list of the molecule.
|
---|
| 72 | * We obtain an outside file with the indices of atoms which are bondmembers.
|
---|
| 73 | */
|
---|
[e138de] | 74 | void molecule::CreateAdjacencyListFromDbondFile(ifstream *input)
|
---|
[cee0b57] | 75 | {
|
---|
[c68c90] | 76 | Info FunctionInfo(__func__);
|
---|
[cee0b57] | 77 | // 1 We will parse bonds out of the dbond file created by tremolo.
|
---|
[44a59b] | 78 | int atom1, atom2;
|
---|
| 79 | atom *Walker, *OtherWalker;
|
---|
[c68c90] | 80 | char line[MAXSTRINGSIZE];
|
---|
[44a59b] | 81 |
|
---|
[c68c90] | 82 | if (input->fail()) {
|
---|
| 83 | DoeLog(0) && (eLog() << Verbose(0) << "Opening of bond file failed \n");
|
---|
| 84 | performCriticalExit();
|
---|
[44a59b] | 85 | };
|
---|
[bd6bfa] | 86 | doCountAtoms();
|
---|
[44a59b] | 87 |
|
---|
[c68c90] | 88 | // skip header
|
---|
| 89 | input->getline(line,MAXSTRINGSIZE);
|
---|
| 90 | DoLog(1) && (Log() << Verbose(1) << "Scanning file ... \n");
|
---|
[44a59b] | 91 | while (!input->eof()) // Check whether we read everything already
|
---|
| 92 | {
|
---|
[c68c90] | 93 | input->getline(line,MAXSTRINGSIZE);
|
---|
| 94 | stringstream zeile(line);
|
---|
| 95 | zeile >> atom1;
|
---|
| 96 | zeile >> atom2;
|
---|
[44a59b] | 97 |
|
---|
[c68c90] | 98 | DoLog(2) && (Log() << Verbose(2) << "Looking for atoms " << atom1 << " and " << atom2 << "." << endl);
|
---|
[9eefda] | 99 | if (atom2 < atom1) //Sort indices of atoms in order
|
---|
[44a59b] | 100 | flip(atom1, atom2);
|
---|
[9eefda] | 101 | Walker = FindAtom(atom1);
|
---|
[05a97c] | 102 | ASSERT(Walker,"Could not find an atom with the ID given in dbond file");
|
---|
[9eefda] | 103 | OtherWalker = FindAtom(atom2);
|
---|
[05a97c] | 104 | ASSERT(OtherWalker,"Could not find an atom with the ID given in dbond file");
|
---|
[44a59b] | 105 | AddBond(Walker, OtherWalker); //Add the bond between the two atoms with respective indices.
|
---|
| 106 | }
|
---|
[9eefda] | 107 | }
|
---|
| 108 | ;
|
---|
[cee0b57] | 109 |
|
---|
| 110 | /** Creates an adjacency list of the molecule.
|
---|
| 111 | * Generally, we use the CSD approach to bond recognition, that is the the distance
|
---|
| 112 | * between two atoms A and B must be within [Rcov(A)+Rcov(B)-t,Rcov(A)+Rcov(B)+t] with
|
---|
| 113 | * a threshold t = 0.4 Angstroem.
|
---|
| 114 | * To make it O(N log N) the function uses the linked-cell technique as follows:
|
---|
| 115 | * The procedure is step-wise:
|
---|
| 116 | * -# Remove every bond in list
|
---|
| 117 | * -# Count the atoms in the molecule with CountAtoms()
|
---|
| 118 | * -# partition cell into smaller linked cells of size \a bonddistance
|
---|
| 119 | * -# put each atom into its corresponding cell
|
---|
| 120 | * -# go through every cell, check the atoms therein against all possible bond partners in the 27 adjacent cells, add bond if true
|
---|
| 121 | * -# correct the bond degree iteratively (single->double->triple bond)
|
---|
| 122 | * -# finally print the bond list to \a *out if desired
|
---|
| 123 | * \param *out out stream for printing the matrix, NULL if no output
|
---|
| 124 | * \param bonddistance length of linked cells (i.e. maximum minimal length checked)
|
---|
| 125 | * \param IsAngstroem whether coordinate system is gauged to Angstroem or Bohr radii
|
---|
[b70721] | 126 | * \param *minmaxdistance function to give upper and lower bound on whether particle is bonded to some other
|
---|
| 127 | * \param *BG BondGraph with the member function above or NULL, if just standard covalent should be used.
|
---|
[cee0b57] | 128 | */
|
---|
[e138de] | 129 | void molecule::CreateAdjacencyList(double bonddistance, bool IsAngstroem, void (BondGraph::*minmaxdistance)(BondedParticle * const , BondedParticle * const , double &, double &, bool), BondGraph *BG)
|
---|
[cee0b57] | 130 | {
|
---|
[b8b75d] | 131 | atom *Walker = NULL;
|
---|
| 132 | atom *OtherWalker = NULL;
|
---|
| 133 | int n[NDIM];
|
---|
[b70721] | 134 | double MinDistance, MaxDistance;
|
---|
[b8b75d] | 135 | LinkedCell *LC = NULL;
|
---|
[b70721] | 136 | bool free_BG = false;
|
---|
[014475] | 137 | Box &domain = World::getInstance().getDomain();
|
---|
[b70721] | 138 |
|
---|
| 139 | if (BG == NULL) {
|
---|
| 140 | BG = new BondGraph(IsAngstroem);
|
---|
| 141 | free_BG = true;
|
---|
| 142 | }
|
---|
[cee0b57] | 143 |
|
---|
| 144 | BondDistance = bonddistance; // * ((IsAngstroem) ? 1. : 1./AtomicLengthToAngstroem);
|
---|
[a67d19] | 145 | DoLog(0) && (Log() << Verbose(0) << "Begin of CreateAdjacencyList." << endl);
|
---|
[cee0b57] | 146 | // remove every bond from the list
|
---|
[e08c46] | 147 | for(molecule::iterator AtomRunner = begin(); AtomRunner != end(); ++AtomRunner)
|
---|
| 148 | for(BondList::iterator BondRunner = (*AtomRunner)->ListOfBonds.begin(); !(*AtomRunner)->ListOfBonds.empty(); BondRunner = (*AtomRunner)->ListOfBonds.begin())
|
---|
| 149 | if ((*BondRunner)->leftatom == *AtomRunner)
|
---|
| 150 | delete((*BondRunner));
|
---|
[3c349b] | 151 | BondCount = 0;
|
---|
[cee0b57] | 152 |
|
---|
| 153 | // count atoms in molecule = dimension of matrix (also give each unique name and continuous numbering)
|
---|
[a7b761b] | 154 | DoLog(1) && (Log() << Verbose(1) << "AtomCount " << getAtomCount() << " and bonddistance is " << bonddistance << "." << endl);
|
---|
[cee0b57] | 155 |
|
---|
[c66537] | 156 | if ((getAtomCount() > 1) && (bonddistance > 0.1)) {
|
---|
[a67d19] | 157 | DoLog(2) && (Log() << Verbose(2) << "Creating Linked Cell structure ... " << endl);
|
---|
[af2c424] | 158 | LC = new LinkedCell(*this, bonddistance);
|
---|
[cee0b57] | 159 |
|
---|
[b8b75d] | 160 | // create a list to map Tesselpoint::nr to atom *
|
---|
[a67d19] | 161 | DoLog(2) && (Log() << Verbose(2) << "Creating TesselPoint to atom map ... " << endl);
|
---|
[f2bb0f] | 162 |
|
---|
[53731f] | 163 | // set numbers for atoms that can later be used
|
---|
| 164 | int i=0;
|
---|
| 165 | for(internal_iterator iter = atoms.begin();iter!= atoms.end(); ++iter){
|
---|
| 166 | (*iter)->nr = i++;
|
---|
[cee0b57] | 167 | }
|
---|
| 168 |
|
---|
| 169 | // 3a. go through every cell
|
---|
[a67d19] | 170 | DoLog(2) && (Log() << Verbose(2) << "Celling ... " << endl);
|
---|
[b8b75d] | 171 | for (LC->n[0] = 0; LC->n[0] < LC->N[0]; LC->n[0]++)
|
---|
| 172 | for (LC->n[1] = 0; LC->n[1] < LC->N[1]; LC->n[1]++)
|
---|
| 173 | for (LC->n[2] = 0; LC->n[2] < LC->N[2]; LC->n[2]++) {
|
---|
[734816] | 174 | const LinkedCell::LinkedNodes *List = LC->GetCurrentCell();
|
---|
[e5ad5c] | 175 | // Log() << Verbose(2) << "Current cell is " << LC->n[0] << ", " << LC->n[1] << ", " << LC->n[2] << " with No. " << LC->index << " containing " << List->size() << " points." << endl;
|
---|
[b8b75d] | 176 | if (List != NULL) {
|
---|
[734816] | 177 | for (LinkedCell::LinkedNodes::const_iterator Runner = List->begin(); Runner != List->end(); Runner++) {
|
---|
[f2bb0f] | 178 | Walker = dynamic_cast<atom*>(*Runner);
|
---|
| 179 | ASSERT(Walker,"Tesselpoint that was not an atom retrieved from LinkedNode");
|
---|
[e138de] | 180 | //Log() << Verbose(0) << "Current Atom is " << *Walker << "." << endl;
|
---|
[cee0b57] | 181 | // 3c. check for possible bond between each atom in this and every one in the 27 cells
|
---|
[9eefda] | 182 | for (n[0] = -1; n[0] <= 1; n[0]++)
|
---|
| 183 | for (n[1] = -1; n[1] <= 1; n[1]++)
|
---|
| 184 | for (n[2] = -1; n[2] <= 1; n[2]++) {
|
---|
[734816] | 185 | const LinkedCell::LinkedNodes *OtherList = LC->GetRelativeToCurrentCell(n);
|
---|
[e5ad5c] | 186 | // Log() << Verbose(2) << "Current relative cell is " << LC->n[0] << ", " << LC->n[1] << ", " << LC->n[2] << " with No. " << LC->index << " containing " << List->size() << " points." << endl;
|
---|
[b8b75d] | 187 | if (OtherList != NULL) {
|
---|
[734816] | 188 | for (LinkedCell::LinkedNodes::const_iterator OtherRunner = OtherList->begin(); OtherRunner != OtherList->end(); OtherRunner++) {
|
---|
[b8b75d] | 189 | if ((*OtherRunner)->nr > Walker->nr) {
|
---|
[f2bb0f] | 190 | OtherWalker = dynamic_cast<atom*>(*OtherRunner);
|
---|
| 191 | ASSERT(OtherWalker,"TesselPoint that was not an atom retrieved from LinkedNode");
|
---|
[e138de] | 192 | //Log() << Verbose(1) << "Checking distance " << OtherWalker->x.PeriodicDistanceSquared(&(Walker->x), cell_size) << " against typical bond length of " << bonddistance*bonddistance << "." << endl;
|
---|
[e5ad5c] | 193 | (BG->*minmaxdistance)(Walker, OtherWalker, MinDistance, MaxDistance, IsAngstroem);
|
---|
[d74077] | 194 | const double distance = domain.periodicDistanceSquared(OtherWalker->getPosition(),Walker->getPosition());
|
---|
[b70721] | 195 | const bool status = (distance <= MaxDistance * MaxDistance) && (distance >= MinDistance * MinDistance);
|
---|
[e5ad5c] | 196 | // Log() << Verbose(1) << "MinDistance is " << MinDistance << " and MaxDistance is " << MaxDistance << "." << endl;
|
---|
| 197 | if (OtherWalker->father->nr > Walker->father->nr) {
|
---|
| 198 | if (status) { // create bond if distance is smaller
|
---|
| 199 | // Log() << Verbose(1) << "Adding Bond between " << *Walker << " and " << *OtherWalker << " in distance " << sqrt(distance) << "." << endl;
|
---|
| 200 | AddBond(Walker->father, OtherWalker->father, 1); // also increases molecule::BondCount
|
---|
| 201 | } else {
|
---|
| 202 | // Log() << Verbose(1) << "Not Adding: distance too great." << endl;
|
---|
| 203 | }
|
---|
[b8b75d] | 204 | } else {
|
---|
[e5ad5c] | 205 | // Log() << Verbose(1) << "Not Adding: Wrong order of labels." << endl;
|
---|
[b8b75d] | 206 | }
|
---|
[cee0b57] | 207 | }
|
---|
| 208 | }
|
---|
| 209 | }
|
---|
| 210 | }
|
---|
| 211 | }
|
---|
| 212 | }
|
---|
| 213 | }
|
---|
[9eefda] | 214 | delete (LC);
|
---|
[a67d19] | 215 | DoLog(1) && (Log() << Verbose(1) << "I detected " << BondCount << " bonds in the molecule with distance " << BondDistance << "." << endl);
|
---|
[cee0b57] | 216 |
|
---|
[b8b75d] | 217 | // correct bond degree by comparing valence and bond degree
|
---|
[a67d19] | 218 | DoLog(2) && (Log() << Verbose(2) << "Correcting bond degree ... " << endl);
|
---|
[e138de] | 219 | CorrectBondDegree();
|
---|
[cee0b57] | 220 |
|
---|
[b8b75d] | 221 | // output bonds for debugging (if bond chain list was correctly installed)
|
---|
[e138de] | 222 | ActOnAllAtoms( &atom::OutputBondOfAtom );
|
---|
[b8b75d] | 223 | } else
|
---|
[a7b761b] | 224 | DoLog(1) && (Log() << Verbose(1) << "AtomCount is " << getAtomCount() << ", thus no bonds, no connections!." << endl);
|
---|
[a67d19] | 225 | DoLog(0) && (Log() << Verbose(0) << "End of CreateAdjacencyList." << endl);
|
---|
[b70721] | 226 | if (free_BG)
|
---|
| 227 | delete(BG);
|
---|
[9eefda] | 228 | }
|
---|
| 229 | ;
|
---|
[cee0b57] | 230 |
|
---|
[e08c46] | 231 | /** Checks for presence of bonds within atom list.
|
---|
| 232 | * TODO: more sophisticated check for bond structure (e.g. connected subgraph, ...)
|
---|
| 233 | * \return true - bonds present, false - no bonds
|
---|
| 234 | */
|
---|
| 235 | bool molecule::hasBondStructure()
|
---|
| 236 | {
|
---|
| 237 | for(molecule::iterator AtomRunner = begin(); AtomRunner != end(); ++AtomRunner)
|
---|
| 238 | if (!(*AtomRunner)->ListOfBonds.empty())
|
---|
| 239 | return true;
|
---|
| 240 | return false;
|
---|
| 241 | }
|
---|
| 242 |
|
---|
| 243 | /** Counts the number of present bonds.
|
---|
| 244 | * \return number of bonds
|
---|
| 245 | */
|
---|
| 246 | unsigned int molecule::CountBonds() const
|
---|
| 247 | {
|
---|
| 248 | unsigned int counter = 0;
|
---|
| 249 | for(molecule::const_iterator AtomRunner = begin(); AtomRunner != end(); ++AtomRunner)
|
---|
| 250 | for(BondList::const_iterator BondRunner = (*AtomRunner)->ListOfBonds.begin(); BondRunner != (*AtomRunner)->ListOfBonds.end(); ++BondRunner)
|
---|
| 251 | if ((*BondRunner)->leftatom == *AtomRunner)
|
---|
| 252 | counter++;
|
---|
| 253 | return counter;
|
---|
| 254 | }
|
---|
| 255 |
|
---|
[b8b75d] | 256 | /** Prints a list of all bonds to \a *out.
|
---|
| 257 | * \param output stream
|
---|
| 258 | */
|
---|
[e138de] | 259 | void molecule::OutputBondsList() const
|
---|
[b8b75d] | 260 | {
|
---|
[a67d19] | 261 | DoLog(1) && (Log() << Verbose(1) << endl << "From contents of bond chain list:");
|
---|
[e08c46] | 262 | for(molecule::const_iterator AtomRunner = molecule::begin(); AtomRunner != molecule::end(); ++AtomRunner)
|
---|
| 263 | for(BondList::const_iterator BondRunner = (*AtomRunner)->ListOfBonds.begin(); BondRunner != (*AtomRunner)->ListOfBonds.end(); ++BondRunner)
|
---|
| 264 | if ((*BondRunner)->leftatom == *AtomRunner) {
|
---|
| 265 | DoLog(0) && (Log() << Verbose(0) << *(*BondRunner) << "\t" << endl);
|
---|
| 266 | }
|
---|
[a67d19] | 267 | DoLog(0) && (Log() << Verbose(0) << endl);
|
---|
[9eefda] | 268 | }
|
---|
| 269 | ;
|
---|
[cee0b57] | 270 |
|
---|
[b8b75d] | 271 | /** correct bond degree by comparing valence and bond degree.
|
---|
| 272 | * correct Bond degree of each bond by checking both bond partners for a mismatch between valence and current sum of bond degrees,
|
---|
| 273 | * iteratively increase the one first where the other bond partner has the fewest number of bonds (i.e. in general bonds oxygene
|
---|
| 274 | * preferred over carbon bonds). Beforehand, we had picked the first mismatching partner, which lead to oxygenes with single instead of
|
---|
| 275 | * double bonds as was expected.
|
---|
| 276 | * \param *out output stream for debugging
|
---|
| 277 | * \return number of bonds that could not be corrected
|
---|
| 278 | */
|
---|
[e138de] | 279 | int molecule::CorrectBondDegree() const
|
---|
[b8b75d] | 280 | {
|
---|
[99593f] | 281 | int No = 0, OldNo = -1;
|
---|
[b8b75d] | 282 |
|
---|
| 283 | if (BondCount != 0) {
|
---|
[a67d19] | 284 | DoLog(1) && (Log() << Verbose(1) << "Correcting Bond degree of each bond ... " << endl);
|
---|
[b8b75d] | 285 | do {
|
---|
[99593f] | 286 | OldNo = No;
|
---|
[e138de] | 287 | No = SumPerAtom( &atom::CorrectBondDegree );
|
---|
[99593f] | 288 | } while (OldNo != No);
|
---|
[a67d19] | 289 | DoLog(0) && (Log() << Verbose(0) << " done." << endl);
|
---|
[b8b75d] | 290 | } else {
|
---|
[a7b761b] | 291 | DoLog(1) && (Log() << Verbose(1) << "BondCount is " << BondCount << ", no bonds between any of the " << getAtomCount() << " atoms." << endl);
|
---|
[b8b75d] | 292 | }
|
---|
[a67d19] | 293 | DoLog(0) && (Log() << Verbose(0) << No << " bonds could not be corrected." << endl);
|
---|
[cee0b57] | 294 |
|
---|
[266237] | 295 | return (No);
|
---|
[9eefda] | 296 | }
|
---|
| 297 | ;
|
---|
[cee0b57] | 298 |
|
---|
| 299 | /** Counts all cyclic bonds and returns their number.
|
---|
| 300 | * \note Hydrogen bonds can never by cyclic, thus no check for that
|
---|
| 301 | * \param *out output stream for debugging
|
---|
| 302 | * \return number opf cyclic bonds
|
---|
| 303 | */
|
---|
[e138de] | 304 | int molecule::CountCyclicBonds()
|
---|
[cee0b57] | 305 | {
|
---|
[266237] | 306 | NoCyclicBonds = 0;
|
---|
[cee0b57] | 307 | int *MinimumRingSize = NULL;
|
---|
| 308 | MoleculeLeafClass *Subgraphs = NULL;
|
---|
| 309 | class StackClass<bond *> *BackEdgeStack = NULL;
|
---|
[e08c46] | 310 | for(molecule::iterator AtomRunner = begin(); AtomRunner != end(); ++AtomRunner)
|
---|
| 311 | if ((!(*AtomRunner)->ListOfBonds.empty()) && ((*(*AtomRunner)->ListOfBonds.begin())->Type == Undetermined)) {
|
---|
| 312 | DoLog(0) && (Log() << Verbose(0) << "No Depth-First-Search analysis performed so far, calling ..." << endl);
|
---|
| 313 | Subgraphs = DepthFirstSearchAnalysis(BackEdgeStack);
|
---|
| 314 | while (Subgraphs->next != NULL) {
|
---|
| 315 | Subgraphs = Subgraphs->next;
|
---|
| 316 | delete (Subgraphs->previous);
|
---|
| 317 | }
|
---|
| 318 | delete (Subgraphs);
|
---|
| 319 | delete[] (MinimumRingSize);
|
---|
| 320 | break;
|
---|
[cee0b57] | 321 | }
|
---|
[e08c46] | 322 | for(molecule::iterator AtomRunner = begin(); AtomRunner != end(); ++AtomRunner)
|
---|
| 323 | for(BondList::iterator BondRunner = (*AtomRunner)->ListOfBonds.begin(); BondRunner != (*AtomRunner)->ListOfBonds.end(); ++BondRunner)
|
---|
| 324 | if ((*BondRunner)->leftatom == *AtomRunner)
|
---|
| 325 | if ((*BondRunner)->Cyclic)
|
---|
| 326 | NoCyclicBonds++;
|
---|
[9eefda] | 327 | delete (BackEdgeStack);
|
---|
[266237] | 328 | return NoCyclicBonds;
|
---|
[9eefda] | 329 | }
|
---|
| 330 | ;
|
---|
[b8b75d] | 331 |
|
---|
[cee0b57] | 332 | /** Returns Shading as a char string.
|
---|
| 333 | * \param color the Shading
|
---|
| 334 | * \return string of the flag
|
---|
| 335 | */
|
---|
[fa649a] | 336 | string molecule::GetColor(enum Shading color) const
|
---|
[cee0b57] | 337 | {
|
---|
[9eefda] | 338 | switch (color) {
|
---|
[cee0b57] | 339 | case white:
|
---|
| 340 | return "white";
|
---|
| 341 | break;
|
---|
| 342 | case lightgray:
|
---|
| 343 | return "lightgray";
|
---|
| 344 | break;
|
---|
| 345 | case darkgray:
|
---|
| 346 | return "darkgray";
|
---|
| 347 | break;
|
---|
| 348 | case black:
|
---|
| 349 | return "black";
|
---|
| 350 | break;
|
---|
| 351 | default:
|
---|
| 352 | return "uncolored";
|
---|
| 353 | break;
|
---|
| 354 | };
|
---|
[9eefda] | 355 | }
|
---|
| 356 | ;
|
---|
[cee0b57] | 357 |
|
---|
[9eefda] | 358 | /** Sets atom::GraphNr and atom::LowpointNr to BFSAccounting::CurrentGraphNr.
|
---|
| 359 | * \param *out output stream for debugging
|
---|
| 360 | * \param *Walker current node
|
---|
| 361 | * \param &BFS structure with accounting data for BFS
|
---|
| 362 | */
|
---|
[e138de] | 363 | void DepthFirstSearchAnalysis_SetWalkersGraphNr(atom *&Walker, struct DFSAccounting &DFS)
|
---|
[174e0e] | 364 | {
|
---|
[9eefda] | 365 | if (!DFS.BackStepping) { // if we don't just return from (8)
|
---|
| 366 | Walker->GraphNr = DFS.CurrentGraphNr;
|
---|
| 367 | Walker->LowpointNr = DFS.CurrentGraphNr;
|
---|
[68f03d] | 368 | DoLog(1) && (Log() << Verbose(1) << "Setting Walker[" << Walker->getName() << "]'s number to " << Walker->GraphNr << " with Lowpoint " << Walker->LowpointNr << "." << endl);
|
---|
[9eefda] | 369 | DFS.AtomStack->Push(Walker);
|
---|
| 370 | DFS.CurrentGraphNr++;
|
---|
[174e0e] | 371 | }
|
---|
[9eefda] | 372 | }
|
---|
| 373 | ;
|
---|
[174e0e] | 374 |
|
---|
[9eefda] | 375 | /** During DFS goes along unvisited bond and touches other atom.
|
---|
| 376 | * Sets bond::type, if
|
---|
| 377 | * -# BackEdge: set atom::LowpointNr and push on \a BackEdgeStack
|
---|
| 378 | * -# TreeEgde: set atom::Ancestor and continue with Walker along this edge
|
---|
| 379 | * Continue until molecule::FindNextUnused() finds no more unused bonds.
|
---|
| 380 | * \param *out output stream for debugging
|
---|
| 381 | * \param *mol molecule with atoms and finding unused bonds
|
---|
| 382 | * \param *&Binder current edge
|
---|
| 383 | * \param &DFS DFS accounting data
|
---|
| 384 | */
|
---|
[e138de] | 385 | void DepthFirstSearchAnalysis_ProbeAlongUnusedBond(const molecule * const mol, atom *&Walker, bond *&Binder, struct DFSAccounting &DFS)
|
---|
[174e0e] | 386 | {
|
---|
| 387 | atom *OtherAtom = NULL;
|
---|
| 388 |
|
---|
| 389 | do { // (3) if Walker has no unused egdes, go to (5)
|
---|
[9eefda] | 390 | DFS.BackStepping = false; // reset backstepping flag for (8)
|
---|
[174e0e] | 391 | if (Binder == NULL) // if we don't just return from (11), Binder is already set to next unused
|
---|
| 392 | Binder = mol->FindNextUnused(Walker);
|
---|
| 393 | if (Binder == NULL)
|
---|
| 394 | break;
|
---|
[a67d19] | 395 | DoLog(2) && (Log() << Verbose(2) << "Current Unused Bond is " << *Binder << "." << endl);
|
---|
[174e0e] | 396 | // (4) Mark Binder used, ...
|
---|
| 397 | Binder->MarkUsed(black);
|
---|
| 398 | OtherAtom = Binder->GetOtherAtom(Walker);
|
---|
[68f03d] | 399 | DoLog(2) && (Log() << Verbose(2) << "(4) OtherAtom is " << OtherAtom->getName() << "." << endl);
|
---|
[174e0e] | 400 | if (OtherAtom->GraphNr != -1) {
|
---|
| 401 | // (4a) ... if "other" atom has been visited (GraphNr != 0), set lowpoint to minimum of both, go to (3)
|
---|
| 402 | Binder->Type = BackEdge;
|
---|
[9eefda] | 403 | DFS.BackEdgeStack->Push(Binder);
|
---|
| 404 | Walker->LowpointNr = (Walker->LowpointNr < OtherAtom->GraphNr) ? Walker->LowpointNr : OtherAtom->GraphNr;
|
---|
[68f03d] | 405 | DoLog(3) && (Log() << Verbose(3) << "(4a) Visited: Setting Lowpoint of Walker[" << Walker->getName() << "] to " << Walker->LowpointNr << "." << endl);
|
---|
[174e0e] | 406 | } else {
|
---|
| 407 | // (4b) ... otherwise set OtherAtom as Ancestor of Walker and Walker as OtherAtom, go to (2)
|
---|
| 408 | Binder->Type = TreeEdge;
|
---|
| 409 | OtherAtom->Ancestor = Walker;
|
---|
| 410 | Walker = OtherAtom;
|
---|
[68f03d] | 411 | DoLog(3) && (Log() << Verbose(3) << "(4b) Not Visited: OtherAtom[" << OtherAtom->getName() << "]'s Ancestor is now " << OtherAtom->Ancestor->getName() << ", Walker is OtherAtom " << OtherAtom->getName() << "." << endl);
|
---|
[174e0e] | 412 | break;
|
---|
| 413 | }
|
---|
| 414 | Binder = NULL;
|
---|
[9eefda] | 415 | } while (1); // (3)
|
---|
| 416 | }
|
---|
| 417 | ;
|
---|
[174e0e] | 418 |
|
---|
[9eefda] | 419 | /** Checks whether we have a new component.
|
---|
| 420 | * if atom::LowpointNr of \a *&Walker is greater than atom::GraphNr of its atom::Ancestor, we have a new component.
|
---|
| 421 | * Meaning that if we touch upon a node who suddenly has a smaller atom::LowpointNr than its ancestor, then we
|
---|
| 422 | * have a found a new branch in the graph tree.
|
---|
| 423 | * \param *out output stream for debugging
|
---|
| 424 | * \param *mol molecule with atoms and finding unused bonds
|
---|
| 425 | * \param *&Walker current node
|
---|
| 426 | * \param &DFS DFS accounting data
|
---|
| 427 | */
|
---|
[e138de] | 428 | void DepthFirstSearchAnalysis_CheckForaNewComponent(const molecule * const mol, atom *&Walker, struct DFSAccounting &DFS, MoleculeLeafClass *&LeafWalker)
|
---|
[174e0e] | 429 | {
|
---|
| 430 | atom *OtherAtom = NULL;
|
---|
| 431 |
|
---|
| 432 | // (5) if Ancestor of Walker is ...
|
---|
[68f03d] | 433 | DoLog(1) && (Log() << Verbose(1) << "(5) Number of Walker[" << Walker->getName() << "]'s Ancestor[" << Walker->Ancestor->getName() << "] is " << Walker->Ancestor->GraphNr << "." << endl);
|
---|
[174e0e] | 434 |
|
---|
[9eefda] | 435 | if (Walker->Ancestor->GraphNr != DFS.Root->GraphNr) {
|
---|
[174e0e] | 436 | // (6) (Ancestor of Walker is not Root)
|
---|
| 437 | if (Walker->LowpointNr < Walker->Ancestor->GraphNr) {
|
---|
| 438 | // (6a) set Ancestor's Lowpoint number to minimum of of its Ancestor and itself, go to Step(8)
|
---|
| 439 | Walker->Ancestor->LowpointNr = (Walker->Ancestor->LowpointNr < Walker->LowpointNr) ? Walker->Ancestor->LowpointNr : Walker->LowpointNr;
|
---|
[68f03d] | 440 | DoLog(2) && (Log() << Verbose(2) << "(6) Setting Walker[" << Walker->getName() << "]'s Ancestor[" << Walker->Ancestor->getName() << "]'s Lowpoint to " << Walker->Ancestor->LowpointNr << "." << endl);
|
---|
[174e0e] | 441 | } else {
|
---|
| 442 | // (7) (Ancestor of Walker is a separating vertex, remove all from stack till Walker (including), these and Ancestor form a component
|
---|
| 443 | Walker->Ancestor->SeparationVertex = true;
|
---|
[68f03d] | 444 | DoLog(2) && (Log() << Verbose(2) << "(7) Walker[" << Walker->getName() << "]'s Ancestor[" << Walker->Ancestor->getName() << "]'s is a separating vertex, creating component." << endl);
|
---|
[9eefda] | 445 | mol->SetNextComponentNumber(Walker->Ancestor, DFS.ComponentNumber);
|
---|
[68f03d] | 446 | DoLog(3) && (Log() << Verbose(3) << "(7) Walker[" << Walker->getName() << "]'s Ancestor's Compont is " << DFS.ComponentNumber << "." << endl);
|
---|
[9eefda] | 447 | mol->SetNextComponentNumber(Walker, DFS.ComponentNumber);
|
---|
[68f03d] | 448 | DoLog(3) && (Log() << Verbose(3) << "(7) Walker[" << Walker->getName() << "]'s Compont is " << DFS.ComponentNumber << "." << endl);
|
---|
[174e0e] | 449 | do {
|
---|
[9eefda] | 450 | OtherAtom = DFS.AtomStack->PopLast();
|
---|
[174e0e] | 451 | LeafWalker->Leaf->AddCopyAtom(OtherAtom);
|
---|
[9eefda] | 452 | mol->SetNextComponentNumber(OtherAtom, DFS.ComponentNumber);
|
---|
[68f03d] | 453 | DoLog(3) && (Log() << Verbose(3) << "(7) Other[" << OtherAtom->getName() << "]'s Compont is " << DFS.ComponentNumber << "." << endl);
|
---|
[174e0e] | 454 | } while (OtherAtom != Walker);
|
---|
[9eefda] | 455 | DFS.ComponentNumber++;
|
---|
[174e0e] | 456 | }
|
---|
| 457 | // (8) Walker becomes its Ancestor, go to (3)
|
---|
[68f03d] | 458 | DoLog(2) && (Log() << Verbose(2) << "(8) Walker[" << Walker->getName() << "] is now its Ancestor " << Walker->Ancestor->getName() << ", backstepping. " << endl);
|
---|
[174e0e] | 459 | Walker = Walker->Ancestor;
|
---|
[9eefda] | 460 | DFS.BackStepping = true;
|
---|
[174e0e] | 461 | }
|
---|
[9eefda] | 462 | }
|
---|
| 463 | ;
|
---|
[174e0e] | 464 |
|
---|
[9eefda] | 465 | /** Cleans the root stack when we have found a component.
|
---|
| 466 | * If we are not DFSAccounting::BackStepping, then we clear the root stack by putting everything into a
|
---|
| 467 | * component down till we meet DFSAccounting::Root.
|
---|
| 468 | * \param *out output stream for debugging
|
---|
| 469 | * \param *mol molecule with atoms and finding unused bonds
|
---|
| 470 | * \param *&Walker current node
|
---|
| 471 | * \param *&Binder current edge
|
---|
| 472 | * \param &DFS DFS accounting data
|
---|
| 473 | */
|
---|
[e138de] | 474 | void DepthFirstSearchAnalysis_CleanRootStackDownTillWalker(const molecule * const mol, atom *&Walker, bond *&Binder, struct DFSAccounting &DFS, MoleculeLeafClass *&LeafWalker)
|
---|
[174e0e] | 475 | {
|
---|
| 476 | atom *OtherAtom = NULL;
|
---|
| 477 |
|
---|
[9eefda] | 478 | if (!DFS.BackStepping) { // coming from (8) want to go to (3)
|
---|
[174e0e] | 479 | // (9) remove all from stack till Walker (including), these and Root form a component
|
---|
[99593f] | 480 | //DFS.AtomStack->Output(out);
|
---|
[9eefda] | 481 | mol->SetNextComponentNumber(DFS.Root, DFS.ComponentNumber);
|
---|
[68f03d] | 482 | DoLog(3) && (Log() << Verbose(3) << "(9) Root[" << DFS.Root->getName() << "]'s Component is " << DFS.ComponentNumber << "." << endl);
|
---|
[9eefda] | 483 | mol->SetNextComponentNumber(Walker, DFS.ComponentNumber);
|
---|
[68f03d] | 484 | DoLog(3) && (Log() << Verbose(3) << "(9) Walker[" << Walker->getName() << "]'s Component is " << DFS.ComponentNumber << "." << endl);
|
---|
[174e0e] | 485 | do {
|
---|
[9eefda] | 486 | OtherAtom = DFS.AtomStack->PopLast();
|
---|
[174e0e] | 487 | LeafWalker->Leaf->AddCopyAtom(OtherAtom);
|
---|
[9eefda] | 488 | mol->SetNextComponentNumber(OtherAtom, DFS.ComponentNumber);
|
---|
[68f03d] | 489 | DoLog(3) && (Log() << Verbose(3) << "(7) Other[" << OtherAtom->getName() << "]'s Compont is " << DFS.ComponentNumber << "." << endl);
|
---|
[174e0e] | 490 | } while (OtherAtom != Walker);
|
---|
[9eefda] | 491 | DFS.ComponentNumber++;
|
---|
[174e0e] | 492 |
|
---|
| 493 | // (11) Root is separation vertex, set Walker to Root and go to (4)
|
---|
[9eefda] | 494 | Walker = DFS.Root;
|
---|
[174e0e] | 495 | Binder = mol->FindNextUnused(Walker);
|
---|
[68f03d] | 496 | DoLog(1) && (Log() << Verbose(1) << "(10) Walker is Root[" << DFS.Root->getName() << "], next Unused Bond is " << Binder << "." << endl);
|
---|
[174e0e] | 497 | if (Binder != NULL) { // Root is separation vertex
|
---|
[a67d19] | 498 | DoLog(1) && (Log() << Verbose(1) << "(11) Root is a separation vertex." << endl);
|
---|
[174e0e] | 499 | Walker->SeparationVertex = true;
|
---|
| 500 | }
|
---|
| 501 | }
|
---|
[9eefda] | 502 | }
|
---|
| 503 | ;
|
---|
| 504 |
|
---|
| 505 | /** Initializes DFSAccounting structure.
|
---|
| 506 | * \param *out output stream for debugging
|
---|
| 507 | * \param &DFS accounting structure to allocate
|
---|
[7218f8] | 508 | * \param *mol molecule with AtomCount, BondCount and all atoms
|
---|
[9eefda] | 509 | */
|
---|
[e138de] | 510 | void DepthFirstSearchAnalysis_Init(struct DFSAccounting &DFS, const molecule * const mol)
|
---|
[9eefda] | 511 | {
|
---|
[ea7176] | 512 | DFS.AtomStack = new StackClass<atom *> (mol->getAtomCount());
|
---|
[9eefda] | 513 | DFS.CurrentGraphNr = 0;
|
---|
| 514 | DFS.ComponentNumber = 0;
|
---|
| 515 | DFS.BackStepping = false;
|
---|
[7218f8] | 516 | mol->ResetAllBondsToUnused();
|
---|
| 517 | mol->SetAtomValueToValue(-1, &atom::GraphNr);
|
---|
| 518 | mol->ActOnAllAtoms(&atom::InitComponentNr);
|
---|
| 519 | DFS.BackEdgeStack->ClearStack();
|
---|
[9eefda] | 520 | }
|
---|
| 521 | ;
|
---|
[174e0e] | 522 |
|
---|
[9eefda] | 523 | /** Free's DFSAccounting structure.
|
---|
| 524 | * \param *out output stream for debugging
|
---|
| 525 | * \param &DFS accounting structure to free
|
---|
| 526 | */
|
---|
[e138de] | 527 | void DepthFirstSearchAnalysis_Finalize(struct DFSAccounting &DFS)
|
---|
[9eefda] | 528 | {
|
---|
| 529 | delete (DFS.AtomStack);
|
---|
[7218f8] | 530 | // delete (DFS.BackEdgeStack); // DON'T free, see DepthFirstSearchAnalysis(), is returned as allocated
|
---|
[9eefda] | 531 | }
|
---|
| 532 | ;
|
---|
[174e0e] | 533 |
|
---|
[cee0b57] | 534 | /** Performs a Depth-First search on this molecule.
|
---|
| 535 | * Marks bonds in molecule as cyclic, bridge, ... and atoms as
|
---|
| 536 | * articulations points, ...
|
---|
| 537 | * We use the algorithm from [Even, Graph Algorithms, p.62].
|
---|
| 538 | * \param *out output stream for debugging
|
---|
| 539 | * \param *&BackEdgeStack NULL pointer to StackClass with all the found back edges, allocated and filled on return
|
---|
| 540 | * \return list of each disconnected subgraph as an individual molecule class structure
|
---|
| 541 | */
|
---|
[e138de] | 542 | MoleculeLeafClass * molecule::DepthFirstSearchAnalysis(class StackClass<bond *> *&BackEdgeStack) const
|
---|
[cee0b57] | 543 | {
|
---|
[9eefda] | 544 | struct DFSAccounting DFS;
|
---|
[cee0b57] | 545 | BackEdgeStack = new StackClass<bond *> (BondCount);
|
---|
[9eefda] | 546 | DFS.BackEdgeStack = BackEdgeStack;
|
---|
[cee0b57] | 547 | MoleculeLeafClass *SubGraphs = new MoleculeLeafClass(NULL);
|
---|
| 548 | MoleculeLeafClass *LeafWalker = SubGraphs;
|
---|
[9eefda] | 549 | int OldGraphNr = 0;
|
---|
[174e0e] | 550 | atom *Walker = NULL;
|
---|
[cee0b57] | 551 | bond *Binder = NULL;
|
---|
| 552 |
|
---|
[a7b761b] | 553 | if (getAtomCount() == 0)
|
---|
[046783] | 554 | return SubGraphs;
|
---|
[a67d19] | 555 | DoLog(0) && (Log() << Verbose(0) << "Begin of DepthFirstSearchAnalysis" << endl);
|
---|
[e138de] | 556 | DepthFirstSearchAnalysis_Init(DFS, this);
|
---|
[cee0b57] | 557 |
|
---|
[9879f6] | 558 | for (molecule::const_iterator iter = begin(); iter != end();) {
|
---|
| 559 | DFS.Root = *iter;
|
---|
[7218f8] | 560 | // (1) mark all edges unused, empty stack, set atom->GraphNr = -1 for all
|
---|
[9eefda] | 561 | DFS.AtomStack->ClearStack();
|
---|
[cee0b57] | 562 |
|
---|
| 563 | // put into new subgraph molecule and add this to list of subgraphs
|
---|
| 564 | LeafWalker = new MoleculeLeafClass(LeafWalker);
|
---|
[5f612ee] | 565 | LeafWalker->Leaf = World::getInstance().createMolecule();
|
---|
[9eefda] | 566 | LeafWalker->Leaf->AddCopyAtom(DFS.Root);
|
---|
[cee0b57] | 567 |
|
---|
[9eefda] | 568 | OldGraphNr = DFS.CurrentGraphNr;
|
---|
| 569 | Walker = DFS.Root;
|
---|
[cee0b57] | 570 | do { // (10)
|
---|
| 571 | do { // (2) set number and Lowpoint of Atom to i, increase i, push current atom
|
---|
[e138de] | 572 | DepthFirstSearchAnalysis_SetWalkersGraphNr(Walker, DFS);
|
---|
[174e0e] | 573 |
|
---|
[e138de] | 574 | DepthFirstSearchAnalysis_ProbeAlongUnusedBond(this, Walker, Binder, DFS);
|
---|
[174e0e] | 575 |
|
---|
[cee0b57] | 576 | if (Binder == NULL) {
|
---|
[a67d19] | 577 | DoLog(2) && (Log() << Verbose(2) << "No more Unused Bonds." << endl);
|
---|
[cee0b57] | 578 | break;
|
---|
| 579 | } else
|
---|
| 580 | Binder = NULL;
|
---|
[9eefda] | 581 | } while (1); // (2)
|
---|
[cee0b57] | 582 |
|
---|
| 583 | // if we came from backstepping, yet there were no more unused bonds, we end up here with no Ancestor, because Walker is Root! Then we are finished!
|
---|
[9eefda] | 584 | if ((Walker == DFS.Root) && (Binder == NULL))
|
---|
[cee0b57] | 585 | break;
|
---|
| 586 |
|
---|
[e138de] | 587 | DepthFirstSearchAnalysis_CheckForaNewComponent(this, Walker, DFS, LeafWalker);
|
---|
[174e0e] | 588 |
|
---|
[e138de] | 589 | DepthFirstSearchAnalysis_CleanRootStackDownTillWalker(this, Walker, Binder, DFS, LeafWalker);
|
---|
[174e0e] | 590 |
|
---|
[9eefda] | 591 | } while ((DFS.BackStepping) || (Binder != NULL)); // (10) halt only if Root has no unused edges
|
---|
[cee0b57] | 592 |
|
---|
| 593 | // From OldGraphNr to CurrentGraphNr ranges an disconnected subgraph
|
---|
[a67d19] | 594 | DoLog(0) && (Log() << Verbose(0) << "Disconnected subgraph ranges from " << OldGraphNr << " to " << DFS.CurrentGraphNr << "." << endl);
|
---|
[986ed3] | 595 | LeafWalker->Leaf->Output((ofstream *)&(Log() << Verbose(0)));
|
---|
[a67d19] | 596 | DoLog(0) && (Log() << Verbose(0) << endl);
|
---|
[cee0b57] | 597 |
|
---|
| 598 | // step on to next root
|
---|
[9879f6] | 599 | while ((iter != end()) && ((*iter)->GraphNr != -1)) {
|
---|
| 600 | //Log() << Verbose(1) << "Current next subgraph root candidate is " << (*iter)->Name << "." << endl;
|
---|
| 601 | if ((*iter)->GraphNr != -1) // if already discovered, step on
|
---|
| 602 | iter++;
|
---|
[cee0b57] | 603 | }
|
---|
| 604 | }
|
---|
| 605 | // set cyclic bond criterium on "same LP" basis
|
---|
[266237] | 606 | CyclicBondAnalysis();
|
---|
| 607 |
|
---|
[e138de] | 608 | OutputGraphInfoPerAtom();
|
---|
[266237] | 609 |
|
---|
[e138de] | 610 | OutputGraphInfoPerBond();
|
---|
[266237] | 611 |
|
---|
| 612 | // free all and exit
|
---|
[e138de] | 613 | DepthFirstSearchAnalysis_Finalize(DFS);
|
---|
[a67d19] | 614 | DoLog(0) && (Log() << Verbose(0) << "End of DepthFirstSearchAnalysis" << endl);
|
---|
[266237] | 615 | return SubGraphs;
|
---|
[9eefda] | 616 | }
|
---|
| 617 | ;
|
---|
[266237] | 618 |
|
---|
| 619 | /** Scans through all bonds and set bond::Cyclic to true where atom::LowpointNr of both ends is equal: LP criterion.
|
---|
| 620 | */
|
---|
[fa649a] | 621 | void molecule::CyclicBondAnalysis() const
|
---|
[266237] | 622 | {
|
---|
| 623 | NoCyclicBonds = 0;
|
---|
[e08c46] | 624 | for(molecule::const_iterator AtomRunner = begin(); AtomRunner != end(); ++AtomRunner)
|
---|
| 625 | for(BondList::const_iterator BondRunner = (*AtomRunner)->ListOfBonds.begin(); BondRunner != (*AtomRunner)->ListOfBonds.end(); ++BondRunner)
|
---|
| 626 | if ((*BondRunner)->leftatom == *AtomRunner)
|
---|
| 627 | if ((*BondRunner)->rightatom->LowpointNr == (*BondRunner)->leftatom->LowpointNr) { // cyclic ??
|
---|
| 628 | (*BondRunner)->Cyclic = true;
|
---|
| 629 | NoCyclicBonds++;
|
---|
| 630 | }
|
---|
[9eefda] | 631 | }
|
---|
| 632 | ;
|
---|
[cee0b57] | 633 |
|
---|
[266237] | 634 | /** Output graph information per atom.
|
---|
| 635 | * \param *out output stream
|
---|
| 636 | */
|
---|
[e138de] | 637 | void molecule::OutputGraphInfoPerAtom() const
|
---|
[266237] | 638 | {
|
---|
[a67d19] | 639 | DoLog(1) && (Log() << Verbose(1) << "Final graph info for each atom is:" << endl);
|
---|
[e138de] | 640 | ActOnAllAtoms( &atom::OutputGraphInfo );
|
---|
[9eefda] | 641 | }
|
---|
| 642 | ;
|
---|
[cee0b57] | 643 |
|
---|
[266237] | 644 | /** Output graph information per bond.
|
---|
| 645 | * \param *out output stream
|
---|
| 646 | */
|
---|
[e138de] | 647 | void molecule::OutputGraphInfoPerBond() const
|
---|
[266237] | 648 | {
|
---|
[e08c46] | 649 | bond *Binder = NULL;
|
---|
[a67d19] | 650 | DoLog(1) && (Log() << Verbose(1) << "Final graph info for each bond is:" << endl);
|
---|
[e08c46] | 651 | for(molecule::const_iterator AtomRunner = begin(); AtomRunner != end(); ++AtomRunner)
|
---|
[bd6bfa] | 652 | for(BondList::const_iterator BondRunner = (*AtomRunner)->ListOfBonds.begin(); BondRunner != (*AtomRunner)->ListOfBonds.end(); ++BondRunner)
|
---|
[e08c46] | 653 | if ((*BondRunner)->leftatom == *AtomRunner) {
|
---|
| 654 | Binder = *BondRunner;
|
---|
[f9183b] | 655 | if (DoLog(2)) {
|
---|
| 656 | ostream &out = (Log() << Verbose(2));
|
---|
| 657 | out << ((Binder->Type == TreeEdge) ? "TreeEdge " : "BackEdge ") << *Binder << ": <";
|
---|
| 658 | out << ((Binder->leftatom->SeparationVertex) ? "SP," : "") << "L" << Binder->leftatom->LowpointNr << " G" << Binder->leftatom->GraphNr << " Comp.";
|
---|
| 659 | Binder->leftatom->OutputComponentNumber(&out);
|
---|
| 660 | out << " === ";
|
---|
| 661 | out << ((Binder->rightatom->SeparationVertex) ? "SP," : "") << "L" << Binder->rightatom->LowpointNr << " G" << Binder->rightatom->GraphNr << " Comp.";
|
---|
| 662 | Binder->rightatom->OutputComponentNumber(&out);
|
---|
| 663 | out << ">." << endl;
|
---|
| 664 | }
|
---|
[e08c46] | 665 | if (Binder->Cyclic) // cyclic ??
|
---|
| 666 | DoLog(3) && (Log() << Verbose(3) << "Lowpoint at each side are equal: CYCLIC!" << endl);
|
---|
| 667 | }
|
---|
[9eefda] | 668 | }
|
---|
| 669 | ;
|
---|
| 670 |
|
---|
| 671 | /** Initialise each vertex as white with no predecessor, empty queue, color Root lightgray.
|
---|
| 672 | * \param *out output stream for debugging
|
---|
| 673 | * \param &BFS accounting structure
|
---|
| 674 | * \param AtomCount number of entries in the array to allocate
|
---|
| 675 | */
|
---|
[e138de] | 676 | void InitializeBFSAccounting(struct BFSAccounting &BFS, int AtomCount)
|
---|
[9eefda] | 677 | {
|
---|
| 678 | BFS.AtomCount = AtomCount;
|
---|
[920c70] | 679 | BFS.PredecessorList = new atom*[AtomCount];
|
---|
| 680 | BFS.ShortestPathList = new int[AtomCount];
|
---|
| 681 | BFS.ColorList = new enum Shading[AtomCount];
|
---|
[9eefda] | 682 | BFS.BFSStack = new StackClass<atom *> (AtomCount);
|
---|
[c27778] | 683 | BFS.TouchedStack = new StackClass<atom *> (AtomCount);
|
---|
[9eefda] | 684 |
|
---|
[920c70] | 685 | for (int i = AtomCount; i--;) {
|
---|
[9eefda] | 686 | BFS.ShortestPathList[i] = -1;
|
---|
[920c70] | 687 | BFS.PredecessorList[i] = 0;
|
---|
[c27778] | 688 | BFS.ColorList[i] = white;
|
---|
[920c70] | 689 | }
|
---|
[cee0b57] | 690 | };
|
---|
| 691 |
|
---|
[9eefda] | 692 | /** Free's accounting structure.
|
---|
| 693 | * \param *out output stream for debugging
|
---|
| 694 | * \param &BFS accounting structure
|
---|
| 695 | */
|
---|
[e138de] | 696 | void FinalizeBFSAccounting(struct BFSAccounting &BFS)
|
---|
[9eefda] | 697 | {
|
---|
[920c70] | 698 | delete[](BFS.PredecessorList);
|
---|
| 699 | delete[](BFS.ShortestPathList);
|
---|
| 700 | delete[](BFS.ColorList);
|
---|
[9eefda] | 701 | delete (BFS.BFSStack);
|
---|
[c27778] | 702 | delete (BFS.TouchedStack);
|
---|
[9eefda] | 703 | BFS.AtomCount = 0;
|
---|
| 704 | };
|
---|
| 705 |
|
---|
| 706 | /** Clean the accounting structure.
|
---|
| 707 | * \param *out output stream for debugging
|
---|
| 708 | * \param &BFS accounting structure
|
---|
[ef9aae] | 709 | */
|
---|
[e138de] | 710 | void CleanBFSAccounting(struct BFSAccounting &BFS)
|
---|
[ef9aae] | 711 | {
|
---|
[9eefda] | 712 | atom *Walker = NULL;
|
---|
| 713 | while (!BFS.TouchedStack->IsEmpty()) {
|
---|
| 714 | Walker = BFS.TouchedStack->PopFirst();
|
---|
| 715 | BFS.PredecessorList[Walker->nr] = NULL;
|
---|
| 716 | BFS.ShortestPathList[Walker->nr] = -1;
|
---|
| 717 | BFS.ColorList[Walker->nr] = white;
|
---|
[ef9aae] | 718 | }
|
---|
| 719 | };
|
---|
| 720 |
|
---|
[9eefda] | 721 | /** Resets shortest path list and BFSStack.
|
---|
| 722 | * \param *out output stream for debugging
|
---|
| 723 | * \param *&Walker current node, pushed onto BFSAccounting::BFSStack and BFSAccounting::TouchedStack
|
---|
| 724 | * \param &BFS accounting structure
|
---|
| 725 | */
|
---|
[e138de] | 726 | void ResetBFSAccounting(atom *&Walker, struct BFSAccounting &BFS)
|
---|
[ef9aae] | 727 | {
|
---|
[9eefda] | 728 | BFS.ShortestPathList[Walker->nr] = 0;
|
---|
| 729 | BFS.BFSStack->ClearStack(); // start with empty BFS stack
|
---|
| 730 | BFS.BFSStack->Push(Walker);
|
---|
| 731 | BFS.TouchedStack->Push(Walker);
|
---|
[ef9aae] | 732 | };
|
---|
| 733 |
|
---|
[9eefda] | 734 | /** Performs a BFS from \a *Root, trying to find the same node and hence a cycle.
|
---|
| 735 | * \param *out output stream for debugging
|
---|
| 736 | * \param *&BackEdge the edge from root that we don't want to move along
|
---|
| 737 | * \param &BFS accounting structure
|
---|
| 738 | */
|
---|
[e138de] | 739 | void CyclicStructureAnalysis_CyclicBFSFromRootToRoot(bond *&BackEdge, struct BFSAccounting &BFS)
|
---|
[ef9aae] | 740 | {
|
---|
| 741 | atom *Walker = NULL;
|
---|
| 742 | atom *OtherAtom = NULL;
|
---|
[9eefda] | 743 | do { // look for Root
|
---|
| 744 | Walker = BFS.BFSStack->PopFirst();
|
---|
[a67d19] | 745 | DoLog(2) && (Log() << Verbose(2) << "Current Walker is " << *Walker << ", we look for SP to Root " << *BFS.Root << "." << endl);
|
---|
[ef9aae] | 746 | for (BondList::const_iterator Runner = Walker->ListOfBonds.begin(); Runner != Walker->ListOfBonds.end(); (++Runner)) {
|
---|
| 747 | if ((*Runner) != BackEdge) { // only walk along DFS spanning tree (otherwise we always find SP of one being backedge Binder)
|
---|
| 748 | OtherAtom = (*Runner)->GetOtherAtom(Walker);
|
---|
[9eefda] | 749 | #ifdef ADDHYDROGEN
|
---|
[83f176] | 750 | if (OtherAtom->getType()->getAtomicNumber() != 1) {
|
---|
[9eefda] | 751 | #endif
|
---|
[68f03d] | 752 | DoLog(2) && (Log() << Verbose(2) << "Current OtherAtom is: " << OtherAtom->getName() << " for bond " << *(*Runner) << "." << endl);
|
---|
[9eefda] | 753 | if (BFS.ColorList[OtherAtom->nr] == white) {
|
---|
| 754 | BFS.TouchedStack->Push(OtherAtom);
|
---|
| 755 | BFS.ColorList[OtherAtom->nr] = lightgray;
|
---|
| 756 | BFS.PredecessorList[OtherAtom->nr] = Walker; // Walker is the predecessor
|
---|
| 757 | BFS.ShortestPathList[OtherAtom->nr] = BFS.ShortestPathList[Walker->nr] + 1;
|
---|
[68f03d] | 758 | DoLog(2) && (Log() << Verbose(2) << "Coloring OtherAtom " << OtherAtom->getName() << " lightgray, its predecessor is " << Walker->getName() << " and its Shortest Path is " << BFS.ShortestPathList[OtherAtom->nr] << " egde(s) long." << endl);
|
---|
[9eefda] | 759 | //if (BFS.ShortestPathList[OtherAtom->nr] < MinimumRingSize[Walker->GetTrueFather()->nr]) { // Check for maximum distance
|
---|
[a67d19] | 760 | DoLog(3) && (Log() << Verbose(3) << "Putting OtherAtom into queue." << endl);
|
---|
[9eefda] | 761 | BFS.BFSStack->Push(OtherAtom);
|
---|
| 762 | //}
|
---|
[ef9aae] | 763 | } else {
|
---|
[a67d19] | 764 | DoLog(3) && (Log() << Verbose(3) << "Not Adding, has already been visited." << endl);
|
---|
[ef9aae] | 765 | }
|
---|
[9eefda] | 766 | if (OtherAtom == BFS.Root)
|
---|
| 767 | break;
|
---|
| 768 | #ifdef ADDHYDROGEN
|
---|
| 769 | } else {
|
---|
[a67d19] | 770 | DoLog(2) && (Log() << Verbose(2) << "Skipping hydrogen atom " << *OtherAtom << "." << endl);
|
---|
[9eefda] | 771 | BFS.ColorList[OtherAtom->nr] = black;
|
---|
| 772 | }
|
---|
| 773 | #endif
|
---|
[ef9aae] | 774 | } else {
|
---|
[a67d19] | 775 | DoLog(2) && (Log() << Verbose(2) << "Bond " << *(*Runner) << " not Visiting, is the back edge." << endl);
|
---|
[ef9aae] | 776 | }
|
---|
| 777 | }
|
---|
[9eefda] | 778 | BFS.ColorList[Walker->nr] = black;
|
---|
[68f03d] | 779 | DoLog(1) && (Log() << Verbose(1) << "Coloring Walker " << Walker->getName() << " black." << endl);
|
---|
[9eefda] | 780 | if (OtherAtom == BFS.Root) { // if we have found the root, check whether this cycle wasn't already found beforehand
|
---|
[ef9aae] | 781 | // step through predecessor list
|
---|
| 782 | while (OtherAtom != BackEdge->rightatom) {
|
---|
[9eefda] | 783 | if (!OtherAtom->GetTrueFather()->IsCyclic) // if one bond in the loop is not marked as cyclic, we haven't found this cycle yet
|
---|
[ef9aae] | 784 | break;
|
---|
| 785 | else
|
---|
[9eefda] | 786 | OtherAtom = BFS.PredecessorList[OtherAtom->nr];
|
---|
[ef9aae] | 787 | }
|
---|
| 788 | if (OtherAtom == BackEdge->rightatom) { // if each atom in found cycle is cyclic, loop's been found before already
|
---|
[a67d19] | 789 | DoLog(3) && (Log() << Verbose(3) << "This cycle was already found before, skipping and removing seeker from search." << endl);
|
---|
[ef9aae] | 790 | do {
|
---|
[9eefda] | 791 | OtherAtom = BFS.TouchedStack->PopLast();
|
---|
| 792 | if (BFS.PredecessorList[OtherAtom->nr] == Walker) {
|
---|
[a67d19] | 793 | DoLog(4) && (Log() << Verbose(4) << "Removing " << *OtherAtom << " from lists and stacks." << endl);
|
---|
[9eefda] | 794 | BFS.PredecessorList[OtherAtom->nr] = NULL;
|
---|
| 795 | BFS.ShortestPathList[OtherAtom->nr] = -1;
|
---|
| 796 | BFS.ColorList[OtherAtom->nr] = white;
|
---|
| 797 | BFS.BFSStack->RemoveItem(OtherAtom);
|
---|
[ef9aae] | 798 | }
|
---|
[9eefda] | 799 | } while ((!BFS.TouchedStack->IsEmpty()) && (BFS.PredecessorList[OtherAtom->nr] == NULL));
|
---|
| 800 | BFS.TouchedStack->Push(OtherAtom); // last was wrongly popped
|
---|
[ef9aae] | 801 | OtherAtom = BackEdge->rightatom; // set to not Root
|
---|
| 802 | } else
|
---|
[9eefda] | 803 | OtherAtom = BFS.Root;
|
---|
[ef9aae] | 804 | }
|
---|
[9eefda] | 805 | } while ((!BFS.BFSStack->IsEmpty()) && (OtherAtom != BFS.Root) && (OtherAtom != NULL)); // || (ShortestPathList[OtherAtom->nr] < MinimumRingSize[Walker->GetTrueFather()->nr])));
|
---|
[ef9aae] | 806 | };
|
---|
| 807 |
|
---|
[9eefda] | 808 | /** Climb back the BFSAccounting::PredecessorList and find cycle members.
|
---|
| 809 | * \param *out output stream for debugging
|
---|
| 810 | * \param *&OtherAtom
|
---|
| 811 | * \param *&BackEdge denotes the edge we did not want to travel along when doing CyclicBFSFromRootToRoot()
|
---|
| 812 | * \param &BFS accounting structure
|
---|
| 813 | * \param *&MinimumRingSize minimum distance from this node possible without encountering oneself, set on return for each atom
|
---|
| 814 | * \param &MinRingSize global minimum distance from one node without encountering oneself, set on return
|
---|
| 815 | */
|
---|
[e138de] | 816 | void CyclicStructureAnalysis_RetrieveCycleMembers(atom *&OtherAtom, bond *&BackEdge, struct BFSAccounting &BFS, int *&MinimumRingSize, int &MinRingSize)
|
---|
[ef9aae] | 817 | {
|
---|
| 818 | atom *Walker = NULL;
|
---|
| 819 | int NumCycles = 0;
|
---|
| 820 | int RingSize = -1;
|
---|
| 821 |
|
---|
[9eefda] | 822 | if (OtherAtom == BFS.Root) {
|
---|
[ef9aae] | 823 | // now climb back the predecessor list and thus find the cycle members
|
---|
| 824 | NumCycles++;
|
---|
| 825 | RingSize = 1;
|
---|
[9eefda] | 826 | BFS.Root->GetTrueFather()->IsCyclic = true;
|
---|
[a67d19] | 827 | DoLog(1) && (Log() << Verbose(1) << "Found ring contains: ");
|
---|
[9eefda] | 828 | Walker = BFS.Root;
|
---|
[ef9aae] | 829 | while (Walker != BackEdge->rightatom) {
|
---|
[68f03d] | 830 | DoLog(0) && (Log() << Verbose(0) << Walker->getName() << " <-> ");
|
---|
[9eefda] | 831 | Walker = BFS.PredecessorList[Walker->nr];
|
---|
[ef9aae] | 832 | Walker->GetTrueFather()->IsCyclic = true;
|
---|
| 833 | RingSize++;
|
---|
| 834 | }
|
---|
[68f03d] | 835 | DoLog(0) && (Log() << Verbose(0) << Walker->getName() << " with a length of " << RingSize << "." << endl << endl);
|
---|
[ef9aae] | 836 | // walk through all and set MinimumRingSize
|
---|
[9eefda] | 837 | Walker = BFS.Root;
|
---|
[ef9aae] | 838 | MinimumRingSize[Walker->GetTrueFather()->nr] = RingSize;
|
---|
| 839 | while (Walker != BackEdge->rightatom) {
|
---|
[9eefda] | 840 | Walker = BFS.PredecessorList[Walker->nr];
|
---|
[ef9aae] | 841 | if (RingSize < MinimumRingSize[Walker->GetTrueFather()->nr])
|
---|
| 842 | MinimumRingSize[Walker->GetTrueFather()->nr] = RingSize;
|
---|
| 843 | }
|
---|
| 844 | if ((RingSize < MinRingSize) || (MinRingSize == -1))
|
---|
| 845 | MinRingSize = RingSize;
|
---|
| 846 | } else {
|
---|
[c27778] | 847 | DoLog(1) && (Log() << Verbose(1) << "No ring containing " << *BFS.Root << " with length equal to or smaller than " << MinimumRingSize[BFS.Root->GetTrueFather()->nr] << " found." << endl);
|
---|
[ef9aae] | 848 | }
|
---|
| 849 | };
|
---|
| 850 |
|
---|
[9eefda] | 851 | /** From a given node performs a BFS to touch the next cycle, for whose nodes \a *&MinimumRingSize is set and set it accordingly.
|
---|
| 852 | * \param *out output stream for debugging
|
---|
| 853 | * \param *&Root node to look for closest cycle from, i.e. \a *&MinimumRingSize is set for this node
|
---|
| 854 | * \param *&MinimumRingSize minimum distance from this node possible without encountering oneself, set on return for each atom
|
---|
| 855 | * \param AtomCount number of nodes in graph
|
---|
| 856 | */
|
---|
[e138de] | 857 | void CyclicStructureAnalysis_BFSToNextCycle(atom *&Root, atom *&Walker, int *&MinimumRingSize, int AtomCount)
|
---|
[ef9aae] | 858 | {
|
---|
[9eefda] | 859 | struct BFSAccounting BFS;
|
---|
[ef9aae] | 860 | atom *OtherAtom = Walker;
|
---|
| 861 |
|
---|
[e138de] | 862 | InitializeBFSAccounting(BFS, AtomCount);
|
---|
[ef9aae] | 863 |
|
---|
[e138de] | 864 | ResetBFSAccounting(Walker, BFS);
|
---|
[9eefda] | 865 | while (OtherAtom != NULL) { // look for Root
|
---|
| 866 | Walker = BFS.BFSStack->PopFirst();
|
---|
[e138de] | 867 | //Log() << Verbose(2) << "Current Walker is " << *Walker << ", we look for SP to Root " << *Root << "." << endl;
|
---|
[ef9aae] | 868 | for (BondList::const_iterator Runner = Walker->ListOfBonds.begin(); Runner != Walker->ListOfBonds.end(); (++Runner)) {
|
---|
[9eefda] | 869 | // "removed (*Runner) != BackEdge) || " from next if, is u
|
---|
| 870 | if ((Walker->ListOfBonds.size() == 1)) { // only walk along DFS spanning tree (otherwise we always find SP of 1 being backedge Binder), but terminal hydrogens may be connected via backedge, hence extra check
|
---|
[ef9aae] | 871 | OtherAtom = (*Runner)->GetOtherAtom(Walker);
|
---|
[e138de] | 872 | //Log() << Verbose(2) << "Current OtherAtom is: " << OtherAtom->Name << " for bond " << *Binder << "." << endl;
|
---|
[9eefda] | 873 | if (BFS.ColorList[OtherAtom->nr] == white) {
|
---|
| 874 | BFS.TouchedStack->Push(OtherAtom);
|
---|
| 875 | BFS.ColorList[OtherAtom->nr] = lightgray;
|
---|
| 876 | BFS.PredecessorList[OtherAtom->nr] = Walker; // Walker is the predecessor
|
---|
| 877 | BFS.ShortestPathList[OtherAtom->nr] = BFS.ShortestPathList[Walker->nr] + 1;
|
---|
[e138de] | 878 | //Log() << Verbose(2) << "Coloring OtherAtom " << OtherAtom->Name << " lightgray, its predecessor is " << Walker->Name << " and its Shortest Path is " << ShortestPathList[OtherAtom->nr] << " egde(s) long." << endl;
|
---|
[ef9aae] | 879 | if (OtherAtom->GetTrueFather()->IsCyclic) { // if the other atom is connected to a ring
|
---|
[9eefda] | 880 | MinimumRingSize[Root->GetTrueFather()->nr] = BFS.ShortestPathList[OtherAtom->nr] + MinimumRingSize[OtherAtom->GetTrueFather()->nr];
|
---|
[ef9aae] | 881 | OtherAtom = NULL; //break;
|
---|
| 882 | break;
|
---|
| 883 | } else
|
---|
[9eefda] | 884 | BFS.BFSStack->Push(OtherAtom);
|
---|
[ef9aae] | 885 | } else {
|
---|
[e138de] | 886 | //Log() << Verbose(3) << "Not Adding, has already been visited." << endl;
|
---|
[ef9aae] | 887 | }
|
---|
| 888 | } else {
|
---|
[e138de] | 889 | //Log() << Verbose(3) << "Not Visiting, is a back edge." << endl;
|
---|
[ef9aae] | 890 | }
|
---|
| 891 | }
|
---|
[9eefda] | 892 | BFS.ColorList[Walker->nr] = black;
|
---|
[e138de] | 893 | //Log() << Verbose(1) << "Coloring Walker " << Walker->Name << " black." << endl;
|
---|
[ef9aae] | 894 | }
|
---|
| 895 | //CleanAccountingLists(TouchedStack, PredecessorList, ShortestPathList, ColorList);
|
---|
| 896 |
|
---|
[e138de] | 897 | FinalizeBFSAccounting(BFS);
|
---|
[9eefda] | 898 | }
|
---|
| 899 | ;
|
---|
[ef9aae] | 900 |
|
---|
[9eefda] | 901 | /** All nodes that are not in cycles get assigned a \a *&MinimumRingSizeby BFS to next cycle.
|
---|
| 902 | * \param *out output stream for debugging
|
---|
| 903 | * \param *&MinimumRingSize array with minimum distance without encountering onself for each atom
|
---|
| 904 | * \param &MinRingSize global minium distance
|
---|
| 905 | * \param &NumCyles number of cycles in graph
|
---|
| 906 | * \param *mol molecule with atoms
|
---|
| 907 | */
|
---|
[e138de] | 908 | void CyclicStructureAnalysis_AssignRingSizetoNonCycleMembers(int *&MinimumRingSize, int &MinRingSize, int &NumCycles, const molecule * const mol)
|
---|
[ef9aae] | 909 | {
|
---|
[9eefda] | 910 | atom *Root = NULL;
|
---|
[ef9aae] | 911 | atom *Walker = NULL;
|
---|
| 912 | if (MinRingSize != -1) { // if rings are present
|
---|
| 913 | // go over all atoms
|
---|
[9879f6] | 914 | for (molecule::const_iterator iter = mol->begin(); iter != mol->end(); ++iter) {
|
---|
| 915 | Root = *iter;
|
---|
[ef9aae] | 916 |
|
---|
[ea7176] | 917 | if (MinimumRingSize[Root->GetTrueFather()->nr] == mol->getAtomCount()) { // check whether MinimumRingSize is set, if not BFS to next where it is
|
---|
[ef9aae] | 918 | Walker = Root;
|
---|
| 919 |
|
---|
[e138de] | 920 | //Log() << Verbose(1) << "---------------------------------------------------------------------------------------------------------" << endl;
|
---|
[ea7176] | 921 | CyclicStructureAnalysis_BFSToNextCycle(Root, Walker, MinimumRingSize, mol->getAtomCount());
|
---|
[ef9aae] | 922 |
|
---|
| 923 | }
|
---|
[a67d19] | 924 | DoLog(1) && (Log() << Verbose(1) << "Minimum ring size of " << *Root << " is " << MinimumRingSize[Root->GetTrueFather()->nr] << "." << endl);
|
---|
[ef9aae] | 925 | }
|
---|
[a67d19] | 926 | DoLog(1) && (Log() << Verbose(1) << "Minimum ring size is " << MinRingSize << ", over " << NumCycles << " cycles total." << endl);
|
---|
[ef9aae] | 927 | } else
|
---|
[a67d19] | 928 | DoLog(1) && (Log() << Verbose(1) << "No rings were detected in the molecular structure." << endl);
|
---|
[9eefda] | 929 | }
|
---|
| 930 | ;
|
---|
[ef9aae] | 931 |
|
---|
[cee0b57] | 932 | /** Analyses the cycles found and returns minimum of all cycle lengths.
|
---|
| 933 | * We begin with a list of Back edges found during DepthFirstSearchAnalysis(). We go through this list - one end is the Root,
|
---|
| 934 | * the other our initial Walker - and do a Breadth First Search for the Root. We mark down each Predecessor and as soon as
|
---|
| 935 | * we have found the Root via BFS, we may climb back the closed cycle via the Predecessors. Thereby we mark atoms and bonds
|
---|
| 936 | * as cyclic and print out the cycles.
|
---|
| 937 | * \param *out output stream for debugging
|
---|
| 938 | * \param *BackEdgeStack stack with all back edges found during DFS scan. Beware: This stack contains the bonds from the total molecule, not from the subgraph!
|
---|
| 939 | * \param *&MinimumRingSize contains smallest ring size in molecular structure on return or -1 if no rings were found, if set is maximum search distance
|
---|
| 940 | * \todo BFS from the not-same-LP to find back to starting point of tributary cycle over more than one bond
|
---|
| 941 | */
|
---|
[e138de] | 942 | void molecule::CyclicStructureAnalysis(class StackClass<bond *> * BackEdgeStack, int *&MinimumRingSize) const
|
---|
[cee0b57] | 943 | {
|
---|
[9eefda] | 944 | struct BFSAccounting BFS;
|
---|
[ef9aae] | 945 | atom *Walker = NULL;
|
---|
| 946 | atom *OtherAtom = NULL;
|
---|
| 947 | bond *BackEdge = NULL;
|
---|
| 948 | int NumCycles = 0;
|
---|
| 949 | int MinRingSize = -1;
|
---|
[cee0b57] | 950 |
|
---|
[ea7176] | 951 | InitializeBFSAccounting(BFS, getAtomCount());
|
---|
[cee0b57] | 952 |
|
---|
[e138de] | 953 | //Log() << Verbose(1) << "Back edge list - ";
|
---|
[99593f] | 954 | //BackEdgeStack->Output(out);
|
---|
[cee0b57] | 955 |
|
---|
[a67d19] | 956 | DoLog(1) && (Log() << Verbose(1) << "Analysing cycles ... " << endl);
|
---|
[cee0b57] | 957 | NumCycles = 0;
|
---|
| 958 | while (!BackEdgeStack->IsEmpty()) {
|
---|
| 959 | BackEdge = BackEdgeStack->PopFirst();
|
---|
| 960 | // this is the target
|
---|
[9eefda] | 961 | BFS.Root = BackEdge->leftatom;
|
---|
[cee0b57] | 962 | // this is the source point
|
---|
| 963 | Walker = BackEdge->rightatom;
|
---|
| 964 |
|
---|
[e138de] | 965 | ResetBFSAccounting(Walker, BFS);
|
---|
[cee0b57] | 966 |
|
---|
[a67d19] | 967 | DoLog(1) && (Log() << Verbose(1) << "---------------------------------------------------------------------------------------------------------" << endl);
|
---|
[ef9aae] | 968 | OtherAtom = NULL;
|
---|
[e138de] | 969 | CyclicStructureAnalysis_CyclicBFSFromRootToRoot(BackEdge, BFS);
|
---|
[cee0b57] | 970 |
|
---|
[e138de] | 971 | CyclicStructureAnalysis_RetrieveCycleMembers(OtherAtom, BackEdge, BFS, MinimumRingSize, MinRingSize);
|
---|
[cee0b57] | 972 |
|
---|
[e138de] | 973 | CleanBFSAccounting(BFS);
|
---|
[ef9aae] | 974 | }
|
---|
[e138de] | 975 | FinalizeBFSAccounting(BFS);
|
---|
[ef9aae] | 976 |
|
---|
[e138de] | 977 | CyclicStructureAnalysis_AssignRingSizetoNonCycleMembers(MinimumRingSize, MinRingSize, NumCycles, this);
|
---|
[fa649a] | 978 | };
|
---|
[cee0b57] | 979 |
|
---|
| 980 | /** Sets the next component number.
|
---|
| 981 | * This is O(N) as the number of bonds per atom is bound.
|
---|
| 982 | * \param *vertex atom whose next atom::*ComponentNr is to be set
|
---|
| 983 | * \param nr number to use
|
---|
| 984 | */
|
---|
[fa649a] | 985 | void molecule::SetNextComponentNumber(atom *vertex, int nr) const
|
---|
[cee0b57] | 986 | {
|
---|
[9eefda] | 987 | size_t i = 0;
|
---|
[cee0b57] | 988 | if (vertex != NULL) {
|
---|
[9eefda] | 989 | for (; i < vertex->ListOfBonds.size(); i++) {
|
---|
| 990 | if (vertex->ComponentNr[i] == -1) { // check if not yet used
|
---|
[cee0b57] | 991 | vertex->ComponentNr[i] = nr;
|
---|
| 992 | break;
|
---|
[9eefda] | 993 | } else if (vertex->ComponentNr[i] == nr) // if number is already present, don't add another time
|
---|
| 994 | break; // breaking here will not cause error!
|
---|
[cee0b57] | 995 | }
|
---|
[e359a8] | 996 | if (i == vertex->ListOfBonds.size()) {
|
---|
[58ed4a] | 997 | DoeLog(0) && (eLog()<< Verbose(0) << "Error: All Component entries are already occupied!" << endl);
|
---|
[e359a8] | 998 | performCriticalExit();
|
---|
| 999 | }
|
---|
| 1000 | } else {
|
---|
[58ed4a] | 1001 | DoeLog(0) && (eLog()<< Verbose(0) << "Error: Given vertex is NULL!" << endl);
|
---|
[e359a8] | 1002 | performCriticalExit();
|
---|
| 1003 | }
|
---|
[9eefda] | 1004 | }
|
---|
| 1005 | ;
|
---|
[cee0b57] | 1006 |
|
---|
| 1007 | /** Returns next unused bond for this atom \a *vertex or NULL of none exists.
|
---|
| 1008 | * \param *vertex atom to regard
|
---|
| 1009 | * \return bond class or NULL
|
---|
| 1010 | */
|
---|
[fa649a] | 1011 | bond * molecule::FindNextUnused(atom *vertex) const
|
---|
[cee0b57] | 1012 | {
|
---|
[266237] | 1013 | for (BondList::const_iterator Runner = vertex->ListOfBonds.begin(); Runner != vertex->ListOfBonds.end(); (++Runner))
|
---|
| 1014 | if ((*Runner)->IsUsed() == white)
|
---|
[9eefda] | 1015 | return ((*Runner));
|
---|
[cee0b57] | 1016 | return NULL;
|
---|
[9eefda] | 1017 | }
|
---|
| 1018 | ;
|
---|
[cee0b57] | 1019 |
|
---|
| 1020 | /** Resets bond::Used flag of all bonds in this molecule.
|
---|
| 1021 | * \return true - success, false - -failure
|
---|
| 1022 | */
|
---|
[fa649a] | 1023 | void molecule::ResetAllBondsToUnused() const
|
---|
[cee0b57] | 1024 | {
|
---|
[e08c46] | 1025 | for(molecule::const_iterator AtomRunner = begin(); AtomRunner != end(); ++AtomRunner)
|
---|
| 1026 | for(BondList::const_iterator BondRunner = (*AtomRunner)->ListOfBonds.begin(); BondRunner != (*AtomRunner)->ListOfBonds.end(); ++BondRunner)
|
---|
| 1027 | if ((*BondRunner)->leftatom == *AtomRunner)
|
---|
| 1028 | (*BondRunner)->ResetUsed();
|
---|
[9eefda] | 1029 | }
|
---|
| 1030 | ;
|
---|
[cee0b57] | 1031 |
|
---|
| 1032 | /** Output a list of flags, stating whether the bond was visited or not.
|
---|
| 1033 | * \param *out output stream for debugging
|
---|
| 1034 | * \param *list
|
---|
| 1035 | */
|
---|
[e138de] | 1036 | void OutputAlreadyVisited(int *list)
|
---|
[cee0b57] | 1037 | {
|
---|
[a67d19] | 1038 | DoLog(4) && (Log() << Verbose(4) << "Already Visited Bonds:\t");
|
---|
[9eefda] | 1039 | for (int i = 1; i <= list[0]; i++)
|
---|
[a67d19] | 1040 | DoLog(0) && (Log() << Verbose(0) << list[i] << " ");
|
---|
| 1041 | DoLog(0) && (Log() << Verbose(0) << endl);
|
---|
[9eefda] | 1042 | }
|
---|
| 1043 | ;
|
---|
[cee0b57] | 1044 |
|
---|
| 1045 | /** Storing the bond structure of a molecule to file.
|
---|
| 1046 | * Simply stores Atom::nr and then the Atom::nr of all bond partners per line.
|
---|
[35b698] | 1047 | * \param &filename name of file
|
---|
| 1048 | * \param path path to file, defaults to empty
|
---|
[cee0b57] | 1049 | * \return true - file written successfully, false - writing failed
|
---|
| 1050 | */
|
---|
[35b698] | 1051 | bool molecule::StoreAdjacencyToFile(std::string &filename, std::string path)
|
---|
[cee0b57] | 1052 | {
|
---|
| 1053 | ofstream AdjacencyFile;
|
---|
[35b698] | 1054 | string line;
|
---|
[cee0b57] | 1055 | bool status = true;
|
---|
| 1056 |
|
---|
[35b698] | 1057 | if (path != "")
|
---|
| 1058 | line = path + "/" + filename;
|
---|
[8ab0407] | 1059 | else
|
---|
[35b698] | 1060 | line = filename;
|
---|
| 1061 | AdjacencyFile.open(line.c_str(), ios::out);
|
---|
[acf800] | 1062 | DoLog(1) && (Log() << Verbose(1) << "Saving adjacency list ... " << endl);
|
---|
[35b698] | 1063 | if (AdjacencyFile.good()) {
|
---|
[1f1b23] | 1064 | AdjacencyFile << "m\tn" << endl;
|
---|
[9eefda] | 1065 | ActOnAllAtoms(&atom::OutputAdjacency, &AdjacencyFile);
|
---|
[cee0b57] | 1066 | AdjacencyFile.close();
|
---|
[acf800] | 1067 | DoLog(1) && (Log() << Verbose(1) << "\t... done." << endl);
|
---|
[cee0b57] | 1068 | } else {
|
---|
[35b698] | 1069 | DoLog(1) && (Log() << Verbose(1) << "\t... failed to open file " << line << "." << endl);
|
---|
[cee0b57] | 1070 | status = false;
|
---|
| 1071 | }
|
---|
| 1072 |
|
---|
| 1073 | return status;
|
---|
[9eefda] | 1074 | }
|
---|
| 1075 | ;
|
---|
[cee0b57] | 1076 |
|
---|
[1f1b23] | 1077 | /** Storing the bond structure of a molecule to file.
|
---|
| 1078 | * Simply stores Atom::nr and then the Atom::nr of all bond partners, one per line.
|
---|
[35b698] | 1079 | * \param &filename name of file
|
---|
| 1080 | * \param path path to file, defaults to empty
|
---|
[1f1b23] | 1081 | * \return true - file written successfully, false - writing failed
|
---|
| 1082 | */
|
---|
[35b698] | 1083 | bool molecule::StoreBondsToFile(std::string &filename, std::string path)
|
---|
[1f1b23] | 1084 | {
|
---|
| 1085 | ofstream BondFile;
|
---|
[35b698] | 1086 | string line;
|
---|
[1f1b23] | 1087 | bool status = true;
|
---|
| 1088 |
|
---|
[35b698] | 1089 | if (path != "")
|
---|
| 1090 | line = path + "/" + filename;
|
---|
[8ab0407] | 1091 | else
|
---|
[35b698] | 1092 | line = filename;
|
---|
| 1093 | BondFile.open(line.c_str(), ios::out);
|
---|
[acf800] | 1094 | DoLog(1) && (Log() << Verbose(1) << "Saving adjacency list ... " << endl);
|
---|
[35b698] | 1095 | if (BondFile.good()) {
|
---|
[1f1b23] | 1096 | BondFile << "m\tn" << endl;
|
---|
| 1097 | ActOnAllAtoms(&atom::OutputBonds, &BondFile);
|
---|
| 1098 | BondFile.close();
|
---|
[acf800] | 1099 | DoLog(1) && (Log() << Verbose(1) << "\t... done." << endl);
|
---|
[1f1b23] | 1100 | } else {
|
---|
[35b698] | 1101 | DoLog(1) && (Log() << Verbose(1) << "\t... failed to open file " << line << "." << endl);
|
---|
[1f1b23] | 1102 | status = false;
|
---|
| 1103 | }
|
---|
| 1104 |
|
---|
| 1105 | return status;
|
---|
| 1106 | }
|
---|
| 1107 | ;
|
---|
| 1108 |
|
---|
[35b698] | 1109 | bool CheckAdjacencyFileAgainstMolecule_Init(std::string &path, ifstream &File, int *&CurrentBonds)
|
---|
[ba4170] | 1110 | {
|
---|
[35b698] | 1111 | string filename;
|
---|
| 1112 | filename = path + ADJACENCYFILE;
|
---|
| 1113 | File.open(filename.c_str(), ios::out);
|
---|
[0de7e8] | 1114 | DoLog(1) && (Log() << Verbose(1) << "Looking at bond structure stored in adjacency file and comparing to present one ... " << endl);
|
---|
[35b698] | 1115 | if (File.fail())
|
---|
[ba4170] | 1116 | return false;
|
---|
| 1117 |
|
---|
| 1118 | // allocate storage structure
|
---|
[920c70] | 1119 | CurrentBonds = new int[8]; // contains parsed bonds of current atom
|
---|
| 1120 | for(int i=0;i<8;i++)
|
---|
| 1121 | CurrentBonds[i] = 0;
|
---|
[ba4170] | 1122 | return true;
|
---|
[9eefda] | 1123 | }
|
---|
| 1124 | ;
|
---|
[ba4170] | 1125 |
|
---|
[e138de] | 1126 | void CheckAdjacencyFileAgainstMolecule_Finalize(ifstream &File, int *&CurrentBonds)
|
---|
[ba4170] | 1127 | {
|
---|
| 1128 | File.close();
|
---|
| 1129 | File.clear();
|
---|
[920c70] | 1130 | delete[](CurrentBonds);
|
---|
[9eefda] | 1131 | }
|
---|
| 1132 | ;
|
---|
[ba4170] | 1133 |
|
---|
[e138de] | 1134 | void CheckAdjacencyFileAgainstMolecule_CompareBonds(bool &status, int &NonMatchNumber, atom *&Walker, size_t &CurrentBondsOfAtom, int AtomNr, int *&CurrentBonds, atom **ListOfAtoms)
|
---|
[ba4170] | 1135 | {
|
---|
| 1136 | size_t j = 0;
|
---|
| 1137 | int id = -1;
|
---|
| 1138 |
|
---|
[e138de] | 1139 | //Log() << Verbose(2) << "Walker is " << *Walker << ", bond partners: ";
|
---|
[ba4170] | 1140 | if (CurrentBondsOfAtom == Walker->ListOfBonds.size()) {
|
---|
| 1141 | for (BondList::const_iterator Runner = Walker->ListOfBonds.begin(); Runner != Walker->ListOfBonds.end(); (++Runner)) {
|
---|
| 1142 | id = (*Runner)->GetOtherAtom(Walker)->nr;
|
---|
| 1143 | j = 0;
|
---|
[9eefda] | 1144 | for (; (j < CurrentBondsOfAtom) && (CurrentBonds[j++] != id);)
|
---|
[ba4170] | 1145 | ; // check against all parsed bonds
|
---|
[9eefda] | 1146 | if (CurrentBonds[j - 1] != id) { // no match ? Then mark in ListOfAtoms
|
---|
[ba4170] | 1147 | ListOfAtoms[AtomNr] = NULL;
|
---|
| 1148 | NonMatchNumber++;
|
---|
| 1149 | status = false;
|
---|
[0de7e8] | 1150 | DoeLog(2) && (eLog() << Verbose(2) << id << " can not be found in list." << endl);
|
---|
[ba4170] | 1151 | } else {
|
---|
[0de7e8] | 1152 | //Log() << Verbose(0) << "[" << id << "]\t";
|
---|
[ba4170] | 1153 | }
|
---|
| 1154 | }
|
---|
[e138de] | 1155 | //Log() << Verbose(0) << endl;
|
---|
[ba4170] | 1156 | } else {
|
---|
[a67d19] | 1157 | DoLog(0) && (Log() << Verbose(0) << "Number of bonds for Atom " << *Walker << " does not match, parsed " << CurrentBondsOfAtom << " against " << Walker->ListOfBonds.size() << "." << endl);
|
---|
[ba4170] | 1158 | status = false;
|
---|
| 1159 | }
|
---|
[9eefda] | 1160 | }
|
---|
| 1161 | ;
|
---|
[ba4170] | 1162 |
|
---|
[cee0b57] | 1163 | /** Checks contents of adjacency file against bond structure in structure molecule.
|
---|
| 1164 | * \param *out output stream for debugging
|
---|
| 1165 | * \param *path path to file
|
---|
| 1166 | * \param **ListOfAtoms allocated (molecule::AtomCount) and filled lookup table for ids (Atom::nr) to *Atom
|
---|
| 1167 | * \return true - structure is equal, false - not equivalence
|
---|
| 1168 | */
|
---|
[35b698] | 1169 | bool molecule::CheckAdjacencyFileAgainstMolecule(std::string &path, atom **ListOfAtoms)
|
---|
[cee0b57] | 1170 | {
|
---|
| 1171 | ifstream File;
|
---|
| 1172 | bool status = true;
|
---|
[266237] | 1173 | atom *Walker = NULL;
|
---|
[ba4170] | 1174 | int *CurrentBonds = NULL;
|
---|
[9eefda] | 1175 | int NonMatchNumber = 0; // will number of atoms with differing bond structure
|
---|
[ba4170] | 1176 | size_t CurrentBondsOfAtom = -1;
|
---|
[0de7e8] | 1177 | const int AtomCount = getAtomCount();
|
---|
[cee0b57] | 1178 |
|
---|
[e138de] | 1179 | if (!CheckAdjacencyFileAgainstMolecule_Init(path, File, CurrentBonds)) {
|
---|
[a67d19] | 1180 | DoLog(1) && (Log() << Verbose(1) << "Adjacency file not found." << endl);
|
---|
[ba4170] | 1181 | return true;
|
---|
| 1182 | }
|
---|
| 1183 |
|
---|
[920c70] | 1184 | char buffer[MAXSTRINGSIZE];
|
---|
[ba4170] | 1185 | // Parse the file line by line and count the bonds
|
---|
| 1186 | while (!File.eof()) {
|
---|
| 1187 | File.getline(buffer, MAXSTRINGSIZE);
|
---|
| 1188 | stringstream line;
|
---|
| 1189 | line.str(buffer);
|
---|
| 1190 | int AtomNr = -1;
|
---|
| 1191 | line >> AtomNr;
|
---|
| 1192 | CurrentBondsOfAtom = -1; // we count one too far due to line end
|
---|
| 1193 | // parse into structure
|
---|
[0de7e8] | 1194 | if ((AtomNr >= 0) && (AtomNr < AtomCount)) {
|
---|
[ba4170] | 1195 | Walker = ListOfAtoms[AtomNr];
|
---|
| 1196 | while (!line.eof())
|
---|
[9eefda] | 1197 | line >> CurrentBonds[++CurrentBondsOfAtom];
|
---|
[ba4170] | 1198 | // compare against present bonds
|
---|
[e138de] | 1199 | CheckAdjacencyFileAgainstMolecule_CompareBonds(status, NonMatchNumber, Walker, CurrentBondsOfAtom, AtomNr, CurrentBonds, ListOfAtoms);
|
---|
[0de7e8] | 1200 | } else {
|
---|
| 1201 | if (AtomNr != -1)
|
---|
| 1202 | DoeLog(2) && (eLog() << Verbose(2) << AtomNr << " is not valid in the range of ids [" << 0 << "," << AtomCount << ")." << endl);
|
---|
[ba4170] | 1203 | }
|
---|
[cee0b57] | 1204 | }
|
---|
[e138de] | 1205 | CheckAdjacencyFileAgainstMolecule_Finalize(File, CurrentBonds);
|
---|
[cee0b57] | 1206 |
|
---|
[ba4170] | 1207 | if (status) { // if equal we parse the KeySetFile
|
---|
[a67d19] | 1208 | DoLog(1) && (Log() << Verbose(1) << "done: Equal." << endl);
|
---|
[ba4170] | 1209 | } else
|
---|
[a67d19] | 1210 | DoLog(1) && (Log() << Verbose(1) << "done: Not equal by " << NonMatchNumber << " atoms." << endl);
|
---|
[cee0b57] | 1211 | return status;
|
---|
[9eefda] | 1212 | }
|
---|
| 1213 | ;
|
---|
[cee0b57] | 1214 |
|
---|
| 1215 | /** Picks from a global stack with all back edges the ones in the fragment.
|
---|
| 1216 | * \param *out output stream for debugging
|
---|
| 1217 | * \param **ListOfLocalAtoms array of father atom::nr to local atom::nr (reverse of atom::father)
|
---|
| 1218 | * \param *ReferenceStack stack with all the back egdes
|
---|
| 1219 | * \param *LocalStack stack to be filled
|
---|
| 1220 | * \return true - everything ok, false - ReferenceStack was empty
|
---|
| 1221 | */
|
---|
[e138de] | 1222 | bool molecule::PickLocalBackEdges(atom **ListOfLocalAtoms, class StackClass<bond *> *&ReferenceStack, class StackClass<bond *> *&LocalStack) const
|
---|
[cee0b57] | 1223 | {
|
---|
| 1224 | bool status = true;
|
---|
| 1225 | if (ReferenceStack->IsEmpty()) {
|
---|
[a67d19] | 1226 | DoLog(1) && (Log() << Verbose(1) << "ReferenceStack is empty!" << endl);
|
---|
[cee0b57] | 1227 | return false;
|
---|
| 1228 | }
|
---|
| 1229 | bond *Binder = ReferenceStack->PopFirst();
|
---|
[9eefda] | 1230 | bond *FirstBond = Binder; // mark the first bond, so that we don't loop through the stack indefinitely
|
---|
[cee0b57] | 1231 | atom *Walker = NULL, *OtherAtom = NULL;
|
---|
| 1232 | ReferenceStack->Push(Binder);
|
---|
| 1233 |
|
---|
[9eefda] | 1234 | do { // go through all bonds and push local ones
|
---|
| 1235 | Walker = ListOfLocalAtoms[Binder->leftatom->nr]; // get one atom in the reference molecule
|
---|
[cee0b57] | 1236 | if (Walker != NULL) // if this Walker exists in the subgraph ...
|
---|
[266237] | 1237 | for (BondList::const_iterator Runner = Walker->ListOfBonds.begin(); Runner != Walker->ListOfBonds.end(); (++Runner)) {
|
---|
| 1238 | OtherAtom = (*Runner)->GetOtherAtom(Walker);
|
---|
| 1239 | if (OtherAtom == ListOfLocalAtoms[(*Runner)->rightatom->nr]) { // found the bond
|
---|
| 1240 | LocalStack->Push((*Runner));
|
---|
[a67d19] | 1241 | DoLog(3) && (Log() << Verbose(3) << "Found local edge " << *(*Runner) << "." << endl);
|
---|
[cee0b57] | 1242 | break;
|
---|
| 1243 | }
|
---|
| 1244 | }
|
---|
[9eefda] | 1245 | Binder = ReferenceStack->PopFirst(); // loop the stack for next item
|
---|
[a67d19] | 1246 | DoLog(3) && (Log() << Verbose(3) << "Current candidate edge " << Binder << "." << endl);
|
---|
[cee0b57] | 1247 | ReferenceStack->Push(Binder);
|
---|
| 1248 | } while (FirstBond != Binder);
|
---|
| 1249 |
|
---|
| 1250 | return status;
|
---|
[9eefda] | 1251 | }
|
---|
| 1252 | ;
|
---|
[ce7cc5] | 1253 |
|
---|
| 1254 | void BreadthFirstSearchAdd_Init(struct BFSAccounting &BFS, atom *&Root, int AtomCount, int BondOrder, atom **AddedAtomList = NULL)
|
---|
| 1255 | {
|
---|
| 1256 | BFS.AtomCount = AtomCount;
|
---|
| 1257 | BFS.BondOrder = BondOrder;
|
---|
[920c70] | 1258 | BFS.PredecessorList = new atom*[AtomCount];
|
---|
| 1259 | BFS.ShortestPathList = new int[AtomCount];
|
---|
| 1260 | BFS.ColorList = new enum Shading[AtomCount];
|
---|
[9eefda] | 1261 | BFS.BFSStack = new StackClass<atom *> (AtomCount);
|
---|
[ce7cc5] | 1262 |
|
---|
| 1263 | BFS.Root = Root;
|
---|
[9eefda] | 1264 | BFS.BFSStack->ClearStack();
|
---|
| 1265 | BFS.BFSStack->Push(Root);
|
---|
[ce7cc5] | 1266 |
|
---|
| 1267 | // initialise each vertex as white with no predecessor, empty queue, color Root lightgray
|
---|
[9eefda] | 1268 | for (int i = AtomCount; i--;) {
|
---|
[920c70] | 1269 | BFS.PredecessorList[i] = NULL;
|
---|
[ce7cc5] | 1270 | BFS.ShortestPathList[i] = -1;
|
---|
| 1271 | if ((AddedAtomList != NULL) && (AddedAtomList[i] != NULL)) // mark already present atoms (i.e. Root and maybe others) as visited
|
---|
| 1272 | BFS.ColorList[i] = lightgray;
|
---|
| 1273 | else
|
---|
| 1274 | BFS.ColorList[i] = white;
|
---|
| 1275 | }
|
---|
[920c70] | 1276 | //BFS.ShortestPathList[Root->nr] = 0; // done by Calloc
|
---|
[9eefda] | 1277 | }
|
---|
| 1278 | ;
|
---|
[ce7cc5] | 1279 |
|
---|
| 1280 | void BreadthFirstSearchAdd_Free(struct BFSAccounting &BFS)
|
---|
| 1281 | {
|
---|
[920c70] | 1282 | delete[](BFS.PredecessorList);
|
---|
| 1283 | delete[](BFS.ShortestPathList);
|
---|
| 1284 | delete[](BFS.ColorList);
|
---|
[9eefda] | 1285 | delete (BFS.BFSStack);
|
---|
[ce7cc5] | 1286 | BFS.AtomCount = 0;
|
---|
[9eefda] | 1287 | }
|
---|
| 1288 | ;
|
---|
[ce7cc5] | 1289 |
|
---|
[e138de] | 1290 | void BreadthFirstSearchAdd_UnvisitedNode(molecule *Mol, struct BFSAccounting &BFS, atom *&Walker, atom *&OtherAtom, bond *&Binder, bond *&Bond, atom **&AddedAtomList, bond **&AddedBondList, bool IsAngstroem)
|
---|
[ce7cc5] | 1291 | {
|
---|
| 1292 | if (Binder != Bond) // let other atom white if it's via Root bond. In case it's cyclic it has to be reached again (yet Root is from OtherAtom already black, thus no problem)
|
---|
| 1293 | BFS.ColorList[OtherAtom->nr] = lightgray;
|
---|
[9eefda] | 1294 | BFS.PredecessorList[OtherAtom->nr] = Walker; // Walker is the predecessor
|
---|
| 1295 | BFS.ShortestPathList[OtherAtom->nr] = BFS.ShortestPathList[Walker->nr] + 1;
|
---|
[68f03d] | 1296 | DoLog(2) && (Log() << Verbose(2) << "Coloring OtherAtom " << OtherAtom->getName() << " " << ((BFS.ColorList[OtherAtom->nr] == white) ? "white" : "lightgray") << ", its predecessor is " << Walker->getName() << " and its Shortest Path is " << BFS.ShortestPathList[OtherAtom->nr] << " egde(s) long." << endl);
|
---|
[9eefda] | 1297 | if ((((BFS.ShortestPathList[OtherAtom->nr] < BFS.BondOrder) && (Binder != Bond)))) { // Check for maximum distance
|
---|
[a67d19] | 1298 | DoLog(3) && (Log() << Verbose(3));
|
---|
[ce7cc5] | 1299 | if (AddedAtomList[OtherAtom->nr] == NULL) { // add if it's not been so far
|
---|
| 1300 | AddedAtomList[OtherAtom->nr] = Mol->AddCopyAtom(OtherAtom);
|
---|
[68f03d] | 1301 | DoLog(0) && (Log() << Verbose(0) << "Added OtherAtom " << OtherAtom->getName());
|
---|
[ce7cc5] | 1302 | AddedBondList[Binder->nr] = Mol->CopyBond(AddedAtomList[Walker->nr], AddedAtomList[OtherAtom->nr], Binder);
|
---|
[a67d19] | 1303 | DoLog(0) && (Log() << Verbose(0) << " and bond " << *(AddedBondList[Binder->nr]) << ", ");
|
---|
[9eefda] | 1304 | } else { // this code should actually never come into play (all white atoms are not yet present in BondMolecule, that's why they are white in the first place)
|
---|
[68f03d] | 1305 | DoLog(0) && (Log() << Verbose(0) << "Not adding OtherAtom " << OtherAtom->getName());
|
---|
[ce7cc5] | 1306 | if (AddedBondList[Binder->nr] == NULL) {
|
---|
| 1307 | AddedBondList[Binder->nr] = Mol->CopyBond(AddedAtomList[Walker->nr], AddedAtomList[OtherAtom->nr], Binder);
|
---|
[a67d19] | 1308 | DoLog(0) && (Log() << Verbose(0) << ", added Bond " << *(AddedBondList[Binder->nr]));
|
---|
[ce7cc5] | 1309 | } else
|
---|
[a67d19] | 1310 | DoLog(0) && (Log() << Verbose(0) << ", not added Bond ");
|
---|
[ce7cc5] | 1311 | }
|
---|
[a67d19] | 1312 | DoLog(0) && (Log() << Verbose(0) << ", putting OtherAtom into queue." << endl);
|
---|
[9eefda] | 1313 | BFS.BFSStack->Push(OtherAtom);
|
---|
[ce7cc5] | 1314 | } else { // out of bond order, then replace
|
---|
| 1315 | if ((AddedAtomList[OtherAtom->nr] == NULL) && (Binder->Cyclic))
|
---|
| 1316 | BFS.ColorList[OtherAtom->nr] = white; // unmark if it has not been queued/added, to make it available via its other bonds (cyclic)
|
---|
| 1317 | if (Binder == Bond)
|
---|
[a67d19] | 1318 | DoLog(3) && (Log() << Verbose(3) << "Not Queueing, is the Root bond");
|
---|
[ce7cc5] | 1319 | else if (BFS.ShortestPathList[OtherAtom->nr] >= BFS.BondOrder)
|
---|
[a67d19] | 1320 | DoLog(3) && (Log() << Verbose(3) << "Not Queueing, is out of Bond Count of " << BFS.BondOrder);
|
---|
[ce7cc5] | 1321 | if (!Binder->Cyclic)
|
---|
[a67d19] | 1322 | DoLog(0) && (Log() << Verbose(0) << ", is not part of a cyclic bond, saturating bond with Hydrogen." << endl);
|
---|
[ce7cc5] | 1323 | if (AddedBondList[Binder->nr] == NULL) {
|
---|
| 1324 | if ((AddedAtomList[OtherAtom->nr] != NULL)) { // .. whether we add or saturate
|
---|
| 1325 | AddedBondList[Binder->nr] = Mol->CopyBond(AddedAtomList[Walker->nr], AddedAtomList[OtherAtom->nr], Binder);
|
---|
| 1326 | } else {
|
---|
[9eefda] | 1327 | #ifdef ADDHYDROGEN
|
---|
[e138de] | 1328 | if (!Mol->AddHydrogenReplacementAtom(Binder, AddedAtomList[Walker->nr], Walker, OtherAtom, IsAngstroem))
|
---|
[9eefda] | 1329 | exit(1);
|
---|
| 1330 | #endif
|
---|
[ce7cc5] | 1331 | }
|
---|
| 1332 | }
|
---|
| 1333 | }
|
---|
[9eefda] | 1334 | }
|
---|
| 1335 | ;
|
---|
[ce7cc5] | 1336 |
|
---|
[e138de] | 1337 | void BreadthFirstSearchAdd_VisitedNode(molecule *Mol, struct BFSAccounting &BFS, atom *&Walker, atom *&OtherAtom, bond *&Binder, bond *&Bond, atom **&AddedAtomList, bond **&AddedBondList, bool IsAngstroem)
|
---|
[ce7cc5] | 1338 | {
|
---|
[a67d19] | 1339 | DoLog(3) && (Log() << Verbose(3) << "Not Adding, has already been visited." << endl);
|
---|
[ce7cc5] | 1340 | // This has to be a cyclic bond, check whether it's present ...
|
---|
| 1341 | if (AddedBondList[Binder->nr] == NULL) {
|
---|
[9eefda] | 1342 | if ((Binder != Bond) && (Binder->Cyclic) && (((BFS.ShortestPathList[Walker->nr] + 1) < BFS.BondOrder))) {
|
---|
[ce7cc5] | 1343 | AddedBondList[Binder->nr] = Mol->CopyBond(AddedAtomList[Walker->nr], AddedAtomList[OtherAtom->nr], Binder);
|
---|
| 1344 | } else { // if it's root bond it has to broken (otherwise we would not create the fragments)
|
---|
[9eefda] | 1345 | #ifdef ADDHYDROGEN
|
---|
[e138de] | 1346 | if(!Mol->AddHydrogenReplacementAtom(Binder, AddedAtomList[Walker->nr], Walker, OtherAtom, IsAngstroem))
|
---|
[9eefda] | 1347 | exit(1);
|
---|
| 1348 | #endif
|
---|
[ce7cc5] | 1349 | }
|
---|
| 1350 | }
|
---|
[9eefda] | 1351 | }
|
---|
| 1352 | ;
|
---|
[cee0b57] | 1353 |
|
---|
| 1354 | /** Adds atoms up to \a BondCount distance from \a *Root and notes them down in \a **AddedAtomList.
|
---|
| 1355 | * Gray vertices are always enqueued in an StackClass<atom *> FIFO queue, the rest is usual BFS with adding vertices found was
|
---|
| 1356 | * white and putting into queue.
|
---|
| 1357 | * \param *out output stream for debugging
|
---|
| 1358 | * \param *Mol Molecule class to add atoms to
|
---|
| 1359 | * \param **AddedAtomList list with added atom pointers, index is atom father's number
|
---|
| 1360 | * \param **AddedBondList list with added bond pointers, index is bond father's number
|
---|
| 1361 | * \param *Root root vertex for BFS
|
---|
| 1362 | * \param *Bond bond not to look beyond
|
---|
| 1363 | * \param BondOrder maximum distance for vertices to add
|
---|
| 1364 | * \param IsAngstroem lengths are in angstroem or bohrradii
|
---|
| 1365 | */
|
---|
[e138de] | 1366 | void molecule::BreadthFirstSearchAdd(molecule *Mol, atom **&AddedAtomList, bond **&AddedBondList, atom *Root, bond *Bond, int BondOrder, bool IsAngstroem)
|
---|
[cee0b57] | 1367 | {
|
---|
[ce7cc5] | 1368 | struct BFSAccounting BFS;
|
---|
[cee0b57] | 1369 | atom *Walker = NULL, *OtherAtom = NULL;
|
---|
[ce7cc5] | 1370 | bond *Binder = NULL;
|
---|
[cee0b57] | 1371 |
|
---|
| 1372 | // add Root if not done yet
|
---|
[9eefda] | 1373 | if (AddedAtomList[Root->nr] == NULL) // add Root if not yet present
|
---|
[cee0b57] | 1374 | AddedAtomList[Root->nr] = Mol->AddCopyAtom(Root);
|
---|
| 1375 |
|
---|
[ea7176] | 1376 | BreadthFirstSearchAdd_Init(BFS, Root, BondOrder, getAtomCount(), AddedAtomList);
|
---|
[cee0b57] | 1377 |
|
---|
| 1378 | // and go on ... Queue always contains all lightgray vertices
|
---|
[9eefda] | 1379 | while (!BFS.BFSStack->IsEmpty()) {
|
---|
[cee0b57] | 1380 | // we have to pop the oldest atom from stack. This keeps the atoms on the stack always of the same ShortestPath distance.
|
---|
| 1381 | // e.g. if current atom is 2, push to end of stack are of length 3, but first all of length 2 would be popped. They again
|
---|
| 1382 | // append length of 3 (their neighbours). Thus on stack we have always atoms of a certain length n at bottom of stack and
|
---|
| 1383 | // followed by n+1 till top of stack.
|
---|
[9eefda] | 1384 | Walker = BFS.BFSStack->PopFirst(); // pop oldest added
|
---|
[68f03d] | 1385 | DoLog(1) && (Log() << Verbose(1) << "Current Walker is: " << Walker->getName() << ", and has " << Walker->ListOfBonds.size() << " bonds." << endl);
|
---|
[266237] | 1386 | for (BondList::const_iterator Runner = Walker->ListOfBonds.begin(); Runner != Walker->ListOfBonds.end(); (++Runner)) {
|
---|
| 1387 | if ((*Runner) != NULL) { // don't look at bond equal NULL
|
---|
[ce7cc5] | 1388 | Binder = (*Runner);
|
---|
[266237] | 1389 | OtherAtom = (*Runner)->GetOtherAtom(Walker);
|
---|
[68f03d] | 1390 | DoLog(2) && (Log() << Verbose(2) << "Current OtherAtom is: " << OtherAtom->getName() << " for bond " << *(*Runner) << "." << endl);
|
---|
[ce7cc5] | 1391 | if (BFS.ColorList[OtherAtom->nr] == white) {
|
---|
[e138de] | 1392 | BreadthFirstSearchAdd_UnvisitedNode(Mol, BFS, Walker, OtherAtom, Binder, Bond, AddedAtomList, AddedBondList, IsAngstroem);
|
---|
[cee0b57] | 1393 | } else {
|
---|
[e138de] | 1394 | BreadthFirstSearchAdd_VisitedNode(Mol, BFS, Walker, OtherAtom, Binder, Bond, AddedAtomList, AddedBondList, IsAngstroem);
|
---|
[cee0b57] | 1395 | }
|
---|
| 1396 | }
|
---|
| 1397 | }
|
---|
[ce7cc5] | 1398 | BFS.ColorList[Walker->nr] = black;
|
---|
[68f03d] | 1399 | DoLog(1) && (Log() << Verbose(1) << "Coloring Walker " << Walker->getName() << " black." << endl);
|
---|
[cee0b57] | 1400 | }
|
---|
[ce7cc5] | 1401 | BreadthFirstSearchAdd_Free(BFS);
|
---|
[9eefda] | 1402 | }
|
---|
| 1403 | ;
|
---|
[cee0b57] | 1404 |
|
---|
[266237] | 1405 | /** Adds a bond as a copy to a given one
|
---|
| 1406 | * \param *left leftatom of new bond
|
---|
| 1407 | * \param *right rightatom of new bond
|
---|
| 1408 | * \param *CopyBond rest of fields in bond are copied from this
|
---|
| 1409 | * \return pointer to new bond
|
---|
| 1410 | */
|
---|
| 1411 | bond * molecule::CopyBond(atom *left, atom *right, bond *CopyBond)
|
---|
| 1412 | {
|
---|
| 1413 | bond *Binder = AddBond(left, right, CopyBond->BondDegree);
|
---|
| 1414 | Binder->Cyclic = CopyBond->Cyclic;
|
---|
| 1415 | Binder->Type = CopyBond->Type;
|
---|
| 1416 | return Binder;
|
---|
[9eefda] | 1417 | }
|
---|
| 1418 | ;
|
---|
[266237] | 1419 |
|
---|
[e138de] | 1420 | void BuildInducedSubgraph_Init(atom **&ParentList, int AtomCount)
|
---|
[cee0b57] | 1421 | {
|
---|
| 1422 | // reset parent list
|
---|
[920c70] | 1423 | ParentList = new atom*[AtomCount];
|
---|
| 1424 | for (int i=0;i<AtomCount;i++)
|
---|
| 1425 | ParentList[i] = NULL;
|
---|
[a67d19] | 1426 | DoLog(3) && (Log() << Verbose(3) << "Resetting ParentList." << endl);
|
---|
[9eefda] | 1427 | }
|
---|
| 1428 | ;
|
---|
[cee0b57] | 1429 |
|
---|
[e138de] | 1430 | void BuildInducedSubgraph_FillParentList(const molecule *mol, const molecule *Father, atom **&ParentList)
|
---|
[43587e] | 1431 | {
|
---|
[cee0b57] | 1432 | // fill parent list with sons
|
---|
[a67d19] | 1433 | DoLog(3) && (Log() << Verbose(3) << "Filling Parent List." << endl);
|
---|
[9879f6] | 1434 | for (molecule::const_iterator iter = mol->begin(); iter != mol->end(); ++iter) {
|
---|
| 1435 | ParentList[(*iter)->father->nr] = (*iter);
|
---|
[cee0b57] | 1436 | // Outputting List for debugging
|
---|
[a7b761b] | 1437 | DoLog(4) && (Log() << Verbose(4) << "Son[" << (*iter)->father->nr << "] of " << (*iter)->father << " is " << ParentList[(*iter)->father->nr] << "." << endl);
|
---|
[cee0b57] | 1438 | }
|
---|
[a7b761b] | 1439 | };
|
---|
[43587e] | 1440 |
|
---|
[e138de] | 1441 | void BuildInducedSubgraph_Finalize(atom **&ParentList)
|
---|
[43587e] | 1442 | {
|
---|
[920c70] | 1443 | delete[](ParentList);
|
---|
[9eefda] | 1444 | }
|
---|
| 1445 | ;
|
---|
[43587e] | 1446 |
|
---|
[e138de] | 1447 | bool BuildInducedSubgraph_CreateBondsFromParent(molecule *mol, const molecule *Father, atom **&ParentList)
|
---|
[43587e] | 1448 | {
|
---|
| 1449 | bool status = true;
|
---|
| 1450 | atom *OtherAtom = NULL;
|
---|
[cee0b57] | 1451 | // check each entry of parent list and if ok (one-to-and-onto matching) create bonds
|
---|
[a67d19] | 1452 | DoLog(3) && (Log() << Verbose(3) << "Creating bonds." << endl);
|
---|
[9879f6] | 1453 | for (molecule::const_iterator iter = Father->begin(); iter != Father->end(); ++iter) {
|
---|
| 1454 | if (ParentList[(*iter)->nr] != NULL) {
|
---|
| 1455 | if (ParentList[(*iter)->nr]->father != (*iter)) {
|
---|
[cee0b57] | 1456 | status = false;
|
---|
| 1457 | } else {
|
---|
[9879f6] | 1458 | for (BondList::const_iterator Runner = (*iter)->ListOfBonds.begin(); Runner != (*iter)->ListOfBonds.end(); (++Runner)) {
|
---|
| 1459 | OtherAtom = (*Runner)->GetOtherAtom((*iter));
|
---|
[cee0b57] | 1460 | if (ParentList[OtherAtom->nr] != NULL) { // if otheratom is also a father of an atom on this molecule, create the bond
|
---|
[a7b761b] | 1461 | DoLog(4) && (Log() << Verbose(4) << "Endpoints of Bond " << (*Runner) << " are both present: " << ParentList[(*iter)->nr]->getName() << " and " << ParentList[OtherAtom->nr]->getName() << "." << endl);
|
---|
[9879f6] | 1462 | mol->AddBond(ParentList[(*iter)->nr], ParentList[OtherAtom->nr], (*Runner)->BondDegree);
|
---|
[cee0b57] | 1463 | }
|
---|
| 1464 | }
|
---|
| 1465 | }
|
---|
| 1466 | }
|
---|
| 1467 | }
|
---|
[43587e] | 1468 | return status;
|
---|
[9eefda] | 1469 | }
|
---|
| 1470 | ;
|
---|
[cee0b57] | 1471 |
|
---|
[43587e] | 1472 | /** Adds bond structure to this molecule from \a Father molecule.
|
---|
| 1473 | * This basically causes this molecule to become an induced subgraph of the \a Father, i.e. for every bond in Father
|
---|
| 1474 | * with end points present in this molecule, bond is created in this molecule.
|
---|
| 1475 | * Special care was taken to ensure that this is of complexity O(N), where N is the \a Father's molecule::AtomCount.
|
---|
| 1476 | * \param *out output stream for debugging
|
---|
| 1477 | * \param *Father father molecule
|
---|
| 1478 | * \return true - is induced subgraph, false - there are atoms with fathers not in \a Father
|
---|
| 1479 | * \todo not checked, not fully working probably
|
---|
| 1480 | */
|
---|
[e138de] | 1481 | bool molecule::BuildInducedSubgraph(const molecule *Father)
|
---|
[43587e] | 1482 | {
|
---|
| 1483 | bool status = true;
|
---|
| 1484 | atom **ParentList = NULL;
|
---|
[a67d19] | 1485 | DoLog(2) && (Log() << Verbose(2) << "Begin of BuildInducedSubgraph." << endl);
|
---|
[ea7176] | 1486 | BuildInducedSubgraph_Init(ParentList, Father->getAtomCount());
|
---|
[e138de] | 1487 | BuildInducedSubgraph_FillParentList(this, Father, ParentList);
|
---|
| 1488 | status = BuildInducedSubgraph_CreateBondsFromParent(this, Father, ParentList);
|
---|
| 1489 | BuildInducedSubgraph_Finalize(ParentList);
|
---|
[a67d19] | 1490 | DoLog(2) && (Log() << Verbose(2) << "End of BuildInducedSubgraph." << endl);
|
---|
[cee0b57] | 1491 | return status;
|
---|
[9eefda] | 1492 | }
|
---|
| 1493 | ;
|
---|
[cee0b57] | 1494 |
|
---|
| 1495 | /** For a given keyset \a *Fragment, checks whether it is connected in the current molecule.
|
---|
| 1496 | * \param *out output stream for debugging
|
---|
| 1497 | * \param *Fragment Keyset of fragment's vertices
|
---|
| 1498 | * \return true - connected, false - disconnected
|
---|
| 1499 | * \note this is O(n^2) for it's just a bug checker not meant for permanent use!
|
---|
| 1500 | */
|
---|
[e138de] | 1501 | bool molecule::CheckForConnectedSubgraph(KeySet *Fragment)
|
---|
[cee0b57] | 1502 | {
|
---|
| 1503 | atom *Walker = NULL, *Walker2 = NULL;
|
---|
| 1504 | bool BondStatus = false;
|
---|
| 1505 | int size;
|
---|
| 1506 |
|
---|
[a67d19] | 1507 | DoLog(1) && (Log() << Verbose(1) << "Begin of CheckForConnectedSubgraph" << endl);
|
---|
| 1508 | DoLog(2) && (Log() << Verbose(2) << "Disconnected atom: ");
|
---|
[cee0b57] | 1509 |
|
---|
| 1510 | // count number of atoms in graph
|
---|
| 1511 | size = 0;
|
---|
[9eefda] | 1512 | for (KeySet::iterator runner = Fragment->begin(); runner != Fragment->end(); runner++)
|
---|
[cee0b57] | 1513 | size++;
|
---|
| 1514 | if (size > 1)
|
---|
[9eefda] | 1515 | for (KeySet::iterator runner = Fragment->begin(); runner != Fragment->end(); runner++) {
|
---|
[cee0b57] | 1516 | Walker = FindAtom(*runner);
|
---|
| 1517 | BondStatus = false;
|
---|
[9eefda] | 1518 | for (KeySet::iterator runners = Fragment->begin(); runners != Fragment->end(); runners++) {
|
---|
[cee0b57] | 1519 | Walker2 = FindAtom(*runners);
|
---|
[266237] | 1520 | for (BondList::const_iterator Runner = Walker->ListOfBonds.begin(); Runner != Walker->ListOfBonds.end(); (++Runner)) {
|
---|
| 1521 | if ((*Runner)->GetOtherAtom(Walker) == Walker2) {
|
---|
[cee0b57] | 1522 | BondStatus = true;
|
---|
| 1523 | break;
|
---|
| 1524 | }
|
---|
| 1525 | if (BondStatus)
|
---|
| 1526 | break;
|
---|
| 1527 | }
|
---|
| 1528 | }
|
---|
| 1529 | if (!BondStatus) {
|
---|
[a67d19] | 1530 | DoLog(0) && (Log() << Verbose(0) << (*Walker) << endl);
|
---|
[cee0b57] | 1531 | return false;
|
---|
| 1532 | }
|
---|
| 1533 | }
|
---|
| 1534 | else {
|
---|
[a67d19] | 1535 | DoLog(0) && (Log() << Verbose(0) << "none." << endl);
|
---|
[cee0b57] | 1536 | return true;
|
---|
| 1537 | }
|
---|
[a67d19] | 1538 | DoLog(0) && (Log() << Verbose(0) << "none." << endl);
|
---|
[cee0b57] | 1539 |
|
---|
[a67d19] | 1540 | DoLog(1) && (Log() << Verbose(1) << "End of CheckForConnectedSubgraph" << endl);
|
---|
[cee0b57] | 1541 |
|
---|
| 1542 | return true;
|
---|
| 1543 | }
|
---|