source: src/molecule_graph.cpp@ dc1d9e

Action_Thermostats Add_AtomRandomPerturbation Add_FitFragmentPartialChargesAction Add_RotateAroundBondAction Add_SelectAtomByNameAction Added_ParseSaveFragmentResults AddingActions_SaveParseParticleParameters Adding_Graph_to_ChangeBondActions Adding_MD_integration_tests Adding_ParticleName_to_Atom Adding_StructOpt_integration_tests AtomFragments Automaking_mpqc_open AutomationFragmentation_failures Candidate_v1.5.4 Candidate_v1.6.0 Candidate_v1.6.1 Candidate_v1.7.0 ChangeBugEmailaddress ChangingTestPorts ChemicalSpaceEvaluator CombiningParticlePotentialParsing Combining_Subpackages Debian_Package_split Debian_package_split_molecuildergui_only Disabling_MemDebug Docu_Python_wait EmpiricalPotential_contain_HomologyGraph EmpiricalPotential_contain_HomologyGraph_documentation Enable_parallel_make_install Enhance_userguide Enhanced_StructuralOptimization Enhanced_StructuralOptimization_continued Example_ManyWaysToTranslateAtom Exclude_Hydrogens_annealWithBondGraph FitPartialCharges_GlobalError Fix_BoundInBox_CenterInBox_MoleculeActions Fix_ChargeSampling_PBC Fix_ChronosMutex Fix_FitPartialCharges Fix_FitPotential_needs_atomicnumbers Fix_ForceAnnealing Fix_IndependentFragmentGrids Fix_ParseParticles Fix_ParseParticles_split_forward_backward_Actions Fix_PopActions Fix_QtFragmentList_sorted_selection Fix_Restrictedkeyset_FragmentMolecule Fix_StatusMsg Fix_StepWorldTime_single_argument Fix_Verbose_Codepatterns Fix_fitting_potentials Fixes ForceAnnealing_goodresults ForceAnnealing_oldresults ForceAnnealing_tocheck ForceAnnealing_with_BondGraph ForceAnnealing_with_BondGraph_continued ForceAnnealing_with_BondGraph_continued_betteresults ForceAnnealing_with_BondGraph_contraction-expansion FragmentAction_writes_AtomFragments FragmentMolecule_checks_bonddegrees GeometryObjects Gui_Fixes Gui_displays_atomic_force_velocity ImplicitCharges IndependentFragmentGrids IndependentFragmentGrids_IndividualZeroInstances IndependentFragmentGrids_IntegrationTest IndependentFragmentGrids_Sole_NN_Calculation JobMarket_RobustOnKillsSegFaults JobMarket_StableWorkerPool JobMarket_unresolvable_hostname_fix MoreRobust_FragmentAutomation ODR_violation_mpqc_open PartialCharges_OrthogonalSummation PdbParser_setsAtomName PythonUI_with_named_parameters QtGui_reactivate_TimeChanged_changes Recreated_GuiChecks Rewrite_FitPartialCharges RotateToPrincipalAxisSystem_UndoRedo SaturateAtoms_findBestMatching SaturateAtoms_singleDegree StoppableMakroAction Subpackage_CodePatterns Subpackage_JobMarket Subpackage_LinearAlgebra Subpackage_levmar Subpackage_mpqc_open Subpackage_vmg Switchable_LogView ThirdParty_MPQC_rebuilt_buildsystem TrajectoryDependenant_MaxOrder TremoloParser_IncreasedPrecision TremoloParser_MultipleTimesteps TremoloParser_setsAtomName Ubuntu_1604_changes stable
Last change on this file since dc1d9e was af2c424, checked in by Frederik Heber <heber@…>, 15 years ago

LinkedCell constructor rewritten.

  • had to introduce getValue(iterator) to: molecule, tesselation, LinkedCell::LinkedNodes
  • LinkedCell::LinkedNodes is not a typedef anymore
  • new class LinkedCell::LinkedNodes derived from stl::list<TesselPoint *> to add getValue(iterator).
  • LinkedCell constructors changed:
    • use template for all classes that have begin(), end() and ... sigh ... getValue()
    • Argh! STL containers do all have begin() and end() but no consistent operator* (maps return pair<> ...)
    • specialized version for PointCloud derivatives
    • various functions had to be changed due to changed signature of LinkedCell constructor
  • Property mode set to 100644
File size: 66.2 KB
RevLine 
[bcf653]1/*
2 * Project: MoleCuilder
3 * Description: creates and alters molecular systems
4 * Copyright (C) 2010 University of Bonn. All rights reserved.
5 * Please see the LICENSE file or "Copyright notice" in builder.cpp for details.
6 */
7
[cee0b57]8/*
9 * molecule_graph.cpp
10 *
11 * Created on: Oct 5, 2009
12 * Author: heber
13 */
14
[bf3817]15// include config.h
[aafd77]16#ifdef HAVE_CONFIG_H
17#include <config.h>
18#endif
19
[112b09]20#include "Helpers/MemDebug.hpp"
21
[f66195]22#include "atom.hpp"
23#include "bond.hpp"
[b70721]24#include "bondgraph.hpp"
[cee0b57]25#include "config.hpp"
[35b698]26#include "defs.hpp"
[f66195]27#include "element.hpp"
[952f38]28#include "Helpers/helpers.hpp"
29#include "Helpers/Info.hpp"
[b8b75d]30#include "linkedcell.hpp"
[f66195]31#include "lists.hpp"
[952f38]32#include "Helpers/Verbose.hpp"
33#include "Helpers/Log.hpp"
[cee0b57]34#include "molecule.hpp"
[b34306]35#include "World.hpp"
[0a4f7f]36#include "Helpers/fast_functions.hpp"
[f2bb0f]37#include "Helpers/Assert.hpp"
[57f243]38#include "LinearAlgebra/Matrix.hpp"
[84c494]39#include "Box.hpp"
[36166d]40#include "stackclass.hpp"
[cee0b57]41
[9eefda]42struct BFSAccounting
43{
44 atom **PredecessorList;
45 int *ShortestPathList;
46 enum Shading *ColorList;
47 class StackClass<atom *> *BFSStack;
48 class StackClass<atom *> *TouchedStack;
49 int AtomCount;
50 int BondOrder;
51 atom *Root;
52 bool BackStepping;
53 int CurrentGraphNr;
54 int ComponentNr;
55};
[cee0b57]56
[9eefda]57/** Accounting data for Depth First Search.
58 */
59struct DFSAccounting
60{
61 class StackClass<atom *> *AtomStack;
62 class StackClass<bond *> *BackEdgeStack;
63 int CurrentGraphNr;
64 int ComponentNumber;
65 atom *Root;
66 bool BackStepping;
67};
68
69/************************************* Functions for class molecule *********************************/
[cee0b57]70
71/** Creates an adjacency list of the molecule.
72 * We obtain an outside file with the indices of atoms which are bondmembers.
73 */
[e138de]74void molecule::CreateAdjacencyListFromDbondFile(ifstream *input)
[cee0b57]75{
[c68c90]76 Info FunctionInfo(__func__);
[cee0b57]77 // 1 We will parse bonds out of the dbond file created by tremolo.
[44a59b]78 int atom1, atom2;
79 atom *Walker, *OtherWalker;
[c68c90]80 char line[MAXSTRINGSIZE];
[44a59b]81
[c68c90]82 if (input->fail()) {
83 DoeLog(0) && (eLog() << Verbose(0) << "Opening of bond file failed \n");
84 performCriticalExit();
[44a59b]85 };
[bd6bfa]86 doCountAtoms();
[44a59b]87
[c68c90]88 // skip header
89 input->getline(line,MAXSTRINGSIZE);
90 DoLog(1) && (Log() << Verbose(1) << "Scanning file ... \n");
[44a59b]91 while (!input->eof()) // Check whether we read everything already
92 {
[c68c90]93 input->getline(line,MAXSTRINGSIZE);
94 stringstream zeile(line);
95 zeile >> atom1;
96 zeile >> atom2;
[44a59b]97
[c68c90]98 DoLog(2) && (Log() << Verbose(2) << "Looking for atoms " << atom1 << " and " << atom2 << "." << endl);
[9eefda]99 if (atom2 < atom1) //Sort indices of atoms in order
[44a59b]100 flip(atom1, atom2);
[9eefda]101 Walker = FindAtom(atom1);
[05a97c]102 ASSERT(Walker,"Could not find an atom with the ID given in dbond file");
[9eefda]103 OtherWalker = FindAtom(atom2);
[05a97c]104 ASSERT(OtherWalker,"Could not find an atom with the ID given in dbond file");
[44a59b]105 AddBond(Walker, OtherWalker); //Add the bond between the two atoms with respective indices.
106 }
[9eefda]107}
108;
[cee0b57]109
110/** Creates an adjacency list of the molecule.
111 * Generally, we use the CSD approach to bond recognition, that is the the distance
112 * between two atoms A and B must be within [Rcov(A)+Rcov(B)-t,Rcov(A)+Rcov(B)+t] with
113 * a threshold t = 0.4 Angstroem.
114 * To make it O(N log N) the function uses the linked-cell technique as follows:
115 * The procedure is step-wise:
116 * -# Remove every bond in list
117 * -# Count the atoms in the molecule with CountAtoms()
118 * -# partition cell into smaller linked cells of size \a bonddistance
119 * -# put each atom into its corresponding cell
120 * -# go through every cell, check the atoms therein against all possible bond partners in the 27 adjacent cells, add bond if true
121 * -# correct the bond degree iteratively (single->double->triple bond)
122 * -# finally print the bond list to \a *out if desired
123 * \param *out out stream for printing the matrix, NULL if no output
124 * \param bonddistance length of linked cells (i.e. maximum minimal length checked)
125 * \param IsAngstroem whether coordinate system is gauged to Angstroem or Bohr radii
[b70721]126 * \param *minmaxdistance function to give upper and lower bound on whether particle is bonded to some other
127 * \param *BG BondGraph with the member function above or NULL, if just standard covalent should be used.
[cee0b57]128 */
[e138de]129void molecule::CreateAdjacencyList(double bonddistance, bool IsAngstroem, void (BondGraph::*minmaxdistance)(BondedParticle * const , BondedParticle * const , double &, double &, bool), BondGraph *BG)
[cee0b57]130{
[b8b75d]131 atom *Walker = NULL;
132 atom *OtherWalker = NULL;
133 int n[NDIM];
[b70721]134 double MinDistance, MaxDistance;
[b8b75d]135 LinkedCell *LC = NULL;
[b70721]136 bool free_BG = false;
[014475]137 Box &domain = World::getInstance().getDomain();
[b70721]138
139 if (BG == NULL) {
140 BG = new BondGraph(IsAngstroem);
141 free_BG = true;
142 }
[cee0b57]143
144 BondDistance = bonddistance; // * ((IsAngstroem) ? 1. : 1./AtomicLengthToAngstroem);
[a67d19]145 DoLog(0) && (Log() << Verbose(0) << "Begin of CreateAdjacencyList." << endl);
[cee0b57]146 // remove every bond from the list
[e08c46]147 for(molecule::iterator AtomRunner = begin(); AtomRunner != end(); ++AtomRunner)
148 for(BondList::iterator BondRunner = (*AtomRunner)->ListOfBonds.begin(); !(*AtomRunner)->ListOfBonds.empty(); BondRunner = (*AtomRunner)->ListOfBonds.begin())
149 if ((*BondRunner)->leftatom == *AtomRunner)
150 delete((*BondRunner));
[3c349b]151 BondCount = 0;
[cee0b57]152
153 // count atoms in molecule = dimension of matrix (also give each unique name and continuous numbering)
[a7b761b]154 DoLog(1) && (Log() << Verbose(1) << "AtomCount " << getAtomCount() << " and bonddistance is " << bonddistance << "." << endl);
[cee0b57]155
[c66537]156 if ((getAtomCount() > 1) && (bonddistance > 0.1)) {
[a67d19]157 DoLog(2) && (Log() << Verbose(2) << "Creating Linked Cell structure ... " << endl);
[af2c424]158 LC = new LinkedCell(*this, bonddistance);
[cee0b57]159
[b8b75d]160 // create a list to map Tesselpoint::nr to atom *
[a67d19]161 DoLog(2) && (Log() << Verbose(2) << "Creating TesselPoint to atom map ... " << endl);
[f2bb0f]162
[53731f]163 // set numbers for atoms that can later be used
164 int i=0;
165 for(internal_iterator iter = atoms.begin();iter!= atoms.end(); ++iter){
166 (*iter)->nr = i++;
[cee0b57]167 }
168
169 // 3a. go through every cell
[a67d19]170 DoLog(2) && (Log() << Verbose(2) << "Celling ... " << endl);
[b8b75d]171 for (LC->n[0] = 0; LC->n[0] < LC->N[0]; LC->n[0]++)
172 for (LC->n[1] = 0; LC->n[1] < LC->N[1]; LC->n[1]++)
173 for (LC->n[2] = 0; LC->n[2] < LC->N[2]; LC->n[2]++) {
[734816]174 const LinkedCell::LinkedNodes *List = LC->GetCurrentCell();
[e5ad5c]175// Log() << Verbose(2) << "Current cell is " << LC->n[0] << ", " << LC->n[1] << ", " << LC->n[2] << " with No. " << LC->index << " containing " << List->size() << " points." << endl;
[b8b75d]176 if (List != NULL) {
[734816]177 for (LinkedCell::LinkedNodes::const_iterator Runner = List->begin(); Runner != List->end(); Runner++) {
[f2bb0f]178 Walker = dynamic_cast<atom*>(*Runner);
179 ASSERT(Walker,"Tesselpoint that was not an atom retrieved from LinkedNode");
[e138de]180 //Log() << Verbose(0) << "Current Atom is " << *Walker << "." << endl;
[cee0b57]181 // 3c. check for possible bond between each atom in this and every one in the 27 cells
[9eefda]182 for (n[0] = -1; n[0] <= 1; n[0]++)
183 for (n[1] = -1; n[1] <= 1; n[1]++)
184 for (n[2] = -1; n[2] <= 1; n[2]++) {
[734816]185 const LinkedCell::LinkedNodes *OtherList = LC->GetRelativeToCurrentCell(n);
[e5ad5c]186// Log() << Verbose(2) << "Current relative cell is " << LC->n[0] << ", " << LC->n[1] << ", " << LC->n[2] << " with No. " << LC->index << " containing " << List->size() << " points." << endl;
[b8b75d]187 if (OtherList != NULL) {
[734816]188 for (LinkedCell::LinkedNodes::const_iterator OtherRunner = OtherList->begin(); OtherRunner != OtherList->end(); OtherRunner++) {
[b8b75d]189 if ((*OtherRunner)->nr > Walker->nr) {
[f2bb0f]190 OtherWalker = dynamic_cast<atom*>(*OtherRunner);
191 ASSERT(OtherWalker,"TesselPoint that was not an atom retrieved from LinkedNode");
[e138de]192 //Log() << Verbose(1) << "Checking distance " << OtherWalker->x.PeriodicDistanceSquared(&(Walker->x), cell_size) << " against typical bond length of " << bonddistance*bonddistance << "." << endl;
[e5ad5c]193 (BG->*minmaxdistance)(Walker, OtherWalker, MinDistance, MaxDistance, IsAngstroem);
[d74077]194 const double distance = domain.periodicDistanceSquared(OtherWalker->getPosition(),Walker->getPosition());
[b70721]195 const bool status = (distance <= MaxDistance * MaxDistance) && (distance >= MinDistance * MinDistance);
[e5ad5c]196// Log() << Verbose(1) << "MinDistance is " << MinDistance << " and MaxDistance is " << MaxDistance << "." << endl;
197 if (OtherWalker->father->nr > Walker->father->nr) {
198 if (status) { // create bond if distance is smaller
199// Log() << Verbose(1) << "Adding Bond between " << *Walker << " and " << *OtherWalker << " in distance " << sqrt(distance) << "." << endl;
200 AddBond(Walker->father, OtherWalker->father, 1); // also increases molecule::BondCount
201 } else {
202// Log() << Verbose(1) << "Not Adding: distance too great." << endl;
203 }
[b8b75d]204 } else {
[e5ad5c]205// Log() << Verbose(1) << "Not Adding: Wrong order of labels." << endl;
[b8b75d]206 }
[cee0b57]207 }
208 }
209 }
210 }
211 }
212 }
213 }
[9eefda]214 delete (LC);
[a67d19]215 DoLog(1) && (Log() << Verbose(1) << "I detected " << BondCount << " bonds in the molecule with distance " << BondDistance << "." << endl);
[cee0b57]216
[b8b75d]217 // correct bond degree by comparing valence and bond degree
[a67d19]218 DoLog(2) && (Log() << Verbose(2) << "Correcting bond degree ... " << endl);
[e138de]219 CorrectBondDegree();
[cee0b57]220
[b8b75d]221 // output bonds for debugging (if bond chain list was correctly installed)
[e138de]222 ActOnAllAtoms( &atom::OutputBondOfAtom );
[b8b75d]223 } else
[a7b761b]224 DoLog(1) && (Log() << Verbose(1) << "AtomCount is " << getAtomCount() << ", thus no bonds, no connections!." << endl);
[a67d19]225 DoLog(0) && (Log() << Verbose(0) << "End of CreateAdjacencyList." << endl);
[b70721]226 if (free_BG)
227 delete(BG);
[9eefda]228}
229;
[cee0b57]230
[e08c46]231/** Checks for presence of bonds within atom list.
232 * TODO: more sophisticated check for bond structure (e.g. connected subgraph, ...)
233 * \return true - bonds present, false - no bonds
234 */
235bool molecule::hasBondStructure()
236{
237 for(molecule::iterator AtomRunner = begin(); AtomRunner != end(); ++AtomRunner)
238 if (!(*AtomRunner)->ListOfBonds.empty())
239 return true;
240 return false;
241}
242
243/** Counts the number of present bonds.
244 * \return number of bonds
245 */
246unsigned int molecule::CountBonds() const
247{
248 unsigned int counter = 0;
249 for(molecule::const_iterator AtomRunner = begin(); AtomRunner != end(); ++AtomRunner)
250 for(BondList::const_iterator BondRunner = (*AtomRunner)->ListOfBonds.begin(); BondRunner != (*AtomRunner)->ListOfBonds.end(); ++BondRunner)
251 if ((*BondRunner)->leftatom == *AtomRunner)
252 counter++;
253 return counter;
254}
255
[b8b75d]256/** Prints a list of all bonds to \a *out.
257 * \param output stream
258 */
[e138de]259void molecule::OutputBondsList() const
[b8b75d]260{
[a67d19]261 DoLog(1) && (Log() << Verbose(1) << endl << "From contents of bond chain list:");
[e08c46]262 for(molecule::const_iterator AtomRunner = molecule::begin(); AtomRunner != molecule::end(); ++AtomRunner)
263 for(BondList::const_iterator BondRunner = (*AtomRunner)->ListOfBonds.begin(); BondRunner != (*AtomRunner)->ListOfBonds.end(); ++BondRunner)
264 if ((*BondRunner)->leftatom == *AtomRunner) {
265 DoLog(0) && (Log() << Verbose(0) << *(*BondRunner) << "\t" << endl);
266 }
[a67d19]267 DoLog(0) && (Log() << Verbose(0) << endl);
[9eefda]268}
269;
[cee0b57]270
[b8b75d]271/** correct bond degree by comparing valence and bond degree.
272 * correct Bond degree of each bond by checking both bond partners for a mismatch between valence and current sum of bond degrees,
273 * iteratively increase the one first where the other bond partner has the fewest number of bonds (i.e. in general bonds oxygene
274 * preferred over carbon bonds). Beforehand, we had picked the first mismatching partner, which lead to oxygenes with single instead of
275 * double bonds as was expected.
276 * \param *out output stream for debugging
277 * \return number of bonds that could not be corrected
278 */
[e138de]279int molecule::CorrectBondDegree() const
[b8b75d]280{
[99593f]281 int No = 0, OldNo = -1;
[b8b75d]282
283 if (BondCount != 0) {
[a67d19]284 DoLog(1) && (Log() << Verbose(1) << "Correcting Bond degree of each bond ... " << endl);
[b8b75d]285 do {
[99593f]286 OldNo = No;
[e138de]287 No = SumPerAtom( &atom::CorrectBondDegree );
[99593f]288 } while (OldNo != No);
[a67d19]289 DoLog(0) && (Log() << Verbose(0) << " done." << endl);
[b8b75d]290 } else {
[a7b761b]291 DoLog(1) && (Log() << Verbose(1) << "BondCount is " << BondCount << ", no bonds between any of the " << getAtomCount() << " atoms." << endl);
[b8b75d]292 }
[a67d19]293 DoLog(0) && (Log() << Verbose(0) << No << " bonds could not be corrected." << endl);
[cee0b57]294
[266237]295 return (No);
[9eefda]296}
297;
[cee0b57]298
299/** Counts all cyclic bonds and returns their number.
300 * \note Hydrogen bonds can never by cyclic, thus no check for that
301 * \param *out output stream for debugging
302 * \return number opf cyclic bonds
303 */
[e138de]304int molecule::CountCyclicBonds()
[cee0b57]305{
[266237]306 NoCyclicBonds = 0;
[cee0b57]307 int *MinimumRingSize = NULL;
308 MoleculeLeafClass *Subgraphs = NULL;
309 class StackClass<bond *> *BackEdgeStack = NULL;
[e08c46]310 for(molecule::iterator AtomRunner = begin(); AtomRunner != end(); ++AtomRunner)
311 if ((!(*AtomRunner)->ListOfBonds.empty()) && ((*(*AtomRunner)->ListOfBonds.begin())->Type == Undetermined)) {
312 DoLog(0) && (Log() << Verbose(0) << "No Depth-First-Search analysis performed so far, calling ..." << endl);
313 Subgraphs = DepthFirstSearchAnalysis(BackEdgeStack);
314 while (Subgraphs->next != NULL) {
315 Subgraphs = Subgraphs->next;
316 delete (Subgraphs->previous);
317 }
318 delete (Subgraphs);
319 delete[] (MinimumRingSize);
320 break;
[cee0b57]321 }
[e08c46]322 for(molecule::iterator AtomRunner = begin(); AtomRunner != end(); ++AtomRunner)
323 for(BondList::iterator BondRunner = (*AtomRunner)->ListOfBonds.begin(); BondRunner != (*AtomRunner)->ListOfBonds.end(); ++BondRunner)
324 if ((*BondRunner)->leftatom == *AtomRunner)
325 if ((*BondRunner)->Cyclic)
326 NoCyclicBonds++;
[9eefda]327 delete (BackEdgeStack);
[266237]328 return NoCyclicBonds;
[9eefda]329}
330;
[b8b75d]331
[cee0b57]332/** Returns Shading as a char string.
333 * \param color the Shading
334 * \return string of the flag
335 */
[fa649a]336string molecule::GetColor(enum Shading color) const
[cee0b57]337{
[9eefda]338 switch (color) {
[cee0b57]339 case white:
340 return "white";
341 break;
342 case lightgray:
343 return "lightgray";
344 break;
345 case darkgray:
346 return "darkgray";
347 break;
348 case black:
349 return "black";
350 break;
351 default:
352 return "uncolored";
353 break;
354 };
[9eefda]355}
356;
[cee0b57]357
[9eefda]358/** Sets atom::GraphNr and atom::LowpointNr to BFSAccounting::CurrentGraphNr.
359 * \param *out output stream for debugging
360 * \param *Walker current node
361 * \param &BFS structure with accounting data for BFS
362 */
[e138de]363void DepthFirstSearchAnalysis_SetWalkersGraphNr(atom *&Walker, struct DFSAccounting &DFS)
[174e0e]364{
[9eefda]365 if (!DFS.BackStepping) { // if we don't just return from (8)
366 Walker->GraphNr = DFS.CurrentGraphNr;
367 Walker->LowpointNr = DFS.CurrentGraphNr;
[68f03d]368 DoLog(1) && (Log() << Verbose(1) << "Setting Walker[" << Walker->getName() << "]'s number to " << Walker->GraphNr << " with Lowpoint " << Walker->LowpointNr << "." << endl);
[9eefda]369 DFS.AtomStack->Push(Walker);
370 DFS.CurrentGraphNr++;
[174e0e]371 }
[9eefda]372}
373;
[174e0e]374
[9eefda]375/** During DFS goes along unvisited bond and touches other atom.
376 * Sets bond::type, if
377 * -# BackEdge: set atom::LowpointNr and push on \a BackEdgeStack
378 * -# TreeEgde: set atom::Ancestor and continue with Walker along this edge
379 * Continue until molecule::FindNextUnused() finds no more unused bonds.
380 * \param *out output stream for debugging
381 * \param *mol molecule with atoms and finding unused bonds
382 * \param *&Binder current edge
383 * \param &DFS DFS accounting data
384 */
[e138de]385void DepthFirstSearchAnalysis_ProbeAlongUnusedBond(const molecule * const mol, atom *&Walker, bond *&Binder, struct DFSAccounting &DFS)
[174e0e]386{
387 atom *OtherAtom = NULL;
388
389 do { // (3) if Walker has no unused egdes, go to (5)
[9eefda]390 DFS.BackStepping = false; // reset backstepping flag for (8)
[174e0e]391 if (Binder == NULL) // if we don't just return from (11), Binder is already set to next unused
392 Binder = mol->FindNextUnused(Walker);
393 if (Binder == NULL)
394 break;
[a67d19]395 DoLog(2) && (Log() << Verbose(2) << "Current Unused Bond is " << *Binder << "." << endl);
[174e0e]396 // (4) Mark Binder used, ...
397 Binder->MarkUsed(black);
398 OtherAtom = Binder->GetOtherAtom(Walker);
[68f03d]399 DoLog(2) && (Log() << Verbose(2) << "(4) OtherAtom is " << OtherAtom->getName() << "." << endl);
[174e0e]400 if (OtherAtom->GraphNr != -1) {
401 // (4a) ... if "other" atom has been visited (GraphNr != 0), set lowpoint to minimum of both, go to (3)
402 Binder->Type = BackEdge;
[9eefda]403 DFS.BackEdgeStack->Push(Binder);
404 Walker->LowpointNr = (Walker->LowpointNr < OtherAtom->GraphNr) ? Walker->LowpointNr : OtherAtom->GraphNr;
[68f03d]405 DoLog(3) && (Log() << Verbose(3) << "(4a) Visited: Setting Lowpoint of Walker[" << Walker->getName() << "] to " << Walker->LowpointNr << "." << endl);
[174e0e]406 } else {
407 // (4b) ... otherwise set OtherAtom as Ancestor of Walker and Walker as OtherAtom, go to (2)
408 Binder->Type = TreeEdge;
409 OtherAtom->Ancestor = Walker;
410 Walker = OtherAtom;
[68f03d]411 DoLog(3) && (Log() << Verbose(3) << "(4b) Not Visited: OtherAtom[" << OtherAtom->getName() << "]'s Ancestor is now " << OtherAtom->Ancestor->getName() << ", Walker is OtherAtom " << OtherAtom->getName() << "." << endl);
[174e0e]412 break;
413 }
414 Binder = NULL;
[9eefda]415 } while (1); // (3)
416}
417;
[174e0e]418
[9eefda]419/** Checks whether we have a new component.
420 * if atom::LowpointNr of \a *&Walker is greater than atom::GraphNr of its atom::Ancestor, we have a new component.
421 * Meaning that if we touch upon a node who suddenly has a smaller atom::LowpointNr than its ancestor, then we
422 * have a found a new branch in the graph tree.
423 * \param *out output stream for debugging
424 * \param *mol molecule with atoms and finding unused bonds
425 * \param *&Walker current node
426 * \param &DFS DFS accounting data
427 */
[e138de]428void DepthFirstSearchAnalysis_CheckForaNewComponent(const molecule * const mol, atom *&Walker, struct DFSAccounting &DFS, MoleculeLeafClass *&LeafWalker)
[174e0e]429{
430 atom *OtherAtom = NULL;
431
432 // (5) if Ancestor of Walker is ...
[68f03d]433 DoLog(1) && (Log() << Verbose(1) << "(5) Number of Walker[" << Walker->getName() << "]'s Ancestor[" << Walker->Ancestor->getName() << "] is " << Walker->Ancestor->GraphNr << "." << endl);
[174e0e]434
[9eefda]435 if (Walker->Ancestor->GraphNr != DFS.Root->GraphNr) {
[174e0e]436 // (6) (Ancestor of Walker is not Root)
437 if (Walker->LowpointNr < Walker->Ancestor->GraphNr) {
438 // (6a) set Ancestor's Lowpoint number to minimum of of its Ancestor and itself, go to Step(8)
439 Walker->Ancestor->LowpointNr = (Walker->Ancestor->LowpointNr < Walker->LowpointNr) ? Walker->Ancestor->LowpointNr : Walker->LowpointNr;
[68f03d]440 DoLog(2) && (Log() << Verbose(2) << "(6) Setting Walker[" << Walker->getName() << "]'s Ancestor[" << Walker->Ancestor->getName() << "]'s Lowpoint to " << Walker->Ancestor->LowpointNr << "." << endl);
[174e0e]441 } else {
442 // (7) (Ancestor of Walker is a separating vertex, remove all from stack till Walker (including), these and Ancestor form a component
443 Walker->Ancestor->SeparationVertex = true;
[68f03d]444 DoLog(2) && (Log() << Verbose(2) << "(7) Walker[" << Walker->getName() << "]'s Ancestor[" << Walker->Ancestor->getName() << "]'s is a separating vertex, creating component." << endl);
[9eefda]445 mol->SetNextComponentNumber(Walker->Ancestor, DFS.ComponentNumber);
[68f03d]446 DoLog(3) && (Log() << Verbose(3) << "(7) Walker[" << Walker->getName() << "]'s Ancestor's Compont is " << DFS.ComponentNumber << "." << endl);
[9eefda]447 mol->SetNextComponentNumber(Walker, DFS.ComponentNumber);
[68f03d]448 DoLog(3) && (Log() << Verbose(3) << "(7) Walker[" << Walker->getName() << "]'s Compont is " << DFS.ComponentNumber << "." << endl);
[174e0e]449 do {
[9eefda]450 OtherAtom = DFS.AtomStack->PopLast();
[174e0e]451 LeafWalker->Leaf->AddCopyAtom(OtherAtom);
[9eefda]452 mol->SetNextComponentNumber(OtherAtom, DFS.ComponentNumber);
[68f03d]453 DoLog(3) && (Log() << Verbose(3) << "(7) Other[" << OtherAtom->getName() << "]'s Compont is " << DFS.ComponentNumber << "." << endl);
[174e0e]454 } while (OtherAtom != Walker);
[9eefda]455 DFS.ComponentNumber++;
[174e0e]456 }
457 // (8) Walker becomes its Ancestor, go to (3)
[68f03d]458 DoLog(2) && (Log() << Verbose(2) << "(8) Walker[" << Walker->getName() << "] is now its Ancestor " << Walker->Ancestor->getName() << ", backstepping. " << endl);
[174e0e]459 Walker = Walker->Ancestor;
[9eefda]460 DFS.BackStepping = true;
[174e0e]461 }
[9eefda]462}
463;
[174e0e]464
[9eefda]465/** Cleans the root stack when we have found a component.
466 * If we are not DFSAccounting::BackStepping, then we clear the root stack by putting everything into a
467 * component down till we meet DFSAccounting::Root.
468 * \param *out output stream for debugging
469 * \param *mol molecule with atoms and finding unused bonds
470 * \param *&Walker current node
471 * \param *&Binder current edge
472 * \param &DFS DFS accounting data
473 */
[e138de]474void DepthFirstSearchAnalysis_CleanRootStackDownTillWalker(const molecule * const mol, atom *&Walker, bond *&Binder, struct DFSAccounting &DFS, MoleculeLeafClass *&LeafWalker)
[174e0e]475{
476 atom *OtherAtom = NULL;
477
[9eefda]478 if (!DFS.BackStepping) { // coming from (8) want to go to (3)
[174e0e]479 // (9) remove all from stack till Walker (including), these and Root form a component
[99593f]480 //DFS.AtomStack->Output(out);
[9eefda]481 mol->SetNextComponentNumber(DFS.Root, DFS.ComponentNumber);
[68f03d]482 DoLog(3) && (Log() << Verbose(3) << "(9) Root[" << DFS.Root->getName() << "]'s Component is " << DFS.ComponentNumber << "." << endl);
[9eefda]483 mol->SetNextComponentNumber(Walker, DFS.ComponentNumber);
[68f03d]484 DoLog(3) && (Log() << Verbose(3) << "(9) Walker[" << Walker->getName() << "]'s Component is " << DFS.ComponentNumber << "." << endl);
[174e0e]485 do {
[9eefda]486 OtherAtom = DFS.AtomStack->PopLast();
[174e0e]487 LeafWalker->Leaf->AddCopyAtom(OtherAtom);
[9eefda]488 mol->SetNextComponentNumber(OtherAtom, DFS.ComponentNumber);
[68f03d]489 DoLog(3) && (Log() << Verbose(3) << "(7) Other[" << OtherAtom->getName() << "]'s Compont is " << DFS.ComponentNumber << "." << endl);
[174e0e]490 } while (OtherAtom != Walker);
[9eefda]491 DFS.ComponentNumber++;
[174e0e]492
493 // (11) Root is separation vertex, set Walker to Root and go to (4)
[9eefda]494 Walker = DFS.Root;
[174e0e]495 Binder = mol->FindNextUnused(Walker);
[68f03d]496 DoLog(1) && (Log() << Verbose(1) << "(10) Walker is Root[" << DFS.Root->getName() << "], next Unused Bond is " << Binder << "." << endl);
[174e0e]497 if (Binder != NULL) { // Root is separation vertex
[a67d19]498 DoLog(1) && (Log() << Verbose(1) << "(11) Root is a separation vertex." << endl);
[174e0e]499 Walker->SeparationVertex = true;
500 }
501 }
[9eefda]502}
503;
504
505/** Initializes DFSAccounting structure.
506 * \param *out output stream for debugging
507 * \param &DFS accounting structure to allocate
[7218f8]508 * \param *mol molecule with AtomCount, BondCount and all atoms
[9eefda]509 */
[e138de]510void DepthFirstSearchAnalysis_Init(struct DFSAccounting &DFS, const molecule * const mol)
[9eefda]511{
[ea7176]512 DFS.AtomStack = new StackClass<atom *> (mol->getAtomCount());
[9eefda]513 DFS.CurrentGraphNr = 0;
514 DFS.ComponentNumber = 0;
515 DFS.BackStepping = false;
[7218f8]516 mol->ResetAllBondsToUnused();
517 mol->SetAtomValueToValue(-1, &atom::GraphNr);
518 mol->ActOnAllAtoms(&atom::InitComponentNr);
519 DFS.BackEdgeStack->ClearStack();
[9eefda]520}
521;
[174e0e]522
[9eefda]523/** Free's DFSAccounting structure.
524 * \param *out output stream for debugging
525 * \param &DFS accounting structure to free
526 */
[e138de]527void DepthFirstSearchAnalysis_Finalize(struct DFSAccounting &DFS)
[9eefda]528{
529 delete (DFS.AtomStack);
[7218f8]530 // delete (DFS.BackEdgeStack); // DON'T free, see DepthFirstSearchAnalysis(), is returned as allocated
[9eefda]531}
532;
[174e0e]533
[cee0b57]534/** Performs a Depth-First search on this molecule.
535 * Marks bonds in molecule as cyclic, bridge, ... and atoms as
536 * articulations points, ...
537 * We use the algorithm from [Even, Graph Algorithms, p.62].
538 * \param *out output stream for debugging
539 * \param *&BackEdgeStack NULL pointer to StackClass with all the found back edges, allocated and filled on return
540 * \return list of each disconnected subgraph as an individual molecule class structure
541 */
[e138de]542MoleculeLeafClass * molecule::DepthFirstSearchAnalysis(class StackClass<bond *> *&BackEdgeStack) const
[cee0b57]543{
[9eefda]544 struct DFSAccounting DFS;
[cee0b57]545 BackEdgeStack = new StackClass<bond *> (BondCount);
[9eefda]546 DFS.BackEdgeStack = BackEdgeStack;
[cee0b57]547 MoleculeLeafClass *SubGraphs = new MoleculeLeafClass(NULL);
548 MoleculeLeafClass *LeafWalker = SubGraphs;
[9eefda]549 int OldGraphNr = 0;
[174e0e]550 atom *Walker = NULL;
[cee0b57]551 bond *Binder = NULL;
552
[a7b761b]553 if (getAtomCount() == 0)
[046783]554 return SubGraphs;
[a67d19]555 DoLog(0) && (Log() << Verbose(0) << "Begin of DepthFirstSearchAnalysis" << endl);
[e138de]556 DepthFirstSearchAnalysis_Init(DFS, this);
[cee0b57]557
[9879f6]558 for (molecule::const_iterator iter = begin(); iter != end();) {
559 DFS.Root = *iter;
[7218f8]560 // (1) mark all edges unused, empty stack, set atom->GraphNr = -1 for all
[9eefda]561 DFS.AtomStack->ClearStack();
[cee0b57]562
563 // put into new subgraph molecule and add this to list of subgraphs
564 LeafWalker = new MoleculeLeafClass(LeafWalker);
[5f612ee]565 LeafWalker->Leaf = World::getInstance().createMolecule();
[9eefda]566 LeafWalker->Leaf->AddCopyAtom(DFS.Root);
[cee0b57]567
[9eefda]568 OldGraphNr = DFS.CurrentGraphNr;
569 Walker = DFS.Root;
[cee0b57]570 do { // (10)
571 do { // (2) set number and Lowpoint of Atom to i, increase i, push current atom
[e138de]572 DepthFirstSearchAnalysis_SetWalkersGraphNr(Walker, DFS);
[174e0e]573
[e138de]574 DepthFirstSearchAnalysis_ProbeAlongUnusedBond(this, Walker, Binder, DFS);
[174e0e]575
[cee0b57]576 if (Binder == NULL) {
[a67d19]577 DoLog(2) && (Log() << Verbose(2) << "No more Unused Bonds." << endl);
[cee0b57]578 break;
579 } else
580 Binder = NULL;
[9eefda]581 } while (1); // (2)
[cee0b57]582
583 // if we came from backstepping, yet there were no more unused bonds, we end up here with no Ancestor, because Walker is Root! Then we are finished!
[9eefda]584 if ((Walker == DFS.Root) && (Binder == NULL))
[cee0b57]585 break;
586
[e138de]587 DepthFirstSearchAnalysis_CheckForaNewComponent(this, Walker, DFS, LeafWalker);
[174e0e]588
[e138de]589 DepthFirstSearchAnalysis_CleanRootStackDownTillWalker(this, Walker, Binder, DFS, LeafWalker);
[174e0e]590
[9eefda]591 } while ((DFS.BackStepping) || (Binder != NULL)); // (10) halt only if Root has no unused edges
[cee0b57]592
593 // From OldGraphNr to CurrentGraphNr ranges an disconnected subgraph
[a67d19]594 DoLog(0) && (Log() << Verbose(0) << "Disconnected subgraph ranges from " << OldGraphNr << " to " << DFS.CurrentGraphNr << "." << endl);
[986ed3]595 LeafWalker->Leaf->Output((ofstream *)&(Log() << Verbose(0)));
[a67d19]596 DoLog(0) && (Log() << Verbose(0) << endl);
[cee0b57]597
598 // step on to next root
[9879f6]599 while ((iter != end()) && ((*iter)->GraphNr != -1)) {
600 //Log() << Verbose(1) << "Current next subgraph root candidate is " << (*iter)->Name << "." << endl;
601 if ((*iter)->GraphNr != -1) // if already discovered, step on
602 iter++;
[cee0b57]603 }
604 }
605 // set cyclic bond criterium on "same LP" basis
[266237]606 CyclicBondAnalysis();
607
[e138de]608 OutputGraphInfoPerAtom();
[266237]609
[e138de]610 OutputGraphInfoPerBond();
[266237]611
612 // free all and exit
[e138de]613 DepthFirstSearchAnalysis_Finalize(DFS);
[a67d19]614 DoLog(0) && (Log() << Verbose(0) << "End of DepthFirstSearchAnalysis" << endl);
[266237]615 return SubGraphs;
[9eefda]616}
617;
[266237]618
619/** Scans through all bonds and set bond::Cyclic to true where atom::LowpointNr of both ends is equal: LP criterion.
620 */
[fa649a]621void molecule::CyclicBondAnalysis() const
[266237]622{
623 NoCyclicBonds = 0;
[e08c46]624 for(molecule::const_iterator AtomRunner = begin(); AtomRunner != end(); ++AtomRunner)
625 for(BondList::const_iterator BondRunner = (*AtomRunner)->ListOfBonds.begin(); BondRunner != (*AtomRunner)->ListOfBonds.end(); ++BondRunner)
626 if ((*BondRunner)->leftatom == *AtomRunner)
627 if ((*BondRunner)->rightatom->LowpointNr == (*BondRunner)->leftatom->LowpointNr) { // cyclic ??
628 (*BondRunner)->Cyclic = true;
629 NoCyclicBonds++;
630 }
[9eefda]631}
632;
[cee0b57]633
[266237]634/** Output graph information per atom.
635 * \param *out output stream
636 */
[e138de]637void molecule::OutputGraphInfoPerAtom() const
[266237]638{
[a67d19]639 DoLog(1) && (Log() << Verbose(1) << "Final graph info for each atom is:" << endl);
[e138de]640 ActOnAllAtoms( &atom::OutputGraphInfo );
[9eefda]641}
642;
[cee0b57]643
[266237]644/** Output graph information per bond.
645 * \param *out output stream
646 */
[e138de]647void molecule::OutputGraphInfoPerBond() const
[266237]648{
[e08c46]649 bond *Binder = NULL;
[a67d19]650 DoLog(1) && (Log() << Verbose(1) << "Final graph info for each bond is:" << endl);
[e08c46]651 for(molecule::const_iterator AtomRunner = begin(); AtomRunner != end(); ++AtomRunner)
[bd6bfa]652 for(BondList::const_iterator BondRunner = (*AtomRunner)->ListOfBonds.begin(); BondRunner != (*AtomRunner)->ListOfBonds.end(); ++BondRunner)
[e08c46]653 if ((*BondRunner)->leftatom == *AtomRunner) {
654 Binder = *BondRunner;
[f9183b]655 if (DoLog(2)) {
656 ostream &out = (Log() << Verbose(2));
657 out << ((Binder->Type == TreeEdge) ? "TreeEdge " : "BackEdge ") << *Binder << ": <";
658 out << ((Binder->leftatom->SeparationVertex) ? "SP," : "") << "L" << Binder->leftatom->LowpointNr << " G" << Binder->leftatom->GraphNr << " Comp.";
659 Binder->leftatom->OutputComponentNumber(&out);
660 out << " === ";
661 out << ((Binder->rightatom->SeparationVertex) ? "SP," : "") << "L" << Binder->rightatom->LowpointNr << " G" << Binder->rightatom->GraphNr << " Comp.";
662 Binder->rightatom->OutputComponentNumber(&out);
663 out << ">." << endl;
664 }
[e08c46]665 if (Binder->Cyclic) // cyclic ??
666 DoLog(3) && (Log() << Verbose(3) << "Lowpoint at each side are equal: CYCLIC!" << endl);
667 }
[9eefda]668}
669;
670
671/** Initialise each vertex as white with no predecessor, empty queue, color Root lightgray.
672 * \param *out output stream for debugging
673 * \param &BFS accounting structure
674 * \param AtomCount number of entries in the array to allocate
675 */
[e138de]676void InitializeBFSAccounting(struct BFSAccounting &BFS, int AtomCount)
[9eefda]677{
678 BFS.AtomCount = AtomCount;
[920c70]679 BFS.PredecessorList = new atom*[AtomCount];
680 BFS.ShortestPathList = new int[AtomCount];
681 BFS.ColorList = new enum Shading[AtomCount];
[9eefda]682 BFS.BFSStack = new StackClass<atom *> (AtomCount);
[c27778]683 BFS.TouchedStack = new StackClass<atom *> (AtomCount);
[9eefda]684
[920c70]685 for (int i = AtomCount; i--;) {
[9eefda]686 BFS.ShortestPathList[i] = -1;
[920c70]687 BFS.PredecessorList[i] = 0;
[c27778]688 BFS.ColorList[i] = white;
[920c70]689 }
[cee0b57]690};
691
[9eefda]692/** Free's accounting structure.
693 * \param *out output stream for debugging
694 * \param &BFS accounting structure
695 */
[e138de]696void FinalizeBFSAccounting(struct BFSAccounting &BFS)
[9eefda]697{
[920c70]698 delete[](BFS.PredecessorList);
699 delete[](BFS.ShortestPathList);
700 delete[](BFS.ColorList);
[9eefda]701 delete (BFS.BFSStack);
[c27778]702 delete (BFS.TouchedStack);
[9eefda]703 BFS.AtomCount = 0;
704};
705
706/** Clean the accounting structure.
707 * \param *out output stream for debugging
708 * \param &BFS accounting structure
[ef9aae]709 */
[e138de]710void CleanBFSAccounting(struct BFSAccounting &BFS)
[ef9aae]711{
[9eefda]712 atom *Walker = NULL;
713 while (!BFS.TouchedStack->IsEmpty()) {
714 Walker = BFS.TouchedStack->PopFirst();
715 BFS.PredecessorList[Walker->nr] = NULL;
716 BFS.ShortestPathList[Walker->nr] = -1;
717 BFS.ColorList[Walker->nr] = white;
[ef9aae]718 }
719};
720
[9eefda]721/** Resets shortest path list and BFSStack.
722 * \param *out output stream for debugging
723 * \param *&Walker current node, pushed onto BFSAccounting::BFSStack and BFSAccounting::TouchedStack
724 * \param &BFS accounting structure
725 */
[e138de]726void ResetBFSAccounting(atom *&Walker, struct BFSAccounting &BFS)
[ef9aae]727{
[9eefda]728 BFS.ShortestPathList[Walker->nr] = 0;
729 BFS.BFSStack->ClearStack(); // start with empty BFS stack
730 BFS.BFSStack->Push(Walker);
731 BFS.TouchedStack->Push(Walker);
[ef9aae]732};
733
[9eefda]734/** Performs a BFS from \a *Root, trying to find the same node and hence a cycle.
735 * \param *out output stream for debugging
736 * \param *&BackEdge the edge from root that we don't want to move along
737 * \param &BFS accounting structure
738 */
[e138de]739void CyclicStructureAnalysis_CyclicBFSFromRootToRoot(bond *&BackEdge, struct BFSAccounting &BFS)
[ef9aae]740{
741 atom *Walker = NULL;
742 atom *OtherAtom = NULL;
[9eefda]743 do { // look for Root
744 Walker = BFS.BFSStack->PopFirst();
[a67d19]745 DoLog(2) && (Log() << Verbose(2) << "Current Walker is " << *Walker << ", we look for SP to Root " << *BFS.Root << "." << endl);
[ef9aae]746 for (BondList::const_iterator Runner = Walker->ListOfBonds.begin(); Runner != Walker->ListOfBonds.end(); (++Runner)) {
747 if ((*Runner) != BackEdge) { // only walk along DFS spanning tree (otherwise we always find SP of one being backedge Binder)
748 OtherAtom = (*Runner)->GetOtherAtom(Walker);
[9eefda]749#ifdef ADDHYDROGEN
[83f176]750 if (OtherAtom->getType()->getAtomicNumber() != 1) {
[9eefda]751#endif
[68f03d]752 DoLog(2) && (Log() << Verbose(2) << "Current OtherAtom is: " << OtherAtom->getName() << " for bond " << *(*Runner) << "." << endl);
[9eefda]753 if (BFS.ColorList[OtherAtom->nr] == white) {
754 BFS.TouchedStack->Push(OtherAtom);
755 BFS.ColorList[OtherAtom->nr] = lightgray;
756 BFS.PredecessorList[OtherAtom->nr] = Walker; // Walker is the predecessor
757 BFS.ShortestPathList[OtherAtom->nr] = BFS.ShortestPathList[Walker->nr] + 1;
[68f03d]758 DoLog(2) && (Log() << Verbose(2) << "Coloring OtherAtom " << OtherAtom->getName() << " lightgray, its predecessor is " << Walker->getName() << " and its Shortest Path is " << BFS.ShortestPathList[OtherAtom->nr] << " egde(s) long." << endl);
[9eefda]759 //if (BFS.ShortestPathList[OtherAtom->nr] < MinimumRingSize[Walker->GetTrueFather()->nr]) { // Check for maximum distance
[a67d19]760 DoLog(3) && (Log() << Verbose(3) << "Putting OtherAtom into queue." << endl);
[9eefda]761 BFS.BFSStack->Push(OtherAtom);
762 //}
[ef9aae]763 } else {
[a67d19]764 DoLog(3) && (Log() << Verbose(3) << "Not Adding, has already been visited." << endl);
[ef9aae]765 }
[9eefda]766 if (OtherAtom == BFS.Root)
767 break;
768#ifdef ADDHYDROGEN
769 } else {
[a67d19]770 DoLog(2) && (Log() << Verbose(2) << "Skipping hydrogen atom " << *OtherAtom << "." << endl);
[9eefda]771 BFS.ColorList[OtherAtom->nr] = black;
772 }
773#endif
[ef9aae]774 } else {
[a67d19]775 DoLog(2) && (Log() << Verbose(2) << "Bond " << *(*Runner) << " not Visiting, is the back edge." << endl);
[ef9aae]776 }
777 }
[9eefda]778 BFS.ColorList[Walker->nr] = black;
[68f03d]779 DoLog(1) && (Log() << Verbose(1) << "Coloring Walker " << Walker->getName() << " black." << endl);
[9eefda]780 if (OtherAtom == BFS.Root) { // if we have found the root, check whether this cycle wasn't already found beforehand
[ef9aae]781 // step through predecessor list
782 while (OtherAtom != BackEdge->rightatom) {
[9eefda]783 if (!OtherAtom->GetTrueFather()->IsCyclic) // if one bond in the loop is not marked as cyclic, we haven't found this cycle yet
[ef9aae]784 break;
785 else
[9eefda]786 OtherAtom = BFS.PredecessorList[OtherAtom->nr];
[ef9aae]787 }
788 if (OtherAtom == BackEdge->rightatom) { // if each atom in found cycle is cyclic, loop's been found before already
[a67d19]789 DoLog(3) && (Log() << Verbose(3) << "This cycle was already found before, skipping and removing seeker from search." << endl);
[ef9aae]790 do {
[9eefda]791 OtherAtom = BFS.TouchedStack->PopLast();
792 if (BFS.PredecessorList[OtherAtom->nr] == Walker) {
[a67d19]793 DoLog(4) && (Log() << Verbose(4) << "Removing " << *OtherAtom << " from lists and stacks." << endl);
[9eefda]794 BFS.PredecessorList[OtherAtom->nr] = NULL;
795 BFS.ShortestPathList[OtherAtom->nr] = -1;
796 BFS.ColorList[OtherAtom->nr] = white;
797 BFS.BFSStack->RemoveItem(OtherAtom);
[ef9aae]798 }
[9eefda]799 } while ((!BFS.TouchedStack->IsEmpty()) && (BFS.PredecessorList[OtherAtom->nr] == NULL));
800 BFS.TouchedStack->Push(OtherAtom); // last was wrongly popped
[ef9aae]801 OtherAtom = BackEdge->rightatom; // set to not Root
802 } else
[9eefda]803 OtherAtom = BFS.Root;
[ef9aae]804 }
[9eefda]805 } while ((!BFS.BFSStack->IsEmpty()) && (OtherAtom != BFS.Root) && (OtherAtom != NULL)); // || (ShortestPathList[OtherAtom->nr] < MinimumRingSize[Walker->GetTrueFather()->nr])));
[ef9aae]806};
807
[9eefda]808/** Climb back the BFSAccounting::PredecessorList and find cycle members.
809 * \param *out output stream for debugging
810 * \param *&OtherAtom
811 * \param *&BackEdge denotes the edge we did not want to travel along when doing CyclicBFSFromRootToRoot()
812 * \param &BFS accounting structure
813 * \param *&MinimumRingSize minimum distance from this node possible without encountering oneself, set on return for each atom
814 * \param &MinRingSize global minimum distance from one node without encountering oneself, set on return
815 */
[e138de]816void CyclicStructureAnalysis_RetrieveCycleMembers(atom *&OtherAtom, bond *&BackEdge, struct BFSAccounting &BFS, int *&MinimumRingSize, int &MinRingSize)
[ef9aae]817{
818 atom *Walker = NULL;
819 int NumCycles = 0;
820 int RingSize = -1;
821
[9eefda]822 if (OtherAtom == BFS.Root) {
[ef9aae]823 // now climb back the predecessor list and thus find the cycle members
824 NumCycles++;
825 RingSize = 1;
[9eefda]826 BFS.Root->GetTrueFather()->IsCyclic = true;
[a67d19]827 DoLog(1) && (Log() << Verbose(1) << "Found ring contains: ");
[9eefda]828 Walker = BFS.Root;
[ef9aae]829 while (Walker != BackEdge->rightatom) {
[68f03d]830 DoLog(0) && (Log() << Verbose(0) << Walker->getName() << " <-> ");
[9eefda]831 Walker = BFS.PredecessorList[Walker->nr];
[ef9aae]832 Walker->GetTrueFather()->IsCyclic = true;
833 RingSize++;
834 }
[68f03d]835 DoLog(0) && (Log() << Verbose(0) << Walker->getName() << " with a length of " << RingSize << "." << endl << endl);
[ef9aae]836 // walk through all and set MinimumRingSize
[9eefda]837 Walker = BFS.Root;
[ef9aae]838 MinimumRingSize[Walker->GetTrueFather()->nr] = RingSize;
839 while (Walker != BackEdge->rightatom) {
[9eefda]840 Walker = BFS.PredecessorList[Walker->nr];
[ef9aae]841 if (RingSize < MinimumRingSize[Walker->GetTrueFather()->nr])
842 MinimumRingSize[Walker->GetTrueFather()->nr] = RingSize;
843 }
844 if ((RingSize < MinRingSize) || (MinRingSize == -1))
845 MinRingSize = RingSize;
846 } else {
[c27778]847 DoLog(1) && (Log() << Verbose(1) << "No ring containing " << *BFS.Root << " with length equal to or smaller than " << MinimumRingSize[BFS.Root->GetTrueFather()->nr] << " found." << endl);
[ef9aae]848 }
849};
850
[9eefda]851/** From a given node performs a BFS to touch the next cycle, for whose nodes \a *&MinimumRingSize is set and set it accordingly.
852 * \param *out output stream for debugging
853 * \param *&Root node to look for closest cycle from, i.e. \a *&MinimumRingSize is set for this node
854 * \param *&MinimumRingSize minimum distance from this node possible without encountering oneself, set on return for each atom
855 * \param AtomCount number of nodes in graph
856 */
[e138de]857void CyclicStructureAnalysis_BFSToNextCycle(atom *&Root, atom *&Walker, int *&MinimumRingSize, int AtomCount)
[ef9aae]858{
[9eefda]859 struct BFSAccounting BFS;
[ef9aae]860 atom *OtherAtom = Walker;
861
[e138de]862 InitializeBFSAccounting(BFS, AtomCount);
[ef9aae]863
[e138de]864 ResetBFSAccounting(Walker, BFS);
[9eefda]865 while (OtherAtom != NULL) { // look for Root
866 Walker = BFS.BFSStack->PopFirst();
[e138de]867 //Log() << Verbose(2) << "Current Walker is " << *Walker << ", we look for SP to Root " << *Root << "." << endl;
[ef9aae]868 for (BondList::const_iterator Runner = Walker->ListOfBonds.begin(); Runner != Walker->ListOfBonds.end(); (++Runner)) {
[9eefda]869 // "removed (*Runner) != BackEdge) || " from next if, is u
870 if ((Walker->ListOfBonds.size() == 1)) { // only walk along DFS spanning tree (otherwise we always find SP of 1 being backedge Binder), but terminal hydrogens may be connected via backedge, hence extra check
[ef9aae]871 OtherAtom = (*Runner)->GetOtherAtom(Walker);
[e138de]872 //Log() << Verbose(2) << "Current OtherAtom is: " << OtherAtom->Name << " for bond " << *Binder << "." << endl;
[9eefda]873 if (BFS.ColorList[OtherAtom->nr] == white) {
874 BFS.TouchedStack->Push(OtherAtom);
875 BFS.ColorList[OtherAtom->nr] = lightgray;
876 BFS.PredecessorList[OtherAtom->nr] = Walker; // Walker is the predecessor
877 BFS.ShortestPathList[OtherAtom->nr] = BFS.ShortestPathList[Walker->nr] + 1;
[e138de]878 //Log() << Verbose(2) << "Coloring OtherAtom " << OtherAtom->Name << " lightgray, its predecessor is " << Walker->Name << " and its Shortest Path is " << ShortestPathList[OtherAtom->nr] << " egde(s) long." << endl;
[ef9aae]879 if (OtherAtom->GetTrueFather()->IsCyclic) { // if the other atom is connected to a ring
[9eefda]880 MinimumRingSize[Root->GetTrueFather()->nr] = BFS.ShortestPathList[OtherAtom->nr] + MinimumRingSize[OtherAtom->GetTrueFather()->nr];
[ef9aae]881 OtherAtom = NULL; //break;
882 break;
883 } else
[9eefda]884 BFS.BFSStack->Push(OtherAtom);
[ef9aae]885 } else {
[e138de]886 //Log() << Verbose(3) << "Not Adding, has already been visited." << endl;
[ef9aae]887 }
888 } else {
[e138de]889 //Log() << Verbose(3) << "Not Visiting, is a back edge." << endl;
[ef9aae]890 }
891 }
[9eefda]892 BFS.ColorList[Walker->nr] = black;
[e138de]893 //Log() << Verbose(1) << "Coloring Walker " << Walker->Name << " black." << endl;
[ef9aae]894 }
895 //CleanAccountingLists(TouchedStack, PredecessorList, ShortestPathList, ColorList);
896
[e138de]897 FinalizeBFSAccounting(BFS);
[9eefda]898}
899;
[ef9aae]900
[9eefda]901/** All nodes that are not in cycles get assigned a \a *&MinimumRingSizeby BFS to next cycle.
902 * \param *out output stream for debugging
903 * \param *&MinimumRingSize array with minimum distance without encountering onself for each atom
904 * \param &MinRingSize global minium distance
905 * \param &NumCyles number of cycles in graph
906 * \param *mol molecule with atoms
907 */
[e138de]908void CyclicStructureAnalysis_AssignRingSizetoNonCycleMembers(int *&MinimumRingSize, int &MinRingSize, int &NumCycles, const molecule * const mol)
[ef9aae]909{
[9eefda]910 atom *Root = NULL;
[ef9aae]911 atom *Walker = NULL;
912 if (MinRingSize != -1) { // if rings are present
913 // go over all atoms
[9879f6]914 for (molecule::const_iterator iter = mol->begin(); iter != mol->end(); ++iter) {
915 Root = *iter;
[ef9aae]916
[ea7176]917 if (MinimumRingSize[Root->GetTrueFather()->nr] == mol->getAtomCount()) { // check whether MinimumRingSize is set, if not BFS to next where it is
[ef9aae]918 Walker = Root;
919
[e138de]920 //Log() << Verbose(1) << "---------------------------------------------------------------------------------------------------------" << endl;
[ea7176]921 CyclicStructureAnalysis_BFSToNextCycle(Root, Walker, MinimumRingSize, mol->getAtomCount());
[ef9aae]922
923 }
[a67d19]924 DoLog(1) && (Log() << Verbose(1) << "Minimum ring size of " << *Root << " is " << MinimumRingSize[Root->GetTrueFather()->nr] << "." << endl);
[ef9aae]925 }
[a67d19]926 DoLog(1) && (Log() << Verbose(1) << "Minimum ring size is " << MinRingSize << ", over " << NumCycles << " cycles total." << endl);
[ef9aae]927 } else
[a67d19]928 DoLog(1) && (Log() << Verbose(1) << "No rings were detected in the molecular structure." << endl);
[9eefda]929}
930;
[ef9aae]931
[cee0b57]932/** Analyses the cycles found and returns minimum of all cycle lengths.
933 * We begin with a list of Back edges found during DepthFirstSearchAnalysis(). We go through this list - one end is the Root,
934 * the other our initial Walker - and do a Breadth First Search for the Root. We mark down each Predecessor and as soon as
935 * we have found the Root via BFS, we may climb back the closed cycle via the Predecessors. Thereby we mark atoms and bonds
936 * as cyclic and print out the cycles.
937 * \param *out output stream for debugging
938 * \param *BackEdgeStack stack with all back edges found during DFS scan. Beware: This stack contains the bonds from the total molecule, not from the subgraph!
939 * \param *&MinimumRingSize contains smallest ring size in molecular structure on return or -1 if no rings were found, if set is maximum search distance
940 * \todo BFS from the not-same-LP to find back to starting point of tributary cycle over more than one bond
941 */
[e138de]942void molecule::CyclicStructureAnalysis(class StackClass<bond *> * BackEdgeStack, int *&MinimumRingSize) const
[cee0b57]943{
[9eefda]944 struct BFSAccounting BFS;
[ef9aae]945 atom *Walker = NULL;
946 atom *OtherAtom = NULL;
947 bond *BackEdge = NULL;
948 int NumCycles = 0;
949 int MinRingSize = -1;
[cee0b57]950
[ea7176]951 InitializeBFSAccounting(BFS, getAtomCount());
[cee0b57]952
[e138de]953 //Log() << Verbose(1) << "Back edge list - ";
[99593f]954 //BackEdgeStack->Output(out);
[cee0b57]955
[a67d19]956 DoLog(1) && (Log() << Verbose(1) << "Analysing cycles ... " << endl);
[cee0b57]957 NumCycles = 0;
958 while (!BackEdgeStack->IsEmpty()) {
959 BackEdge = BackEdgeStack->PopFirst();
960 // this is the target
[9eefda]961 BFS.Root = BackEdge->leftatom;
[cee0b57]962 // this is the source point
963 Walker = BackEdge->rightatom;
964
[e138de]965 ResetBFSAccounting(Walker, BFS);
[cee0b57]966
[a67d19]967 DoLog(1) && (Log() << Verbose(1) << "---------------------------------------------------------------------------------------------------------" << endl);
[ef9aae]968 OtherAtom = NULL;
[e138de]969 CyclicStructureAnalysis_CyclicBFSFromRootToRoot(BackEdge, BFS);
[cee0b57]970
[e138de]971 CyclicStructureAnalysis_RetrieveCycleMembers(OtherAtom, BackEdge, BFS, MinimumRingSize, MinRingSize);
[cee0b57]972
[e138de]973 CleanBFSAccounting(BFS);
[ef9aae]974 }
[e138de]975 FinalizeBFSAccounting(BFS);
[ef9aae]976
[e138de]977 CyclicStructureAnalysis_AssignRingSizetoNonCycleMembers(MinimumRingSize, MinRingSize, NumCycles, this);
[fa649a]978};
[cee0b57]979
980/** Sets the next component number.
981 * This is O(N) as the number of bonds per atom is bound.
982 * \param *vertex atom whose next atom::*ComponentNr is to be set
983 * \param nr number to use
984 */
[fa649a]985void molecule::SetNextComponentNumber(atom *vertex, int nr) const
[cee0b57]986{
[9eefda]987 size_t i = 0;
[cee0b57]988 if (vertex != NULL) {
[9eefda]989 for (; i < vertex->ListOfBonds.size(); i++) {
990 if (vertex->ComponentNr[i] == -1) { // check if not yet used
[cee0b57]991 vertex->ComponentNr[i] = nr;
992 break;
[9eefda]993 } else if (vertex->ComponentNr[i] == nr) // if number is already present, don't add another time
994 break; // breaking here will not cause error!
[cee0b57]995 }
[e359a8]996 if (i == vertex->ListOfBonds.size()) {
[58ed4a]997 DoeLog(0) && (eLog()<< Verbose(0) << "Error: All Component entries are already occupied!" << endl);
[e359a8]998 performCriticalExit();
999 }
1000 } else {
[58ed4a]1001 DoeLog(0) && (eLog()<< Verbose(0) << "Error: Given vertex is NULL!" << endl);
[e359a8]1002 performCriticalExit();
1003 }
[9eefda]1004}
1005;
[cee0b57]1006
1007/** Returns next unused bond for this atom \a *vertex or NULL of none exists.
1008 * \param *vertex atom to regard
1009 * \return bond class or NULL
1010 */
[fa649a]1011bond * molecule::FindNextUnused(atom *vertex) const
[cee0b57]1012{
[266237]1013 for (BondList::const_iterator Runner = vertex->ListOfBonds.begin(); Runner != vertex->ListOfBonds.end(); (++Runner))
1014 if ((*Runner)->IsUsed() == white)
[9eefda]1015 return ((*Runner));
[cee0b57]1016 return NULL;
[9eefda]1017}
1018;
[cee0b57]1019
1020/** Resets bond::Used flag of all bonds in this molecule.
1021 * \return true - success, false - -failure
1022 */
[fa649a]1023void molecule::ResetAllBondsToUnused() const
[cee0b57]1024{
[e08c46]1025 for(molecule::const_iterator AtomRunner = begin(); AtomRunner != end(); ++AtomRunner)
1026 for(BondList::const_iterator BondRunner = (*AtomRunner)->ListOfBonds.begin(); BondRunner != (*AtomRunner)->ListOfBonds.end(); ++BondRunner)
1027 if ((*BondRunner)->leftatom == *AtomRunner)
1028 (*BondRunner)->ResetUsed();
[9eefda]1029}
1030;
[cee0b57]1031
1032/** Output a list of flags, stating whether the bond was visited or not.
1033 * \param *out output stream for debugging
1034 * \param *list
1035 */
[e138de]1036void OutputAlreadyVisited(int *list)
[cee0b57]1037{
[a67d19]1038 DoLog(4) && (Log() << Verbose(4) << "Already Visited Bonds:\t");
[9eefda]1039 for (int i = 1; i <= list[0]; i++)
[a67d19]1040 DoLog(0) && (Log() << Verbose(0) << list[i] << " ");
1041 DoLog(0) && (Log() << Verbose(0) << endl);
[9eefda]1042}
1043;
[cee0b57]1044
1045/** Storing the bond structure of a molecule to file.
1046 * Simply stores Atom::nr and then the Atom::nr of all bond partners per line.
[35b698]1047 * \param &filename name of file
1048 * \param path path to file, defaults to empty
[cee0b57]1049 * \return true - file written successfully, false - writing failed
1050 */
[35b698]1051bool molecule::StoreAdjacencyToFile(std::string &filename, std::string path)
[cee0b57]1052{
1053 ofstream AdjacencyFile;
[35b698]1054 string line;
[cee0b57]1055 bool status = true;
1056
[35b698]1057 if (path != "")
1058 line = path + "/" + filename;
[8ab0407]1059 else
[35b698]1060 line = filename;
1061 AdjacencyFile.open(line.c_str(), ios::out);
[acf800]1062 DoLog(1) && (Log() << Verbose(1) << "Saving adjacency list ... " << endl);
[35b698]1063 if (AdjacencyFile.good()) {
[1f1b23]1064 AdjacencyFile << "m\tn" << endl;
[9eefda]1065 ActOnAllAtoms(&atom::OutputAdjacency, &AdjacencyFile);
[cee0b57]1066 AdjacencyFile.close();
[acf800]1067 DoLog(1) && (Log() << Verbose(1) << "\t... done." << endl);
[cee0b57]1068 } else {
[35b698]1069 DoLog(1) && (Log() << Verbose(1) << "\t... failed to open file " << line << "." << endl);
[cee0b57]1070 status = false;
1071 }
1072
1073 return status;
[9eefda]1074}
1075;
[cee0b57]1076
[1f1b23]1077/** Storing the bond structure of a molecule to file.
1078 * Simply stores Atom::nr and then the Atom::nr of all bond partners, one per line.
[35b698]1079 * \param &filename name of file
1080 * \param path path to file, defaults to empty
[1f1b23]1081 * \return true - file written successfully, false - writing failed
1082 */
[35b698]1083bool molecule::StoreBondsToFile(std::string &filename, std::string path)
[1f1b23]1084{
1085 ofstream BondFile;
[35b698]1086 string line;
[1f1b23]1087 bool status = true;
1088
[35b698]1089 if (path != "")
1090 line = path + "/" + filename;
[8ab0407]1091 else
[35b698]1092 line = filename;
1093 BondFile.open(line.c_str(), ios::out);
[acf800]1094 DoLog(1) && (Log() << Verbose(1) << "Saving adjacency list ... " << endl);
[35b698]1095 if (BondFile.good()) {
[1f1b23]1096 BondFile << "m\tn" << endl;
1097 ActOnAllAtoms(&atom::OutputBonds, &BondFile);
1098 BondFile.close();
[acf800]1099 DoLog(1) && (Log() << Verbose(1) << "\t... done." << endl);
[1f1b23]1100 } else {
[35b698]1101 DoLog(1) && (Log() << Verbose(1) << "\t... failed to open file " << line << "." << endl);
[1f1b23]1102 status = false;
1103 }
1104
1105 return status;
1106}
1107;
1108
[35b698]1109bool CheckAdjacencyFileAgainstMolecule_Init(std::string &path, ifstream &File, int *&CurrentBonds)
[ba4170]1110{
[35b698]1111 string filename;
1112 filename = path + ADJACENCYFILE;
1113 File.open(filename.c_str(), ios::out);
[0de7e8]1114 DoLog(1) && (Log() << Verbose(1) << "Looking at bond structure stored in adjacency file and comparing to present one ... " << endl);
[35b698]1115 if (File.fail())
[ba4170]1116 return false;
1117
1118 // allocate storage structure
[920c70]1119 CurrentBonds = new int[8]; // contains parsed bonds of current atom
1120 for(int i=0;i<8;i++)
1121 CurrentBonds[i] = 0;
[ba4170]1122 return true;
[9eefda]1123}
1124;
[ba4170]1125
[e138de]1126void CheckAdjacencyFileAgainstMolecule_Finalize(ifstream &File, int *&CurrentBonds)
[ba4170]1127{
1128 File.close();
1129 File.clear();
[920c70]1130 delete[](CurrentBonds);
[9eefda]1131}
1132;
[ba4170]1133
[e138de]1134void CheckAdjacencyFileAgainstMolecule_CompareBonds(bool &status, int &NonMatchNumber, atom *&Walker, size_t &CurrentBondsOfAtom, int AtomNr, int *&CurrentBonds, atom **ListOfAtoms)
[ba4170]1135{
1136 size_t j = 0;
1137 int id = -1;
1138
[e138de]1139 //Log() << Verbose(2) << "Walker is " << *Walker << ", bond partners: ";
[ba4170]1140 if (CurrentBondsOfAtom == Walker->ListOfBonds.size()) {
1141 for (BondList::const_iterator Runner = Walker->ListOfBonds.begin(); Runner != Walker->ListOfBonds.end(); (++Runner)) {
1142 id = (*Runner)->GetOtherAtom(Walker)->nr;
1143 j = 0;
[9eefda]1144 for (; (j < CurrentBondsOfAtom) && (CurrentBonds[j++] != id);)
[ba4170]1145 ; // check against all parsed bonds
[9eefda]1146 if (CurrentBonds[j - 1] != id) { // no match ? Then mark in ListOfAtoms
[ba4170]1147 ListOfAtoms[AtomNr] = NULL;
1148 NonMatchNumber++;
1149 status = false;
[0de7e8]1150 DoeLog(2) && (eLog() << Verbose(2) << id << " can not be found in list." << endl);
[ba4170]1151 } else {
[0de7e8]1152 //Log() << Verbose(0) << "[" << id << "]\t";
[ba4170]1153 }
1154 }
[e138de]1155 //Log() << Verbose(0) << endl;
[ba4170]1156 } else {
[a67d19]1157 DoLog(0) && (Log() << Verbose(0) << "Number of bonds for Atom " << *Walker << " does not match, parsed " << CurrentBondsOfAtom << " against " << Walker->ListOfBonds.size() << "." << endl);
[ba4170]1158 status = false;
1159 }
[9eefda]1160}
1161;
[ba4170]1162
[cee0b57]1163/** Checks contents of adjacency file against bond structure in structure molecule.
1164 * \param *out output stream for debugging
1165 * \param *path path to file
1166 * \param **ListOfAtoms allocated (molecule::AtomCount) and filled lookup table for ids (Atom::nr) to *Atom
1167 * \return true - structure is equal, false - not equivalence
1168 */
[35b698]1169bool molecule::CheckAdjacencyFileAgainstMolecule(std::string &path, atom **ListOfAtoms)
[cee0b57]1170{
1171 ifstream File;
1172 bool status = true;
[266237]1173 atom *Walker = NULL;
[ba4170]1174 int *CurrentBonds = NULL;
[9eefda]1175 int NonMatchNumber = 0; // will number of atoms with differing bond structure
[ba4170]1176 size_t CurrentBondsOfAtom = -1;
[0de7e8]1177 const int AtomCount = getAtomCount();
[cee0b57]1178
[e138de]1179 if (!CheckAdjacencyFileAgainstMolecule_Init(path, File, CurrentBonds)) {
[a67d19]1180 DoLog(1) && (Log() << Verbose(1) << "Adjacency file not found." << endl);
[ba4170]1181 return true;
1182 }
1183
[920c70]1184 char buffer[MAXSTRINGSIZE];
[ba4170]1185 // Parse the file line by line and count the bonds
1186 while (!File.eof()) {
1187 File.getline(buffer, MAXSTRINGSIZE);
1188 stringstream line;
1189 line.str(buffer);
1190 int AtomNr = -1;
1191 line >> AtomNr;
1192 CurrentBondsOfAtom = -1; // we count one too far due to line end
1193 // parse into structure
[0de7e8]1194 if ((AtomNr >= 0) && (AtomNr < AtomCount)) {
[ba4170]1195 Walker = ListOfAtoms[AtomNr];
1196 while (!line.eof())
[9eefda]1197 line >> CurrentBonds[++CurrentBondsOfAtom];
[ba4170]1198 // compare against present bonds
[e138de]1199 CheckAdjacencyFileAgainstMolecule_CompareBonds(status, NonMatchNumber, Walker, CurrentBondsOfAtom, AtomNr, CurrentBonds, ListOfAtoms);
[0de7e8]1200 } else {
1201 if (AtomNr != -1)
1202 DoeLog(2) && (eLog() << Verbose(2) << AtomNr << " is not valid in the range of ids [" << 0 << "," << AtomCount << ")." << endl);
[ba4170]1203 }
[cee0b57]1204 }
[e138de]1205 CheckAdjacencyFileAgainstMolecule_Finalize(File, CurrentBonds);
[cee0b57]1206
[ba4170]1207 if (status) { // if equal we parse the KeySetFile
[a67d19]1208 DoLog(1) && (Log() << Verbose(1) << "done: Equal." << endl);
[ba4170]1209 } else
[a67d19]1210 DoLog(1) && (Log() << Verbose(1) << "done: Not equal by " << NonMatchNumber << " atoms." << endl);
[cee0b57]1211 return status;
[9eefda]1212}
1213;
[cee0b57]1214
1215/** Picks from a global stack with all back edges the ones in the fragment.
1216 * \param *out output stream for debugging
1217 * \param **ListOfLocalAtoms array of father atom::nr to local atom::nr (reverse of atom::father)
1218 * \param *ReferenceStack stack with all the back egdes
1219 * \param *LocalStack stack to be filled
1220 * \return true - everything ok, false - ReferenceStack was empty
1221 */
[e138de]1222bool molecule::PickLocalBackEdges(atom **ListOfLocalAtoms, class StackClass<bond *> *&ReferenceStack, class StackClass<bond *> *&LocalStack) const
[cee0b57]1223{
1224 bool status = true;
1225 if (ReferenceStack->IsEmpty()) {
[a67d19]1226 DoLog(1) && (Log() << Verbose(1) << "ReferenceStack is empty!" << endl);
[cee0b57]1227 return false;
1228 }
1229 bond *Binder = ReferenceStack->PopFirst();
[9eefda]1230 bond *FirstBond = Binder; // mark the first bond, so that we don't loop through the stack indefinitely
[cee0b57]1231 atom *Walker = NULL, *OtherAtom = NULL;
1232 ReferenceStack->Push(Binder);
1233
[9eefda]1234 do { // go through all bonds and push local ones
1235 Walker = ListOfLocalAtoms[Binder->leftatom->nr]; // get one atom in the reference molecule
[cee0b57]1236 if (Walker != NULL) // if this Walker exists in the subgraph ...
[266237]1237 for (BondList::const_iterator Runner = Walker->ListOfBonds.begin(); Runner != Walker->ListOfBonds.end(); (++Runner)) {
1238 OtherAtom = (*Runner)->GetOtherAtom(Walker);
1239 if (OtherAtom == ListOfLocalAtoms[(*Runner)->rightatom->nr]) { // found the bond
1240 LocalStack->Push((*Runner));
[a67d19]1241 DoLog(3) && (Log() << Verbose(3) << "Found local edge " << *(*Runner) << "." << endl);
[cee0b57]1242 break;
1243 }
1244 }
[9eefda]1245 Binder = ReferenceStack->PopFirst(); // loop the stack for next item
[a67d19]1246 DoLog(3) && (Log() << Verbose(3) << "Current candidate edge " << Binder << "." << endl);
[cee0b57]1247 ReferenceStack->Push(Binder);
1248 } while (FirstBond != Binder);
1249
1250 return status;
[9eefda]1251}
1252;
[ce7cc5]1253
1254void BreadthFirstSearchAdd_Init(struct BFSAccounting &BFS, atom *&Root, int AtomCount, int BondOrder, atom **AddedAtomList = NULL)
1255{
1256 BFS.AtomCount = AtomCount;
1257 BFS.BondOrder = BondOrder;
[920c70]1258 BFS.PredecessorList = new atom*[AtomCount];
1259 BFS.ShortestPathList = new int[AtomCount];
1260 BFS.ColorList = new enum Shading[AtomCount];
[9eefda]1261 BFS.BFSStack = new StackClass<atom *> (AtomCount);
[ce7cc5]1262
1263 BFS.Root = Root;
[9eefda]1264 BFS.BFSStack->ClearStack();
1265 BFS.BFSStack->Push(Root);
[ce7cc5]1266
1267 // initialise each vertex as white with no predecessor, empty queue, color Root lightgray
[9eefda]1268 for (int i = AtomCount; i--;) {
[920c70]1269 BFS.PredecessorList[i] = NULL;
[ce7cc5]1270 BFS.ShortestPathList[i] = -1;
1271 if ((AddedAtomList != NULL) && (AddedAtomList[i] != NULL)) // mark already present atoms (i.e. Root and maybe others) as visited
1272 BFS.ColorList[i] = lightgray;
1273 else
1274 BFS.ColorList[i] = white;
1275 }
[920c70]1276 //BFS.ShortestPathList[Root->nr] = 0; // done by Calloc
[9eefda]1277}
1278;
[ce7cc5]1279
1280void BreadthFirstSearchAdd_Free(struct BFSAccounting &BFS)
1281{
[920c70]1282 delete[](BFS.PredecessorList);
1283 delete[](BFS.ShortestPathList);
1284 delete[](BFS.ColorList);
[9eefda]1285 delete (BFS.BFSStack);
[ce7cc5]1286 BFS.AtomCount = 0;
[9eefda]1287}
1288;
[ce7cc5]1289
[e138de]1290void BreadthFirstSearchAdd_UnvisitedNode(molecule *Mol, struct BFSAccounting &BFS, atom *&Walker, atom *&OtherAtom, bond *&Binder, bond *&Bond, atom **&AddedAtomList, bond **&AddedBondList, bool IsAngstroem)
[ce7cc5]1291{
1292 if (Binder != Bond) // let other atom white if it's via Root bond. In case it's cyclic it has to be reached again (yet Root is from OtherAtom already black, thus no problem)
1293 BFS.ColorList[OtherAtom->nr] = lightgray;
[9eefda]1294 BFS.PredecessorList[OtherAtom->nr] = Walker; // Walker is the predecessor
1295 BFS.ShortestPathList[OtherAtom->nr] = BFS.ShortestPathList[Walker->nr] + 1;
[68f03d]1296 DoLog(2) && (Log() << Verbose(2) << "Coloring OtherAtom " << OtherAtom->getName() << " " << ((BFS.ColorList[OtherAtom->nr] == white) ? "white" : "lightgray") << ", its predecessor is " << Walker->getName() << " and its Shortest Path is " << BFS.ShortestPathList[OtherAtom->nr] << " egde(s) long." << endl);
[9eefda]1297 if ((((BFS.ShortestPathList[OtherAtom->nr] < BFS.BondOrder) && (Binder != Bond)))) { // Check for maximum distance
[a67d19]1298 DoLog(3) && (Log() << Verbose(3));
[ce7cc5]1299 if (AddedAtomList[OtherAtom->nr] == NULL) { // add if it's not been so far
1300 AddedAtomList[OtherAtom->nr] = Mol->AddCopyAtom(OtherAtom);
[68f03d]1301 DoLog(0) && (Log() << Verbose(0) << "Added OtherAtom " << OtherAtom->getName());
[ce7cc5]1302 AddedBondList[Binder->nr] = Mol->CopyBond(AddedAtomList[Walker->nr], AddedAtomList[OtherAtom->nr], Binder);
[a67d19]1303 DoLog(0) && (Log() << Verbose(0) << " and bond " << *(AddedBondList[Binder->nr]) << ", ");
[9eefda]1304 } else { // this code should actually never come into play (all white atoms are not yet present in BondMolecule, that's why they are white in the first place)
[68f03d]1305 DoLog(0) && (Log() << Verbose(0) << "Not adding OtherAtom " << OtherAtom->getName());
[ce7cc5]1306 if (AddedBondList[Binder->nr] == NULL) {
1307 AddedBondList[Binder->nr] = Mol->CopyBond(AddedAtomList[Walker->nr], AddedAtomList[OtherAtom->nr], Binder);
[a67d19]1308 DoLog(0) && (Log() << Verbose(0) << ", added Bond " << *(AddedBondList[Binder->nr]));
[ce7cc5]1309 } else
[a67d19]1310 DoLog(0) && (Log() << Verbose(0) << ", not added Bond ");
[ce7cc5]1311 }
[a67d19]1312 DoLog(0) && (Log() << Verbose(0) << ", putting OtherAtom into queue." << endl);
[9eefda]1313 BFS.BFSStack->Push(OtherAtom);
[ce7cc5]1314 } else { // out of bond order, then replace
1315 if ((AddedAtomList[OtherAtom->nr] == NULL) && (Binder->Cyclic))
1316 BFS.ColorList[OtherAtom->nr] = white; // unmark if it has not been queued/added, to make it available via its other bonds (cyclic)
1317 if (Binder == Bond)
[a67d19]1318 DoLog(3) && (Log() << Verbose(3) << "Not Queueing, is the Root bond");
[ce7cc5]1319 else if (BFS.ShortestPathList[OtherAtom->nr] >= BFS.BondOrder)
[a67d19]1320 DoLog(3) && (Log() << Verbose(3) << "Not Queueing, is out of Bond Count of " << BFS.BondOrder);
[ce7cc5]1321 if (!Binder->Cyclic)
[a67d19]1322 DoLog(0) && (Log() << Verbose(0) << ", is not part of a cyclic bond, saturating bond with Hydrogen." << endl);
[ce7cc5]1323 if (AddedBondList[Binder->nr] == NULL) {
1324 if ((AddedAtomList[OtherAtom->nr] != NULL)) { // .. whether we add or saturate
1325 AddedBondList[Binder->nr] = Mol->CopyBond(AddedAtomList[Walker->nr], AddedAtomList[OtherAtom->nr], Binder);
1326 } else {
[9eefda]1327#ifdef ADDHYDROGEN
[e138de]1328 if (!Mol->AddHydrogenReplacementAtom(Binder, AddedAtomList[Walker->nr], Walker, OtherAtom, IsAngstroem))
[9eefda]1329 exit(1);
1330#endif
[ce7cc5]1331 }
1332 }
1333 }
[9eefda]1334}
1335;
[ce7cc5]1336
[e138de]1337void BreadthFirstSearchAdd_VisitedNode(molecule *Mol, struct BFSAccounting &BFS, atom *&Walker, atom *&OtherAtom, bond *&Binder, bond *&Bond, atom **&AddedAtomList, bond **&AddedBondList, bool IsAngstroem)
[ce7cc5]1338{
[a67d19]1339 DoLog(3) && (Log() << Verbose(3) << "Not Adding, has already been visited." << endl);
[ce7cc5]1340 // This has to be a cyclic bond, check whether it's present ...
1341 if (AddedBondList[Binder->nr] == NULL) {
[9eefda]1342 if ((Binder != Bond) && (Binder->Cyclic) && (((BFS.ShortestPathList[Walker->nr] + 1) < BFS.BondOrder))) {
[ce7cc5]1343 AddedBondList[Binder->nr] = Mol->CopyBond(AddedAtomList[Walker->nr], AddedAtomList[OtherAtom->nr], Binder);
1344 } else { // if it's root bond it has to broken (otherwise we would not create the fragments)
[9eefda]1345#ifdef ADDHYDROGEN
[e138de]1346 if(!Mol->AddHydrogenReplacementAtom(Binder, AddedAtomList[Walker->nr], Walker, OtherAtom, IsAngstroem))
[9eefda]1347 exit(1);
1348#endif
[ce7cc5]1349 }
1350 }
[9eefda]1351}
1352;
[cee0b57]1353
1354/** Adds atoms up to \a BondCount distance from \a *Root and notes them down in \a **AddedAtomList.
1355 * Gray vertices are always enqueued in an StackClass<atom *> FIFO queue, the rest is usual BFS with adding vertices found was
1356 * white and putting into queue.
1357 * \param *out output stream for debugging
1358 * \param *Mol Molecule class to add atoms to
1359 * \param **AddedAtomList list with added atom pointers, index is atom father's number
1360 * \param **AddedBondList list with added bond pointers, index is bond father's number
1361 * \param *Root root vertex for BFS
1362 * \param *Bond bond not to look beyond
1363 * \param BondOrder maximum distance for vertices to add
1364 * \param IsAngstroem lengths are in angstroem or bohrradii
1365 */
[e138de]1366void molecule::BreadthFirstSearchAdd(molecule *Mol, atom **&AddedAtomList, bond **&AddedBondList, atom *Root, bond *Bond, int BondOrder, bool IsAngstroem)
[cee0b57]1367{
[ce7cc5]1368 struct BFSAccounting BFS;
[cee0b57]1369 atom *Walker = NULL, *OtherAtom = NULL;
[ce7cc5]1370 bond *Binder = NULL;
[cee0b57]1371
1372 // add Root if not done yet
[9eefda]1373 if (AddedAtomList[Root->nr] == NULL) // add Root if not yet present
[cee0b57]1374 AddedAtomList[Root->nr] = Mol->AddCopyAtom(Root);
1375
[ea7176]1376 BreadthFirstSearchAdd_Init(BFS, Root, BondOrder, getAtomCount(), AddedAtomList);
[cee0b57]1377
1378 // and go on ... Queue always contains all lightgray vertices
[9eefda]1379 while (!BFS.BFSStack->IsEmpty()) {
[cee0b57]1380 // we have to pop the oldest atom from stack. This keeps the atoms on the stack always of the same ShortestPath distance.
1381 // e.g. if current atom is 2, push to end of stack are of length 3, but first all of length 2 would be popped. They again
1382 // append length of 3 (their neighbours). Thus on stack we have always atoms of a certain length n at bottom of stack and
1383 // followed by n+1 till top of stack.
[9eefda]1384 Walker = BFS.BFSStack->PopFirst(); // pop oldest added
[68f03d]1385 DoLog(1) && (Log() << Verbose(1) << "Current Walker is: " << Walker->getName() << ", and has " << Walker->ListOfBonds.size() << " bonds." << endl);
[266237]1386 for (BondList::const_iterator Runner = Walker->ListOfBonds.begin(); Runner != Walker->ListOfBonds.end(); (++Runner)) {
1387 if ((*Runner) != NULL) { // don't look at bond equal NULL
[ce7cc5]1388 Binder = (*Runner);
[266237]1389 OtherAtom = (*Runner)->GetOtherAtom(Walker);
[68f03d]1390 DoLog(2) && (Log() << Verbose(2) << "Current OtherAtom is: " << OtherAtom->getName() << " for bond " << *(*Runner) << "." << endl);
[ce7cc5]1391 if (BFS.ColorList[OtherAtom->nr] == white) {
[e138de]1392 BreadthFirstSearchAdd_UnvisitedNode(Mol, BFS, Walker, OtherAtom, Binder, Bond, AddedAtomList, AddedBondList, IsAngstroem);
[cee0b57]1393 } else {
[e138de]1394 BreadthFirstSearchAdd_VisitedNode(Mol, BFS, Walker, OtherAtom, Binder, Bond, AddedAtomList, AddedBondList, IsAngstroem);
[cee0b57]1395 }
1396 }
1397 }
[ce7cc5]1398 BFS.ColorList[Walker->nr] = black;
[68f03d]1399 DoLog(1) && (Log() << Verbose(1) << "Coloring Walker " << Walker->getName() << " black." << endl);
[cee0b57]1400 }
[ce7cc5]1401 BreadthFirstSearchAdd_Free(BFS);
[9eefda]1402}
1403;
[cee0b57]1404
[266237]1405/** Adds a bond as a copy to a given one
1406 * \param *left leftatom of new bond
1407 * \param *right rightatom of new bond
1408 * \param *CopyBond rest of fields in bond are copied from this
1409 * \return pointer to new bond
1410 */
1411bond * molecule::CopyBond(atom *left, atom *right, bond *CopyBond)
1412{
1413 bond *Binder = AddBond(left, right, CopyBond->BondDegree);
1414 Binder->Cyclic = CopyBond->Cyclic;
1415 Binder->Type = CopyBond->Type;
1416 return Binder;
[9eefda]1417}
1418;
[266237]1419
[e138de]1420void BuildInducedSubgraph_Init(atom **&ParentList, int AtomCount)
[cee0b57]1421{
1422 // reset parent list
[920c70]1423 ParentList = new atom*[AtomCount];
1424 for (int i=0;i<AtomCount;i++)
1425 ParentList[i] = NULL;
[a67d19]1426 DoLog(3) && (Log() << Verbose(3) << "Resetting ParentList." << endl);
[9eefda]1427}
1428;
[cee0b57]1429
[e138de]1430void BuildInducedSubgraph_FillParentList(const molecule *mol, const molecule *Father, atom **&ParentList)
[43587e]1431{
[cee0b57]1432 // fill parent list with sons
[a67d19]1433 DoLog(3) && (Log() << Verbose(3) << "Filling Parent List." << endl);
[9879f6]1434 for (molecule::const_iterator iter = mol->begin(); iter != mol->end(); ++iter) {
1435 ParentList[(*iter)->father->nr] = (*iter);
[cee0b57]1436 // Outputting List for debugging
[a7b761b]1437 DoLog(4) && (Log() << Verbose(4) << "Son[" << (*iter)->father->nr << "] of " << (*iter)->father << " is " << ParentList[(*iter)->father->nr] << "." << endl);
[cee0b57]1438 }
[a7b761b]1439};
[43587e]1440
[e138de]1441void BuildInducedSubgraph_Finalize(atom **&ParentList)
[43587e]1442{
[920c70]1443 delete[](ParentList);
[9eefda]1444}
1445;
[43587e]1446
[e138de]1447bool BuildInducedSubgraph_CreateBondsFromParent(molecule *mol, const molecule *Father, atom **&ParentList)
[43587e]1448{
1449 bool status = true;
1450 atom *OtherAtom = NULL;
[cee0b57]1451 // check each entry of parent list and if ok (one-to-and-onto matching) create bonds
[a67d19]1452 DoLog(3) && (Log() << Verbose(3) << "Creating bonds." << endl);
[9879f6]1453 for (molecule::const_iterator iter = Father->begin(); iter != Father->end(); ++iter) {
1454 if (ParentList[(*iter)->nr] != NULL) {
1455 if (ParentList[(*iter)->nr]->father != (*iter)) {
[cee0b57]1456 status = false;
1457 } else {
[9879f6]1458 for (BondList::const_iterator Runner = (*iter)->ListOfBonds.begin(); Runner != (*iter)->ListOfBonds.end(); (++Runner)) {
1459 OtherAtom = (*Runner)->GetOtherAtom((*iter));
[cee0b57]1460 if (ParentList[OtherAtom->nr] != NULL) { // if otheratom is also a father of an atom on this molecule, create the bond
[a7b761b]1461 DoLog(4) && (Log() << Verbose(4) << "Endpoints of Bond " << (*Runner) << " are both present: " << ParentList[(*iter)->nr]->getName() << " and " << ParentList[OtherAtom->nr]->getName() << "." << endl);
[9879f6]1462 mol->AddBond(ParentList[(*iter)->nr], ParentList[OtherAtom->nr], (*Runner)->BondDegree);
[cee0b57]1463 }
1464 }
1465 }
1466 }
1467 }
[43587e]1468 return status;
[9eefda]1469}
1470;
[cee0b57]1471
[43587e]1472/** Adds bond structure to this molecule from \a Father molecule.
1473 * This basically causes this molecule to become an induced subgraph of the \a Father, i.e. for every bond in Father
1474 * with end points present in this molecule, bond is created in this molecule.
1475 * Special care was taken to ensure that this is of complexity O(N), where N is the \a Father's molecule::AtomCount.
1476 * \param *out output stream for debugging
1477 * \param *Father father molecule
1478 * \return true - is induced subgraph, false - there are atoms with fathers not in \a Father
1479 * \todo not checked, not fully working probably
1480 */
[e138de]1481bool molecule::BuildInducedSubgraph(const molecule *Father)
[43587e]1482{
1483 bool status = true;
1484 atom **ParentList = NULL;
[a67d19]1485 DoLog(2) && (Log() << Verbose(2) << "Begin of BuildInducedSubgraph." << endl);
[ea7176]1486 BuildInducedSubgraph_Init(ParentList, Father->getAtomCount());
[e138de]1487 BuildInducedSubgraph_FillParentList(this, Father, ParentList);
1488 status = BuildInducedSubgraph_CreateBondsFromParent(this, Father, ParentList);
1489 BuildInducedSubgraph_Finalize(ParentList);
[a67d19]1490 DoLog(2) && (Log() << Verbose(2) << "End of BuildInducedSubgraph." << endl);
[cee0b57]1491 return status;
[9eefda]1492}
1493;
[cee0b57]1494
1495/** For a given keyset \a *Fragment, checks whether it is connected in the current molecule.
1496 * \param *out output stream for debugging
1497 * \param *Fragment Keyset of fragment's vertices
1498 * \return true - connected, false - disconnected
1499 * \note this is O(n^2) for it's just a bug checker not meant for permanent use!
1500 */
[e138de]1501bool molecule::CheckForConnectedSubgraph(KeySet *Fragment)
[cee0b57]1502{
1503 atom *Walker = NULL, *Walker2 = NULL;
1504 bool BondStatus = false;
1505 int size;
1506
[a67d19]1507 DoLog(1) && (Log() << Verbose(1) << "Begin of CheckForConnectedSubgraph" << endl);
1508 DoLog(2) && (Log() << Verbose(2) << "Disconnected atom: ");
[cee0b57]1509
1510 // count number of atoms in graph
1511 size = 0;
[9eefda]1512 for (KeySet::iterator runner = Fragment->begin(); runner != Fragment->end(); runner++)
[cee0b57]1513 size++;
1514 if (size > 1)
[9eefda]1515 for (KeySet::iterator runner = Fragment->begin(); runner != Fragment->end(); runner++) {
[cee0b57]1516 Walker = FindAtom(*runner);
1517 BondStatus = false;
[9eefda]1518 for (KeySet::iterator runners = Fragment->begin(); runners != Fragment->end(); runners++) {
[cee0b57]1519 Walker2 = FindAtom(*runners);
[266237]1520 for (BondList::const_iterator Runner = Walker->ListOfBonds.begin(); Runner != Walker->ListOfBonds.end(); (++Runner)) {
1521 if ((*Runner)->GetOtherAtom(Walker) == Walker2) {
[cee0b57]1522 BondStatus = true;
1523 break;
1524 }
1525 if (BondStatus)
1526 break;
1527 }
1528 }
1529 if (!BondStatus) {
[a67d19]1530 DoLog(0) && (Log() << Verbose(0) << (*Walker) << endl);
[cee0b57]1531 return false;
1532 }
1533 }
1534 else {
[a67d19]1535 DoLog(0) && (Log() << Verbose(0) << "none." << endl);
[cee0b57]1536 return true;
1537 }
[a67d19]1538 DoLog(0) && (Log() << Verbose(0) << "none." << endl);
[cee0b57]1539
[a67d19]1540 DoLog(1) && (Log() << Verbose(1) << "End of CheckForConnectedSubgraph" << endl);
[cee0b57]1541
1542 return true;
1543}
Note: See TracBrowser for help on using the repository browser.