source: src/molecule_fragmentation.cpp@ a479fa

Action_Thermostats Add_AtomRandomPerturbation Add_FitFragmentPartialChargesAction Add_RotateAroundBondAction Add_SelectAtomByNameAction Added_ParseSaveFragmentResults AddingActions_SaveParseParticleParameters Adding_Graph_to_ChangeBondActions Adding_MD_integration_tests Adding_ParticleName_to_Atom Adding_StructOpt_integration_tests AtomFragments Automaking_mpqc_open AutomationFragmentation_failures Candidate_v1.5.4 Candidate_v1.6.0 Candidate_v1.6.1 ChangeBugEmailaddress ChangingTestPorts ChemicalSpaceEvaluator CombiningParticlePotentialParsing Combining_Subpackages Debian_Package_split Debian_package_split_molecuildergui_only Disabling_MemDebug Docu_Python_wait EmpiricalPotential_contain_HomologyGraph EmpiricalPotential_contain_HomologyGraph_documentation Enable_parallel_make_install Enhance_userguide Enhanced_StructuralOptimization Enhanced_StructuralOptimization_continued Example_ManyWaysToTranslateAtom Exclude_Hydrogens_annealWithBondGraph FitPartialCharges_GlobalError Fix_BoundInBox_CenterInBox_MoleculeActions Fix_ChargeSampling_PBC Fix_ChronosMutex Fix_FitPartialCharges Fix_FitPotential_needs_atomicnumbers Fix_ForceAnnealing Fix_IndependentFragmentGrids Fix_ParseParticles Fix_ParseParticles_split_forward_backward_Actions Fix_PopActions Fix_QtFragmentList_sorted_selection Fix_Restrictedkeyset_FragmentMolecule Fix_StatusMsg Fix_StepWorldTime_single_argument Fix_Verbose_Codepatterns Fix_fitting_potentials Fixes ForceAnnealing_goodresults ForceAnnealing_oldresults ForceAnnealing_tocheck ForceAnnealing_with_BondGraph ForceAnnealing_with_BondGraph_continued ForceAnnealing_with_BondGraph_continued_betteresults ForceAnnealing_with_BondGraph_contraction-expansion FragmentAction_writes_AtomFragments FragmentMolecule_checks_bonddegrees GeometryObjects Gui_Fixes Gui_displays_atomic_force_velocity ImplicitCharges IndependentFragmentGrids IndependentFragmentGrids_IndividualZeroInstances IndependentFragmentGrids_IntegrationTest IndependentFragmentGrids_Sole_NN_Calculation JobMarket_RobustOnKillsSegFaults JobMarket_StableWorkerPool JobMarket_unresolvable_hostname_fix MoreRobust_FragmentAutomation ODR_violation_mpqc_open PartialCharges_OrthogonalSummation PdbParser_setsAtomName PythonUI_with_named_parameters QtGui_reactivate_TimeChanged_changes Recreated_GuiChecks Rewrite_FitPartialCharges RotateToPrincipalAxisSystem_UndoRedo SaturateAtoms_findBestMatching SaturateAtoms_singleDegree StoppableMakroAction Subpackage_CodePatterns Subpackage_JobMarket Subpackage_LinearAlgebra Subpackage_levmar Subpackage_mpqc_open Subpackage_vmg Switchable_LogView ThirdParty_MPQC_rebuilt_buildsystem TrajectoryDependenant_MaxOrder TremoloParser_IncreasedPrecision TremoloParser_MultipleTimesteps TremoloParser_setsAtomName Ubuntu_1604_changes stable
Last change on this file since a479fa was a479fa, checked in by Frederik Heber <heber@…>, 14 years ago

Renamed ParticleInfo::nr to ParticleInfo::ParticleInfo_nr for easier privatization.

  • Property mode set to 100644
File size: 83.2 KB
RevLine 
[bcf653]1/*
2 * Project: MoleCuilder
3 * Description: creates and alters molecular systems
4 * Copyright (C) 2010 University of Bonn. All rights reserved.
5 * Please see the LICENSE file or "Copyright notice" in builder.cpp for details.
6 */
7
[cee0b57]8/*
9 * molecule_fragmentation.cpp
10 *
11 * Created on: Oct 5, 2009
12 * Author: heber
13 */
14
[bf3817]15// include config.h
16#ifdef HAVE_CONFIG_H
17#include <config.h>
18#endif
19
[ad011c]20#include "CodePatterns/MemDebug.hpp"
[112b09]21
[49e1ae]22#include <cstring>
23
[cbc5fb]24#include "World.hpp"
[f66195]25#include "atom.hpp"
26#include "bond.hpp"
[cee0b57]27#include "config.hpp"
[f66195]28#include "element.hpp"
[952f38]29#include "Helpers/helpers.hpp"
[ad011c]30#include "CodePatterns/Verbose.hpp"
31#include "CodePatterns/Log.hpp"
[cee0b57]32#include "molecule.hpp"
[f66195]33#include "periodentafel.hpp"
[b34306]34#include "World.hpp"
[cca9ef]35#include "LinearAlgebra/RealSpaceMatrix.hpp"
[84c494]36#include "Box.hpp"
[cee0b57]37
38/************************************* Functions for class molecule *********************************/
39
40
41/** Estimates by educated guessing (using upper limit) the expected number of fragments.
42 * The upper limit is
43 * \f[
44 * n = N \cdot C^k
45 * \f]
46 * where \f$C=2^c\f$ and c is the maximum bond degree over N number of atoms.
47 * \param *out output stream for debugging
48 * \param order bond order k
49 * \return number n of fragments
50 */
[e138de]51int molecule::GuesstimateFragmentCount(int order)
[cee0b57]52{
[266237]53 size_t c = 0;
[cee0b57]54 int FragmentCount;
55 // get maximum bond degree
[9879f6]56 for (molecule::const_iterator iter = begin(); iter != end(); ++iter) {
[9d83b6]57 const BondList& ListOfBonds = (*iter)->getListOfBonds();
58 c = (ListOfBonds.size() > c) ? ListOfBonds.size() : c;
[cee0b57]59 }
60 FragmentCount = NoNonHydrogen*(1 << (c*order));
[a67d19]61 DoLog(1) && (Log() << Verbose(1) << "Upper limit for this subgraph is " << FragmentCount << " for " << NoNonHydrogen << " non-H atoms with maximum bond degree of " << c << "." << endl);
[cee0b57]62 return FragmentCount;
63};
64
65/** Scans a single line for number and puts them into \a KeySet.
66 * \param *out output stream for debugging
67 * \param *buffer buffer to scan
68 * \param &CurrentSet filled KeySet on return
69 * \return true - at least one valid atom id parsed, false - CurrentSet is empty
70 */
[e138de]71bool ScanBufferIntoKeySet(char *buffer, KeySet &CurrentSet)
[cee0b57]72{
73 stringstream line;
74 int AtomNr;
75 int status = 0;
76
77 line.str(buffer);
78 while (!line.eof()) {
79 line >> AtomNr;
[5034e1]80 if (AtomNr >= 0) {
[cee0b57]81 CurrentSet.insert(AtomNr); // insert at end, hence in same order as in file!
82 status++;
83 } // else it's "-1" or else and thus must not be added
84 }
[a67d19]85 DoLog(1) && (Log() << Verbose(1) << "The scanned KeySet is ");
[cee0b57]86 for(KeySet::iterator runner = CurrentSet.begin(); runner != CurrentSet.end(); runner++) {
[a67d19]87 DoLog(0) && (Log() << Verbose(0) << (*runner) << "\t");
[cee0b57]88 }
[a67d19]89 DoLog(0) && (Log() << Verbose(0) << endl);
[cee0b57]90 return (status != 0);
91};
92
93/** Parses the KeySet file and fills \a *FragmentList from the known molecule structure.
94 * Does two-pass scanning:
95 * -# Scans the keyset file and initialises a temporary graph
96 * -# Scans TEFactors file and sets the TEFactor of each key set in the temporary graph accordingly
97 * Finally, the temporary graph is inserted into the given \a FragmentList for return.
[35b698]98 * \param &path path to file
[cee0b57]99 * \param *FragmentList empty, filled on return
100 * \return true - parsing successfully, false - failure on parsing (FragmentList will be NULL)
101 */
[35b698]102bool ParseKeySetFile(std::string &path, Graph *&FragmentList)
[cee0b57]103{
104 bool status = true;
105 ifstream InputFile;
106 stringstream line;
107 GraphTestPair testGraphInsert;
108 int NumberOfFragments = 0;
[35b698]109 string filename;
[cee0b57]110
111 if (FragmentList == NULL) { // check list pointer
112 FragmentList = new Graph;
113 }
114
115 // 1st pass: open file and read
[a67d19]116 DoLog(1) && (Log() << Verbose(1) << "Parsing the KeySet file ... " << endl);
[35b698]117 filename = path + KEYSETFILE;
118 InputFile.open(filename.c_str());
119 if (InputFile.good()) {
[cee0b57]120 // each line represents a new fragment
[920c70]121 char buffer[MAXSTRINGSIZE];
[cee0b57]122 // 1. parse keysets and insert into temp. graph
123 while (!InputFile.eof()) {
124 InputFile.getline(buffer, MAXSTRINGSIZE);
125 KeySet CurrentSet;
[e138de]126 if ((strlen(buffer) > 0) && (ScanBufferIntoKeySet(buffer, CurrentSet))) { // if at least one valid atom was added, write config
[cee0b57]127 testGraphInsert = FragmentList->insert(GraphPair (CurrentSet,pair<int,double>(NumberOfFragments++,1))); // store fragment number and current factor
128 if (!testGraphInsert.second) {
[58ed4a]129 DoeLog(0) && (eLog()<< Verbose(0) << "KeySet file must be corrupt as there are two equal key sets therein!" << endl);
[e359a8]130 performCriticalExit();
[cee0b57]131 }
132 }
133 }
134 // 2. Free and done
135 InputFile.close();
136 InputFile.clear();
[0de7e8]137 DoLog(1) && (Log() << Verbose(1) << "\t ... done." << endl);
[cee0b57]138 } else {
[0de7e8]139 DoLog(1) && (Log() << Verbose(1) << "\t ... File " << filename << " not found." << endl);
[cee0b57]140 status = false;
141 }
142
[5034e1]143 return status;
144};
145
146/** Parses the TE factors file and fills \a *FragmentList from the known molecule structure.
147 * -# Scans TEFactors file and sets the TEFactor of each key set in the temporary graph accordingly
148 * \param *out output stream for debugging
149 * \param *path path to file
150 * \param *FragmentList graph whose nodes's TE factors are set on return
151 * \return true - parsing successfully, false - failure on parsing
152 */
[e138de]153bool ParseTEFactorsFile(char *path, Graph *FragmentList)
[5034e1]154{
155 bool status = true;
156 ifstream InputFile;
157 stringstream line;
158 GraphTestPair testGraphInsert;
159 int NumberOfFragments = 0;
160 double TEFactor;
[920c70]161 char filename[MAXSTRINGSIZE];
[5034e1]162
163 if (FragmentList == NULL) { // check list pointer
164 FragmentList = new Graph;
165 }
166
[cee0b57]167 // 2nd pass: open TEFactors file and read
[a67d19]168 DoLog(1) && (Log() << Verbose(1) << "Parsing the TEFactors file ... " << endl);
[cee0b57]169 sprintf(filename, "%s/%s%s", path, FRAGMENTPREFIX, TEFACTORSFILE);
170 InputFile.open(filename);
171 if (InputFile != NULL) {
172 // 3. add found TEFactors to each keyset
173 NumberOfFragments = 0;
174 for(Graph::iterator runner = FragmentList->begin();runner != FragmentList->end(); runner++) {
175 if (!InputFile.eof()) {
176 InputFile >> TEFactor;
177 (*runner).second.second = TEFactor;
[a67d19]178 DoLog(2) && (Log() << Verbose(2) << "Setting " << ++NumberOfFragments << " fragment's TEFactor to " << (*runner).second.second << "." << endl);
[cee0b57]179 } else {
180 status = false;
181 break;
182 }
183 }
184 // 4. Free and done
185 InputFile.close();
[a67d19]186 DoLog(1) && (Log() << Verbose(1) << "done." << endl);
[cee0b57]187 } else {
[a67d19]188 DoLog(1) && (Log() << Verbose(1) << "File " << filename << " not found." << endl);
[cee0b57]189 status = false;
190 }
191
192 return status;
193};
194
[5034e1]195/** Stores key sets to file.
196 * \param KeySetList Graph with Keysets
[35b698]197 * \param &path path to file
[cee0b57]198 * \return true - file written successfully, false - writing failed
199 */
[35b698]200bool StoreKeySetFile(Graph &KeySetList, std::string &path)
[cee0b57]201{
202 bool status = true;
[35b698]203 string line = path + KEYSETFILE;
204 ofstream output(line.c_str());
[cee0b57]205
206 // open KeySet file
[a67d19]207 DoLog(1) && (Log() << Verbose(1) << "Saving key sets of the total graph ... ");
[35b698]208 if(output.good()) {
[cee0b57]209 for(Graph::iterator runner = KeySetList.begin(); runner != KeySetList.end(); runner++) {
210 for (KeySet::iterator sprinter = (*runner).first.begin();sprinter != (*runner).first.end(); sprinter++) {
211 if (sprinter != (*runner).first.begin())
212 output << "\t";
213 output << *sprinter;
214 }
215 output << endl;
216 }
[a67d19]217 DoLog(0) && (Log() << Verbose(0) << "done." << endl);
[cee0b57]218 } else {
[58ed4a]219 DoeLog(0) && (eLog()<< Verbose(0) << "Unable to open " << line << " for writing keysets!" << endl);
[e359a8]220 performCriticalExit();
[cee0b57]221 status = false;
222 }
223 output.close();
224 output.clear();
225
[5034e1]226 return status;
227};
228
229
230/** Stores TEFactors to file.
231 * \param *out output stream for debugging
232 * \param KeySetList Graph with factors
233 * \param *path path to file
234 * \return true - file written successfully, false - writing failed
235 */
[e138de]236bool StoreTEFactorsFile(Graph &KeySetList, char *path)
[5034e1]237{
238 ofstream output;
239 bool status = true;
240 string line;
241
[cee0b57]242 // open TEFactors file
243 line = path;
244 line.append("/");
245 line += FRAGMENTPREFIX;
246 line += TEFACTORSFILE;
247 output.open(line.c_str(), ios::out);
[a67d19]248 DoLog(1) && (Log() << Verbose(1) << "Saving TEFactors of the total graph ... ");
[cee0b57]249 if(output != NULL) {
250 for(Graph::iterator runner = KeySetList.begin(); runner != KeySetList.end(); runner++)
251 output << (*runner).second.second << endl;
[a67d19]252 DoLog(1) && (Log() << Verbose(1) << "done." << endl);
[cee0b57]253 } else {
[a67d19]254 DoLog(1) && (Log() << Verbose(1) << "failed to open " << line << "." << endl);
[cee0b57]255 status = false;
256 }
257 output.close();
258
259 return status;
260};
261
[5034e1]262/** For a given graph, sorts KeySets into a (index, keyset) map.
263 * \param *GlobalKeySetList list of keysets with global ids (valid in "this" molecule) needed for adaptive increase
264 * \return map from index to keyset
265 */
266map<int,KeySet> * GraphToIndexedKeySet(Graph *GlobalKeySetList)
267{
268 map<int,KeySet> *IndexKeySetList = new map<int,KeySet>;
269 for(Graph::iterator runner = GlobalKeySetList->begin(); runner != GlobalKeySetList->end(); runner++) {
270 IndexKeySetList->insert( pair<int,KeySet>(runner->second.first,runner->first) );
271 }
272 return IndexKeySetList;
273};
274
275/** Inserts a (\a No, \a value) pair into the list, overwriting present one.
276 * Note if values are equal, No will decided on which is first
277 * \param *out output stream for debugging
278 * \param &AdaptiveCriteriaList list to insert into
279 * \param &IndexedKeySetList list to find key set for a given index \a No
280 * \param FragOrder current bond order of fragment
281 * \param No index of keyset
282 * \param value energy value
283 */
[e138de]284void InsertIntoAdaptiveCriteriaList(map<int, pair<double,int> > *AdaptiveCriteriaList, map<int,KeySet> &IndexKeySetList, int FragOrder, int No, double Value)
[5034e1]285{
286 map<int,KeySet>::iterator marker = IndexKeySetList.find(No); // find keyset to Frag No.
287 if (marker != IndexKeySetList.end()) { // if found
288 Value *= 1 + MYEPSILON*(*((*marker).second.begin())); // in case of equal energies this makes them not equal without changing anything actually
289 // as the smallest number in each set has always been the root (we use global id to keep the doubles away), seek smallest and insert into AtomMask
290 pair <map<int, pair<double,int> >::iterator, bool> InsertedElement = AdaptiveCriteriaList->insert( make_pair(*((*marker).second.begin()), pair<double,int>( fabs(Value), FragOrder) ));
291 map<int, pair<double,int> >::iterator PresentItem = InsertedElement.first;
292 if (!InsertedElement.second) { // this root is already present
293 if ((*PresentItem).second.second < FragOrder) // if order there is lower, update entry with higher-order term
294 //if ((*PresentItem).second.first < (*runner).first) // as higher-order terms are not always better, we skip this part (which would always include this site into adaptive increase)
295 { // if value is smaller, update value and order
296 (*PresentItem).second.first = fabs(Value);
297 (*PresentItem).second.second = FragOrder;
[a67d19]298 DoLog(2) && (Log() << Verbose(2) << "Updated element (" << (*PresentItem).first << ",[" << (*PresentItem).second.first << "," << (*PresentItem).second.second << "])." << endl);
[5034e1]299 } else {
[a67d19]300 DoLog(2) && (Log() << Verbose(2) << "Did not update element " << (*PresentItem).first << " as " << FragOrder << " is less than or equal to " << (*PresentItem).second.second << "." << endl);
[5034e1]301 }
302 } else {
[a67d19]303 DoLog(2) && (Log() << Verbose(2) << "Inserted element (" << (*PresentItem).first << ",[" << (*PresentItem).second.first << "," << (*PresentItem).second.second << "])." << endl);
[5034e1]304 }
305 } else {
[a67d19]306 DoLog(1) && (Log() << Verbose(1) << "No Fragment under No. " << No << "found." << endl);
[5034e1]307 }
308};
309
[a0064e]310/** Counts lines in file.
311 * Note we are scanning lines from current position, not from beginning.
312 * \param InputFile file to be scanned.
313 */
314int CountLinesinFile(ifstream &InputFile)
315{
316 char *buffer = new char[MAXSTRINGSIZE];
317 int lines=0;
318
319 int PositionMarker = InputFile.tellg(); // not needed as Inputfile is copied, given by value, not by ref
320 // count the number of lines, i.e. the number of fragments
321 InputFile.getline(buffer, MAXSTRINGSIZE); // skip comment lines
322 InputFile.getline(buffer, MAXSTRINGSIZE);
323 while(!InputFile.eof()) {
324 InputFile.getline(buffer, MAXSTRINGSIZE);
325 lines++;
326 }
327 InputFile.seekg(PositionMarker, ios::beg);
328 delete[](buffer);
329 return lines;
330};
331
332
[5034e1]333/** Scans the adaptive order file and insert (index, value) into map.
[35b698]334 * \param &path path to ENERGYPERFRAGMENT file (may be NULL if Order is non-negative)
[5034e1]335 * \param &IndexedKeySetList list to find key set for a given index \a No
336 * \return adaptive criteria list from file
337 */
[35b698]338map<int, pair<double,int> > * ScanAdaptiveFileIntoMap(std::string &path, map<int,KeySet> &IndexKeySetList)
[5034e1]339{
340 map<int, pair<double,int> > *AdaptiveCriteriaList = new map<int, pair<double,int> >;
341 int No = 0, FragOrder = 0;
342 double Value = 0.;
[920c70]343 char buffer[MAXSTRINGSIZE];
[35b698]344 string filename = path + ENERGYPERFRAGMENT;
345 ifstream InputFile(filename.c_str());
346
347 if (InputFile.fail()) {
348 DoeLog(1) && (eLog() << Verbose(1) << "Cannot find file " << filename << "." << endl);
349 return AdaptiveCriteriaList;
350 }
[5034e1]351
352 if (CountLinesinFile(InputFile) > 0) {
[a479fa]353 // each line represents a fragment root (Atom::ParticleInfo_nr) id and its energy contribution
[5034e1]354 InputFile.getline(buffer, MAXSTRINGSIZE); // skip comment lines
355 InputFile.getline(buffer, MAXSTRINGSIZE);
356 while(!InputFile.eof()) {
357 InputFile.getline(buffer, MAXSTRINGSIZE);
358 if (strlen(buffer) > 2) {
[e138de]359 //Log() << Verbose(2) << "Scanning: " << buffer << endl;
[5034e1]360 stringstream line(buffer);
361 line >> FragOrder;
362 line >> ws >> No;
363 line >> ws >> Value; // skip time entry
364 line >> ws >> Value;
365 No -= 1; // indices start at 1 in file, not 0
[e138de]366 //Log() << Verbose(2) << " - yields (" << No << "," << Value << ", " << FragOrder << ")" << endl;
[5034e1]367
368 // clean the list of those entries that have been superceded by higher order terms already
[e138de]369 InsertIntoAdaptiveCriteriaList(AdaptiveCriteriaList, IndexKeySetList, FragOrder, No, Value);
[5034e1]370 }
371 }
372 // close and done
373 InputFile.close();
374 InputFile.clear();
375 }
376
377 return AdaptiveCriteriaList;
378};
379
380/** Maps adaptive criteria list back onto (Value, (Root Nr., Order))
381 * (i.e. sorted by value to pick the highest ones)
382 * \param *out output stream for debugging
383 * \param &AdaptiveCriteriaList list to insert into
384 * \param *mol molecule with atoms
385 * \return remapped list
386 */
[e138de]387map<double, pair<int,int> > * ReMapAdaptiveCriteriaListToValue(map<int, pair<double,int> > *AdaptiveCriteriaList, molecule *mol)
[5034e1]388{
[9879f6]389 atom *Walker = NULL;
[5034e1]390 map<double, pair<int,int> > *FinalRootCandidates = new map<double, pair<int,int> > ;
[a67d19]391 DoLog(1) && (Log() << Verbose(1) << "Root candidate list is: " << endl);
[5034e1]392 for(map<int, pair<double,int> >::iterator runner = AdaptiveCriteriaList->begin(); runner != AdaptiveCriteriaList->end(); runner++) {
393 Walker = mol->FindAtom((*runner).first);
394 if (Walker != NULL) {
395 //if ((*runner).second.second >= Walker->AdaptiveOrder) { // only insert if this is an "active" root site for the current order
396 if (!Walker->MaxOrder) {
[a67d19]397 DoLog(2) && (Log() << Verbose(2) << "(" << (*runner).first << ",[" << (*runner).second.first << "," << (*runner).second.second << "])" << endl);
[5034e1]398 FinalRootCandidates->insert( make_pair( (*runner).second.first, pair<int,int>((*runner).first, (*runner).second.second) ) );
399 } else {
[a67d19]400 DoLog(2) && (Log() << Verbose(2) << "Excluding (" << *Walker << ", " << (*runner).first << ",[" << (*runner).second.first << "," << (*runner).second.second << "]), as it has reached its maximum order." << endl);
[5034e1]401 }
402 } else {
[58ed4a]403 DoeLog(0) && (eLog()<< Verbose(0) << "Atom No. " << (*runner).second.first << " was not found in this molecule." << endl);
[e359a8]404 performCriticalExit();
[5034e1]405 }
406 }
407 return FinalRootCandidates;
408};
409
410/** Marks all candidate sites for update if below adaptive threshold.
411 * Picks a given number of highest values and set *AtomMask to true.
412 * \param *out output stream for debugging
[a479fa]413 * \param *AtomMask defines true/false per global Atom::ParticleInfo_nr to mask in/out each nuclear site, used to activate given number of site to increment order adaptively
[5034e1]414 * \param FinalRootCandidates list candidates to check
415 * \param Order desired order
416 * \param *mol molecule with atoms
417 * \return true - if update is necessary, false - not
418 */
[e138de]419bool MarkUpdateCandidates(bool *AtomMask, map<double, pair<int,int> > &FinalRootCandidates, int Order, molecule *mol)
[5034e1]420{
[9879f6]421 atom *Walker = NULL;
[5034e1]422 int No = -1;
423 bool status = false;
424 for(map<double, pair<int,int> >::iterator runner = FinalRootCandidates.upper_bound(pow(10.,Order)); runner != FinalRootCandidates.end(); runner++) {
425 No = (*runner).second.first;
426 Walker = mol->FindAtom(No);
[a479fa]427 //if (Walker->AdaptiveOrder < MinimumRingSize[Walker->ParticleInfo_nr]) {
[a67d19]428 DoLog(2) && (Log() << Verbose(2) << "Root " << No << " is still above threshold (10^{" << Order <<"}: " << runner->first << ", setting entry " << No << " of Atom mask to true." << endl);
[5034e1]429 AtomMask[No] = true;
430 status = true;
431 //} else
[a479fa]432 //Log() << Verbose(2) << "Root " << No << " is still above threshold (10^{" << Order <<"}: " << runner->first << ", however MinimumRingSize of " << MinimumRingSize[Walker->ParticleInfo_nr] << " does not allow further adaptive increase." << endl;
[5034e1]433 }
434 return status;
435};
436
437/** print atom mask for debugging.
438 * \param *out output stream for debugging
[a479fa]439 * \param *AtomMask defines true/false per global Atom::ParticleInfo_nr to mask in/out each nuclear site, used to activate given number of site to increment order adaptively
[5034e1]440 * \param AtomCount number of entries in \a *AtomMask
441 */
[e138de]442void PrintAtomMask(bool *AtomMask, int AtomCount)
[5034e1]443{
[a67d19]444 DoLog(2) && (Log() << Verbose(2) << " ");
[5034e1]445 for(int i=0;i<AtomCount;i++)
[a67d19]446 DoLog(0) && (Log() << Verbose(0) << (i % 10));
447 DoLog(0) && (Log() << Verbose(0) << endl);
448 DoLog(2) && (Log() << Verbose(2) << "Atom mask is: ");
[5034e1]449 for(int i=0;i<AtomCount;i++)
[a67d19]450 DoLog(0) && (Log() << Verbose(0) << (AtomMask[i] ? "t" : "f"));
451 DoLog(0) && (Log() << Verbose(0) << endl);
[5034e1]452};
[cee0b57]453
454/** Checks whether the OrderAtSite is still below \a Order at some site.
[a479fa]455 * \param *AtomMask defines true/false per global Atom::ParticleInfo_nr to mask in/out each nuclear site, used to activate given number of site to increment order adaptively
[cee0b57]456 * \param *GlobalKeySetList list of keysets with global ids (valid in "this" molecule) needed for adaptive increase
457 * \param Order desired Order if positive, desired exponent in threshold criteria if negative (0 is single-step)
458 * \param *MinimumRingSize array of max. possible order to avoid loops
[35b698]459 * \param path path to ENERGYPERFRAGMENT file (may be NULL if Order is non-negative)
[cee0b57]460 * \return true - needs further fragmentation, false - does not need fragmentation
461 */
[35b698]462bool molecule::CheckOrderAtSite(bool *AtomMask, Graph *GlobalKeySetList, int Order, int *MinimumRingSize, std::string path)
[cee0b57]463{
464 bool status = false;
465
466 // initialize mask list
[ea7176]467 for(int i=getAtomCount();i--;)
[cee0b57]468 AtomMask[i] = false;
469
470 if (Order < 0) { // adaptive increase of BondOrder per site
[ea7176]471 if (AtomMask[getAtomCount()] == true) // break after one step
[cee0b57]472 return false;
[5034e1]473
474 // transmorph graph keyset list into indexed KeySetList
475 if (GlobalKeySetList == NULL) {
[58ed4a]476 DoeLog(1) && (eLog()<< Verbose(1) << "Given global key set list (graph) is NULL!" << endl);
[5034e1]477 return false;
478 }
479 map<int,KeySet> *IndexKeySetList = GraphToIndexedKeySet(GlobalKeySetList);
480
[cee0b57]481 // parse the EnergyPerFragment file
[e138de]482 map<int, pair<double,int> > *AdaptiveCriteriaList = ScanAdaptiveFileIntoMap(path, *IndexKeySetList); // (Root No., (Value, Order)) !
[5034e1]483 if (AdaptiveCriteriaList->empty()) {
[58ed4a]484 DoeLog(2) && (eLog()<< Verbose(2) << "Unable to parse file, incrementing all." << endl);
[9879f6]485 for (molecule::const_iterator iter = begin(); iter != end(); ++iter) {
[cee0b57]486 #ifdef ADDHYDROGEN
[83f176]487 if ((*iter)->getType()->getAtomicNumber() != 1) // skip hydrogen
[cee0b57]488 #endif
489 {
[a479fa]490 AtomMask[(*iter)->ParticleInfo_nr] = true; // include all (non-hydrogen) atoms
[cee0b57]491 status = true;
492 }
493 }
494 }
[5034e1]495 // then map back onto (Value, (Root Nr., Order)) (i.e. sorted by value to pick the highest ones)
[e138de]496 map<double, pair<int,int> > *FinalRootCandidates = ReMapAdaptiveCriteriaListToValue(AdaptiveCriteriaList, this);
[5034e1]497
498 // pick the ones still below threshold and mark as to be adaptively updated
[e138de]499 MarkUpdateCandidates(AtomMask, *FinalRootCandidates, Order, this);
[5034e1]500
[920c70]501 delete[](IndexKeySetList);
502 delete[](AdaptiveCriteriaList);
503 delete[](FinalRootCandidates);
[cee0b57]504 } else { // global increase of Bond Order
[9879f6]505 for(molecule::const_iterator iter = begin(); iter != end(); ++iter) {
[cee0b57]506 #ifdef ADDHYDROGEN
[83f176]507 if ((*iter)->getType()->getAtomicNumber() != 1) // skip hydrogen
[cee0b57]508 #endif
509 {
[a479fa]510 AtomMask[(*iter)->ParticleInfo_nr] = true; // include all (non-hydrogen) atoms
511 if ((Order != 0) && ((*iter)->AdaptiveOrder < Order)) // && ((*iter)->AdaptiveOrder < MinimumRingSize[(*iter)->ParticleInfo_nr]))
[cee0b57]512 status = true;
513 }
514 }
[ea7176]515 if ((!Order) && (!AtomMask[getAtomCount()])) // single stepping, just check
[cee0b57]516 status = true;
517
518 if (!status) {
519 if (Order == 0)
[a67d19]520 DoLog(1) && (Log() << Verbose(1) << "Single stepping done." << endl);
[cee0b57]521 else
[a67d19]522 DoLog(1) && (Log() << Verbose(1) << "Order at every site is already equal or above desired order " << Order << "." << endl);
[cee0b57]523 }
524 }
525
[ea7176]526 PrintAtomMask(AtomMask, getAtomCount()); // for debugging
[cee0b57]527
528 return status;
529};
530
531/** Create a SortIndex to map from atomic labels to the sequence in which the atoms are given in the config file.
532 * \param *out output stream for debugging
533 * \param *&SortIndex Mapping array of size molecule::AtomCount
534 * \return true - success, false - failure of SortIndex alloc
535 */
[e138de]536bool molecule::CreateMappingLabelsToConfigSequence(int *&SortIndex)
[cee0b57]537{
538 if (SortIndex != NULL) {
[a67d19]539 DoLog(1) && (Log() << Verbose(1) << "SortIndex is " << SortIndex << " and not NULL as expected." << endl);
[cee0b57]540 return false;
541 }
[1024cb]542 SortIndex = new int[getAtomCount()];
[ea7176]543 for(int i=getAtomCount();i--;)
[cee0b57]544 SortIndex[i] = -1;
[5034e1]545
546 int AtomNo = 0;
[32ea56]547 for(internal_iterator iter=atoms.begin();iter!=atoms.end();++iter){
[a479fa]548 ASSERT(SortIndex[(*iter)->ParticleInfo_nr]==-1,"Same SortIndex set twice");
549 SortIndex[(*iter)->ParticleInfo_nr] = AtomNo++;
[32ea56]550 }
[5034e1]551
[cee0b57]552 return true;
553};
554
[9879f6]555
556
557/** Creates a lookup table for true father's Atom::Nr -> atom ptr.
558 * \param *start begin of list (STL iterator, i.e. first item)
559 * \paran *end end of list (STL iterator, i.e. one past last item)
560 * \param **Lookuptable pointer to return allocated lookup table (should be NULL on start)
561 * \param count optional predetermined size for table (otherwise we set the count to highest true father id)
562 * \return true - success, false - failure
563 */
564bool molecule::CreateFatherLookupTable(atom **&LookupTable, int count)
565{
566 bool status = true;
567 int AtomNo;
568
569 if (LookupTable != NULL) {
570 Log() << Verbose(0) << "Pointer for Lookup table is not NULL! Aborting ..." <<endl;
571 return false;
572 }
573
574 // count them
575 if (count == 0) {
[a479fa]576 for (molecule::iterator iter = begin(); iter != end(); ++iter) { // create a lookup table (Atom::ParticleInfo_nr -> atom) used as a marker table lateron
577 count = (count < (*iter)->GetTrueFather()->ParticleInfo_nr) ? (*iter)->GetTrueFather()->ParticleInfo_nr : count;
[9879f6]578 }
579 }
580 if (count <= 0) {
581 Log() << Verbose(0) << "Count of lookup list is 0 or less." << endl;
582 return false;
583 }
584
585 // allocate and fill
[1024cb]586 LookupTable = new atom *[count];
[9879f6]587 if (LookupTable == NULL) {
588 eLog() << Verbose(0) << "LookupTable memory allocation failed!" << endl;
589 performCriticalExit();
590 status = false;
591 } else {
[1024cb]592 for (int i=0;i<count;i++)
593 LookupTable[i] = NULL;
[9879f6]594 for (molecule::iterator iter = begin(); iter != end(); ++iter) {
[a479fa]595 AtomNo = (*iter)->GetTrueFather()->ParticleInfo_nr;
[9879f6]596 if ((AtomNo >= 0) && (AtomNo < count)) {
597 //*out << "Setting LookupTable[" << AtomNo << "] to " << *(*iter) << endl;
598 LookupTable[AtomNo] = (*iter);
599 } else {
600 Log() << Verbose(0) << "Walker " << *(*iter) << " exceeded range of nuclear ids [0, " << count << ")." << endl;
601 status = false;
602 break;
603 }
604 }
605 }
606
607 return status;
608};
609
[cee0b57]610/** Performs a many-body bond order analysis for a given bond order.
611 * -# parses adjacency, keysets and orderatsite files
612 * -# performs DFS to find connected subgraphs (to leave this in was a design decision: might be useful later)
613 * -# RootStack is created for every subgraph (here, later we implement the "update 10 sites with highest energ
614y contribution", and that's why this consciously not done in the following loop)
615 * -# in a loop over all subgraphs
616 * -# calls FragmentBOSSANOVA with this RootStack and within the subgraph molecule structure
617 * -# creates molecule (fragment)s from the returned keysets (StoreFragmentFromKeySet)
618 * -# combines the generated molecule lists from all subgraphs
619 * -# saves to disk: fragment configs, adjacency, orderatsite, keyset files
620 * Note that as we split "this" molecule up into a list of subgraphs, i.e. a MoleculeListClass, we have two sets
621 * of vertex indices: Global always means the index in "this" molecule, whereas local refers to the molecule or
622 * subgraph in the MoleculeListClass.
623 * \param Order up to how many neighbouring bonds a fragment contains in BondOrderScheme::BottumUp scheme
[35b698]624 * \param &prefix path and prefix of the bond order configs to be written
[cee0b57]625 * \return 1 - continue, 2 - stop (no fragmentation occured)
626 */
[35b698]627int molecule::FragmentMolecule(int Order, std::string &prefix)
[cee0b57]628{
629 MoleculeListClass *BondFragments = NULL;
[ea7176]630 int *MinimumRingSize = new int[getAtomCount()];
[cee0b57]631 int FragmentCounter;
632 MoleculeLeafClass *MolecularWalker = NULL;
633 MoleculeLeafClass *Subgraphs = NULL; // list of subgraphs from DFS analysis
634 fstream File;
635 bool FragmentationToDo = true;
[a564be]636 std::deque<bond *> *BackEdgeStack = NULL, *LocalBackEdgeStack = NULL;
[cee0b57]637 bool CheckOrder = false;
638 Graph **FragmentList = NULL;
639 Graph *ParsedFragmentList = NULL;
640 Graph TotalGraph; // graph with all keysets however local numbers
641 int TotalNumberOfKeySets = 0;
642 atom **ListOfAtoms = NULL;
643 atom ***ListOfLocalAtoms = NULL;
644 bool *AtomMask = NULL;
645
[a67d19]646 DoLog(0) && (Log() << Verbose(0) << endl);
[cee0b57]647#ifdef ADDHYDROGEN
[a67d19]648 DoLog(0) && (Log() << Verbose(0) << "I will treat hydrogen special and saturate dangling bonds with it." << endl);
[cee0b57]649#else
[a67d19]650 DoLog(0) && (Log() << Verbose(0) << "Hydrogen is treated just like the rest of the lot." << endl);
[cee0b57]651#endif
652
653 // ++++++++++++++++++++++++++++ INITIAL STUFF: Bond structure analysis, file parsing, ... ++++++++++++++++++++++++++++++++++++++++++
654
655 // ===== 1. Check whether bond structure is same as stored in files ====
656
[a479fa]657 // create lookup table for Atom::ParticleInfo_nr
[ea7176]658 FragmentationToDo = FragmentationToDo && CreateFatherLookupTable(ListOfAtoms, getAtomCount());
[cee0b57]659
660 // === compare it with adjacency file ===
[35b698]661 FragmentationToDo = FragmentationToDo && CheckAdjacencyFileAgainstMolecule(prefix, ListOfAtoms);
[920c70]662 delete[](ListOfAtoms);
[cee0b57]663
[48d43f]664 // === reset bond degree and perform CorrectBondDegree ===
665 for(World::MoleculeIterator iter = World::getInstance().getMoleculeIter();
666 iter != World::getInstance().moleculeEnd();
667 ++iter) {
668 // reset bond degree to 1
669 for (molecule::iterator atomiter = (*iter)->begin();
670 atomiter != (*iter)->end();
671 ++atomiter) {
[9d83b6]672 const BondList& ListOfBonds = (*atomiter)->getListOfBonds();
673 for (BondList::const_iterator bonditer = ListOfBonds.begin();
674 bonditer != ListOfBonds.end();
[48d43f]675 ++bonditer) {
676 (*bonditer)->BondDegree = 1;
677 }
678 }
679 // correct bond degree
680 (*iter)->CorrectBondDegree();
681 }
682
[cee0b57]683 // ===== 2. perform a DFS analysis to gather info on cyclic structure and a list of disconnected subgraphs =====
[e138de]684 Subgraphs = DepthFirstSearchAnalysis(BackEdgeStack);
[7218f8]685
[cee0b57]686 // analysis of the cycles (print rings, get minimum cycle length) for each subgraph
[ea7176]687 for(int i=getAtomCount();i--;)
688 MinimumRingSize[i] = getAtomCount();
[cee0b57]689 MolecularWalker = Subgraphs;
[c27778]690 const int LeafCount = Subgraphs->next->Count();
[cee0b57]691 FragmentCounter = 0;
692 while (MolecularWalker->next != NULL) {
693 MolecularWalker = MolecularWalker->next;
[7218f8]694 // fill the bond structure of the individually stored subgraphs
[c27778]695 ListOfAtoms = NULL;
696 MolecularWalker->FillBondStructureFromReference(this, ListOfAtoms, false); // we want to keep the created ListOfLocalAtoms
[a67d19]697 DoLog(0) && (Log() << Verbose(0) << "Analysing the cycles of subgraph " << MolecularWalker->Leaf << " with nr. " << FragmentCounter << "." << endl);
[a564be]698 LocalBackEdgeStack = new std::deque<bond *>; // (MolecularWalker->Leaf->BondCount);
[cee0b57]699// // check the list of local atoms for debugging
[e138de]700// Log() << Verbose(0) << "ListOfLocalAtoms for this subgraph is:" << endl;
[1024cb]701// for (int i=0;i<getAtomCount();i++)
[cee0b57]702// if (ListOfLocalAtoms[FragmentCounter][i] == NULL)
[e138de]703// Log() << Verbose(0) << "\tNULL";
[cee0b57]704// else
[e138de]705// Log() << Verbose(0) << "\t" << ListOfLocalAtoms[FragmentCounter][i]->Name;
[a67d19]706 DoLog(0) && (Log() << Verbose(0) << "Gathering local back edges for subgraph " << MolecularWalker->Leaf << " with nr. " << FragmentCounter << "." << endl);
[c27778]707 MolecularWalker->Leaf->PickLocalBackEdges(ListOfAtoms, BackEdgeStack, LocalBackEdgeStack);
[a67d19]708 DoLog(0) && (Log() << Verbose(0) << "Analysing the cycles of subgraph " << MolecularWalker->Leaf << " with nr. " << FragmentCounter << "." << endl);
[e138de]709 MolecularWalker->Leaf->CyclicStructureAnalysis(LocalBackEdgeStack, MinimumRingSize);
[a67d19]710 DoLog(0) && (Log() << Verbose(0) << "Done with Analysing the cycles of subgraph " << MolecularWalker->Leaf << " with nr. " << FragmentCounter << "." << endl);
[cee0b57]711 delete(LocalBackEdgeStack);
[c27778]712 delete(ListOfAtoms);
713 FragmentCounter++;
[cee0b57]714 }
[7218f8]715 delete(BackEdgeStack);
[cee0b57]716
717 // ===== 3. if structure still valid, parse key set file and others =====
[35b698]718 FragmentationToDo = FragmentationToDo && ParseKeySetFile(prefix, ParsedFragmentList);
[cee0b57]719
720 // ===== 4. check globally whether there's something to do actually (first adaptivity check)
[35b698]721 FragmentationToDo = FragmentationToDo && ParseOrderAtSiteFromFile(prefix);
[cee0b57]722
723 // =================================== Begin of FRAGMENTATION ===============================
724 // ===== 6a. assign each keyset to its respective subgraph =====
[c27778]725 ListOfLocalAtoms = new atom **[LeafCount];
726 for (int i=0;i<LeafCount;i++)
727 ListOfLocalAtoms[i] = NULL;
728 FragmentCounter = 0;
729 Subgraphs->next->AssignKeySetsToFragment(this, ParsedFragmentList, ListOfLocalAtoms, FragmentList, FragmentCounter, true);
730 delete[](ListOfLocalAtoms);
[cee0b57]731
732 // ===== 6b. prepare and go into the adaptive (Order<0), single-step (Order==0) or incremental (Order>0) cycle
733 KeyStack *RootStack = new KeyStack[Subgraphs->next->Count()];
[ea7176]734 AtomMask = new bool[getAtomCount()+1];
735 AtomMask[getAtomCount()] = false;
[cee0b57]736 FragmentationToDo = false; // if CheckOrderAtSite just ones recommends fragmentation, we will save fragments afterwards
[35b698]737 while ((CheckOrder = CheckOrderAtSite(AtomMask, ParsedFragmentList, Order, MinimumRingSize, prefix))) {
[cee0b57]738 FragmentationToDo = FragmentationToDo || CheckOrder;
[ea7176]739 AtomMask[getAtomCount()] = true; // last plus one entry is used as marker that we have been through this loop once already in CheckOrderAtSite()
[cee0b57]740 // ===== 6b. fill RootStack for each subgraph (second adaptivity check) =====
[e138de]741 Subgraphs->next->FillRootStackForSubgraphs(RootStack, AtomMask, (FragmentCounter = 0));
[cee0b57]742
743 // ===== 7. fill the bond fragment list =====
744 FragmentCounter = 0;
745 MolecularWalker = Subgraphs;
746 while (MolecularWalker->next != NULL) {
747 MolecularWalker = MolecularWalker->next;
[a67d19]748 DoLog(1) && (Log() << Verbose(1) << "Fragmenting subgraph " << MolecularWalker << "." << endl);
[266237]749 //MolecularWalker->Leaf->OutputListOfBonds(out); // output atom::ListOfBonds for debugging
[e08c46]750 if (MolecularWalker->Leaf->hasBondStructure()) {
[cee0b57]751 // call BOSSANOVA method
[a67d19]752 DoLog(0) && (Log() << Verbose(0) << endl << " ========== BOND ENERGY of subgraph " << FragmentCounter << " ========================= " << endl);
[e138de]753 MolecularWalker->Leaf->FragmentBOSSANOVA(FragmentList[FragmentCounter], RootStack[FragmentCounter], MinimumRingSize);
[cee0b57]754 } else {
[58ed4a]755 DoeLog(1) && (eLog()<< Verbose(1) << "Subgraph " << MolecularWalker << " has no atoms!" << endl);
[cee0b57]756 }
757 FragmentCounter++; // next fragment list
758 }
759 }
[a67d19]760 DoLog(2) && (Log() << Verbose(2) << "CheckOrder is " << CheckOrder << "." << endl);
[cee0b57]761 delete[](RootStack);
762 delete[](AtomMask);
763 delete(ParsedFragmentList);
764 delete[](MinimumRingSize);
765
766 // ==================================== End of FRAGMENTATION ============================================
767
768 // ===== 8a. translate list into global numbers (i.e. ones that are valid in "this" molecule, not in MolecularWalker->Leaf)
[e138de]769 Subgraphs->next->TranslateIndicesToGlobalIDs(FragmentList, (FragmentCounter = 0), TotalNumberOfKeySets, TotalGraph);
[cee0b57]770
771 // free subgraph memory again
772 FragmentCounter = 0;
[00b59d5]773 while (Subgraphs != NULL) {
774 // remove entry in fragment list
775 // remove subgraph fragment
776 MolecularWalker = Subgraphs->next;
[cee0b57]777 delete(Subgraphs);
[00b59d5]778 Subgraphs = MolecularWalker;
[cee0b57]779 }
[00b59d5]780 // free fragment list
781 for (int i=0; i< FragmentCounter; ++i )
782 delete(FragmentList[i]);
[920c70]783 delete[](FragmentList);
[cee0b57]784
[00b59d5]785 DoLog(0) && (Log() << Verbose(0) << FragmentCounter-1 << " subgraph fragments have been removed." << std::endl);
786
[cee0b57]787 // ===== 8b. gather keyset lists (graphs) from all subgraphs and transform into MoleculeListClass =====
788 //if (FragmentationToDo) { // we should always store the fragments again as coordination might have changed slightly without changing bond structure
[7218f8]789 // allocate memory for the pointer array and transmorph graphs into full molecular fragments
[23b547]790 BondFragments = new MoleculeListClass(World::getPointer());
[7218f8]791 int k=0;
792 for(Graph::iterator runner = TotalGraph.begin(); runner != TotalGraph.end(); runner++) {
793 KeySet test = (*runner).first;
[a67d19]794 DoLog(0) && (Log() << Verbose(0) << "Fragment No." << (*runner).second.first << " with TEFactor " << (*runner).second.second << "." << endl);
[35b698]795 BondFragments->insert(StoreFragmentFromKeySet(test, World::getInstance().getConfig()));
[7218f8]796 k++;
797 }
[a67d19]798 DoLog(0) && (Log() << Verbose(0) << k << "/" << BondFragments->ListOfMolecules.size() << " fragments generated from the keysets." << endl);
[cee0b57]799
[7218f8]800 // ===== 9. Save fragments' configuration and keyset files et al to disk ===
801 if (BondFragments->ListOfMolecules.size() != 0) {
802 // create the SortIndex from BFS labels to order in the config file
[42af9e]803 int *SortIndex = NULL;
[e138de]804 CreateMappingLabelsToConfigSequence(SortIndex);
[cee0b57]805
[a67d19]806 DoLog(1) && (Log() << Verbose(1) << "Writing " << BondFragments->ListOfMolecules.size() << " possible bond fragmentation configs" << endl);
[35b698]807 if (BondFragments->OutputConfigForListOfFragments(prefix, SortIndex))
[a67d19]808 DoLog(1) && (Log() << Verbose(1) << "All configs written." << endl);
[7218f8]809 else
[a67d19]810 DoLog(1) && (Log() << Verbose(1) << "Some config writing failed." << endl);
[cee0b57]811
[7218f8]812 // store force index reference file
[35b698]813 BondFragments->StoreForcesFile(prefix, SortIndex);
[cee0b57]814
[7218f8]815 // store keysets file
[35b698]816 StoreKeySetFile(TotalGraph, prefix);
[cee0b57]817
[920c70]818 {
819 // store Adjacency file
[35b698]820 std::string filename = prefix + ADJACENCYFILE;
821 StoreAdjacencyToFile(filename);
[920c70]822 }
[cee0b57]823
[7218f8]824 // store Hydrogen saturation correction file
[35b698]825 BondFragments->AddHydrogenCorrection(prefix);
[cee0b57]826
[7218f8]827 // store adaptive orders into file
[35b698]828 StoreOrderAtSiteFile(prefix);
[cee0b57]829
[7218f8]830 // restore orbital and Stop values
[35b698]831 //CalculateOrbitals(*configuration);
[cee0b57]832
[7218f8]833 // free memory for bond part
[a67d19]834 DoLog(1) && (Log() << Verbose(1) << "Freeing bond memory" << endl);
[920c70]835 delete[](SortIndex);
[7218f8]836 } else {
[a67d19]837 DoLog(1) && (Log() << Verbose(1) << "FragmentList is zero on return, splitting failed." << endl);
[7218f8]838 }
[00b59d5]839 // remove all create molecules again from the World including their atoms
840 for (MoleculeList::iterator iter = BondFragments->ListOfMolecules.begin();
841 !BondFragments->ListOfMolecules.empty();
842 iter = BondFragments->ListOfMolecules.begin()) {
843 // remove copied atoms and molecule again
844 molecule *mol = *iter;
845 mol->removeAtomsinMolecule();
846 World::getInstance().destroyMolecule(mol);
847 BondFragments->ListOfMolecules.erase(iter);
848 }
[7218f8]849 delete(BondFragments);
[a67d19]850 DoLog(0) && (Log() << Verbose(0) << "End of bond fragmentation." << endl);
[cee0b57]851
852 return ((int)(!FragmentationToDo)+1); // 1 - continue, 2 - stop (no fragmentation occured)
853};
854
855
[a479fa]856/** Stores pairs (Atom::ParticleInfo_nr, Atom::AdaptiveOrder) into file.
[cee0b57]857 * Atoms not present in the file get "-1".
[35b698]858 * \param &path path to file ORDERATSITEFILE
[cee0b57]859 * \return true - file writable, false - not writable
860 */
[35b698]861bool molecule::StoreOrderAtSiteFile(std::string &path)
[cee0b57]862{
[35b698]863 string line;
[cee0b57]864 ofstream file;
865
[35b698]866 line = path + ORDERATSITEFILE;
867 file.open(line.c_str());
[a67d19]868 DoLog(1) && (Log() << Verbose(1) << "Writing OrderAtSite " << ORDERATSITEFILE << " ... " << endl);
[35b698]869 if (file.good()) {
[c743f8]870 for_each(atoms.begin(),atoms.end(),bind2nd(mem_fun(&atom::OutputOrder), &file));
[cee0b57]871 file.close();
[a67d19]872 DoLog(1) && (Log() << Verbose(1) << "done." << endl);
[cee0b57]873 return true;
874 } else {
[35b698]875 DoLog(1) && (Log() << Verbose(1) << "failed to open file " << line << "." << endl);
[cee0b57]876 return false;
877 }
878};
879
[a479fa]880/** Parses pairs(Atom::ParticleInfo_nr, Atom::AdaptiveOrder) from file and stores in molecule's Atom's.
[cee0b57]881 * Atoms not present in the file get "0".
[35b698]882 * \param &path path to file ORDERATSITEFILEe
[cee0b57]883 * \return true - file found and scanned, false - file not found
884 * \sa ParseKeySetFile() and CheckAdjacencyFileAgainstMolecule() as this is meant to be used in conjunction with the two
885 */
[35b698]886bool molecule::ParseOrderAtSiteFromFile(std::string &path)
[cee0b57]887{
[1024cb]888 unsigned char *OrderArray = new unsigned char[getAtomCount()];
889 bool *MaxArray = new bool[getAtomCount()];
[cee0b57]890 bool status;
891 int AtomNr, value;
[35b698]892 string line;
[cee0b57]893 ifstream file;
894
[1024cb]895 for(int i=0;i<getAtomCount();i++) {
[920c70]896 OrderArray[i] = 0;
897 MaxArray[i] = false;
898 }
899
[a67d19]900 DoLog(1) && (Log() << Verbose(1) << "Begin of ParseOrderAtSiteFromFile" << endl);
[35b698]901 line = path + ORDERATSITEFILE;
902 file.open(line.c_str());
903 if (file.good()) {
[cee0b57]904 while (!file.eof()) { // parse from file
905 AtomNr = -1;
906 file >> AtomNr;
907 if (AtomNr != -1) { // test whether we really parsed something (this is necessary, otherwise last atom is set twice and to 0 on second time)
908 file >> value;
909 OrderArray[AtomNr] = value;
910 file >> value;
911 MaxArray[AtomNr] = value;
[e138de]912 //Log() << Verbose(2) << "AtomNr " << AtomNr << " with order " << (int)OrderArray[AtomNr] << " and max order set to " << (int)MaxArray[AtomNr] << "." << endl;
[cee0b57]913 }
914 }
915 file.close();
[5034e1]916
917 // set atom values
[32ea56]918 for(internal_iterator iter=atoms.begin();iter!=atoms.end();++iter){
[a479fa]919 (*iter)->AdaptiveOrder = OrderArray[(*iter)->ParticleInfo_nr];
920 (*iter)->MaxOrder = MaxArray[(*iter)->ParticleInfo_nr];
[32ea56]921 }
[a479fa]922 //SetAtomValueToIndexedArray( OrderArray, &atom::ParticleInfo_nr, &atom::AdaptiveOrder );
923 //SetAtomValueToIndexedArray( MaxArray, &atom::ParticleInfo_nr, &atom::MaxOrder );
[5034e1]924
[0de7e8]925 DoLog(1) && (Log() << Verbose(1) << "\t ... done." << endl);
[cee0b57]926 status = true;
927 } else {
[35b698]928 DoLog(1) && (Log() << Verbose(1) << "\t ... failed to open file " << line << "." << endl);
[cee0b57]929 status = false;
930 }
[920c70]931 delete[](OrderArray);
932 delete[](MaxArray);
[cee0b57]933
[a67d19]934 DoLog(1) && (Log() << Verbose(1) << "End of ParseOrderAtSiteFromFile" << endl);
[cee0b57]935 return status;
936};
937
938
939
[a564be]940/** Looks through a std::deque<atom *> and returns the likeliest removal candiate.
[cee0b57]941 * \param *out output stream for debugging messages
942 * \param *&Leaf KeySet to look through
943 * \param *&ShortestPathList list of the shortest path to decide which atom to suggest as removal candidate in the end
944 * \param index of the atom suggested for removal
945 */
[e138de]946int molecule::LookForRemovalCandidate(KeySet *&Leaf, int *&ShortestPathList)
[cee0b57]947{
948 atom *Runner = NULL;
949 int SP, Removal;
950
[a67d19]951 DoLog(2) && (Log() << Verbose(2) << "Looking for removal candidate." << endl);
[cee0b57]952 SP = -1; //0; // not -1, so that Root is never removed
953 Removal = -1;
954 for (KeySet::iterator runner = Leaf->begin(); runner != Leaf->end(); runner++) {
955 Runner = FindAtom((*runner));
[83f176]956 if (Runner->getType()->getAtomicNumber() != 1) { // skip all those added hydrogens when re-filling snake stack
[cee0b57]957 if (ShortestPathList[(*runner)] > SP) { // remove the oldest one with longest shortest path
958 SP = ShortestPathList[(*runner)];
959 Removal = (*runner);
960 }
961 }
962 }
963 return Removal;
964};
965
[5034e1]966/** Initializes some value for putting fragment of \a *mol into \a *Leaf.
967 * \param *mol total molecule
968 * \param *Leaf fragment molecule
[cee0b57]969 * \param &Leaflet pointer to KeySet structure
[7218f8]970 * \param **SonList calloc'd list which atom of \a *Leaf is a son of which atom in \a *mol
[5034e1]971 * \return number of atoms in fragment
[cee0b57]972 */
[5034e1]973int StoreFragmentFromKeySet_Init(molecule *mol, molecule *Leaf, KeySet &Leaflet, atom **SonList)
[cee0b57]974{
[5034e1]975 atom *FatherOfRunner = NULL;
[cee0b57]976
[5034e1]977 Leaf->BondDistance = mol->BondDistance;
[cee0b57]978
979 // first create the minimal set of atoms from the KeySet
[5034e1]980 int size = 0;
[cee0b57]981 for(KeySet::iterator runner = Leaflet.begin(); runner != Leaflet.end(); runner++) {
[5034e1]982 FatherOfRunner = mol->FindAtom((*runner)); // find the id
[a479fa]983 SonList[FatherOfRunner->ParticleInfo_nr] = Leaf->AddCopyAtom(FatherOfRunner);
[cee0b57]984 size++;
985 }
[5034e1]986 return size;
987};
[cee0b57]988
[5034e1]989/** Creates an induced subgraph out of a fragmental key set, adding bonds and hydrogens (if treated specially).
990 * \param *out output stream for debugging messages
991 * \param *mol total molecule
992 * \param *Leaf fragment molecule
993 * \param IsAngstroem whether we have Ansgtroem or bohrradius
994 * \param **SonList list which atom of \a *Leaf is a son of which atom in \a *mol
995 */
[e138de]996void CreateInducedSubgraphOfFragment(molecule *mol, molecule *Leaf, atom **SonList, bool IsAngstroem)
[5034e1]997{
998 bool LonelyFlag = false;
999 atom *OtherFather = NULL;
1000 atom *FatherOfRunner = NULL;
1001
[9879f6]1002#ifdef ADDHYDROGEN
1003 molecule::const_iterator runner;
1004#endif
[a7b761b]1005 // we increment the iter just before skipping the hydrogen
1006 for (molecule::const_iterator iter = Leaf->begin(); iter != Leaf->end();) {
[cee0b57]1007 LonelyFlag = true;
[9879f6]1008 FatherOfRunner = (*iter)->father;
[a7b761b]1009 ASSERT(FatherOfRunner,"Atom without father found");
[a479fa]1010 if (SonList[FatherOfRunner->ParticleInfo_nr] != NULL) { // check if this, our father, is present in list
[cee0b57]1011 // create all bonds
[9d83b6]1012 const BondList& ListOfBonds = FatherOfRunner->getListOfBonds();
1013 for (BondList::const_iterator BondRunner = ListOfBonds.begin();
1014 BondRunner != ListOfBonds.end();
1015 ++BondRunner) {
[266237]1016 OtherFather = (*BondRunner)->GetOtherAtom(FatherOfRunner);
[a479fa]1017// Log() << Verbose(2) << "Father " << *FatherOfRunner << " of son " << *SonList[FatherOfRunner->ParticleInfo_nr] << " is bound to " << *OtherFather;
1018 if (SonList[OtherFather->ParticleInfo_nr] != NULL) {
1019// Log() << Verbose(0) << ", whose son is " << *SonList[OtherFather->ParticleInfo_nr] << "." << endl;
1020 if (OtherFather->ParticleInfo_nr > FatherOfRunner->ParticleInfo_nr) { // add bond (ParticleInfo_nr check is for adding only one of both variants: ab, ba)
[e138de]1021// Log() << Verbose(3) << "Adding Bond: ";
1022// Log() << Verbose(0) <<
[a479fa]1023 Leaf->AddBond((*iter), SonList[OtherFather->ParticleInfo_nr], (*BondRunner)->BondDegree);
[e138de]1024// Log() << Verbose(0) << "." << endl;
[a479fa]1025 //NumBonds[(*iter)->ParticleInfo_nr]++;
[cee0b57]1026 } else {
[e138de]1027// Log() << Verbose(3) << "Not adding bond, labels in wrong order." << endl;
[cee0b57]1028 }
1029 LonelyFlag = false;
1030 } else {
[e138de]1031// Log() << Verbose(0) << ", who has no son in this fragment molecule." << endl;
[cee0b57]1032#ifdef ADDHYDROGEN
[9879f6]1033 //Log() << Verbose(3) << "Adding Hydrogen to " << (*iter)->Name << " and a bond in between." << endl;
1034 if(!Leaf->AddHydrogenReplacementAtom((*BondRunner), (*iter), FatherOfRunner, OtherFather, IsAngstroem))
[cee0b57]1035 exit(1);
1036#endif
[a479fa]1037 //NumBonds[(*iter)->ParticleInfo_nr] += Binder->BondDegree;
[cee0b57]1038 }
1039 }
1040 } else {
[a479fa]1041 DoeLog(1) && (eLog()<< Verbose(1) << "Son " << (*iter)->getName() << " has father " << FatherOfRunner->getName() << " but its entry in SonList is " << SonList[FatherOfRunner->ParticleInfo_nr] << "!" << endl);
[cee0b57]1042 }
[ea7176]1043 if ((LonelyFlag) && (Leaf->getAtomCount() > 1)) {
[a7b761b]1044 DoLog(0) && (Log() << Verbose(0) << **iter << "has got bonds only to hydrogens!" << endl);
[cee0b57]1045 }
[a7b761b]1046 ++iter;
[cee0b57]1047#ifdef ADDHYDROGEN
[83f176]1048 while ((iter != Leaf->end()) && ((*iter)->getType()->getAtomicNumber() == 1)){ // skip added hydrogen
[9879f6]1049 iter++;
[a7b761b]1050 }
[cee0b57]1051#endif
1052 }
[5034e1]1053};
1054
1055/** Stores a fragment from \a KeySet into \a molecule.
1056 * First creates the minimal set of atoms from the KeySet, then creates the bond structure from the complete
1057 * molecule and adds missing hydrogen where bonds were cut.
1058 * \param *out output stream for debugging messages
1059 * \param &Leaflet pointer to KeySet structure
1060 * \param IsAngstroem whether we have Ansgtroem or bohrradius
1061 * \return pointer to constructed molecule
1062 */
[e138de]1063molecule * molecule::StoreFragmentFromKeySet(KeySet &Leaflet, bool IsAngstroem)
[5034e1]1064{
[1024cb]1065 atom **SonList = new atom*[getAtomCount()];
[23b547]1066 molecule *Leaf = World::getInstance().createMolecule();
[5034e1]1067
[1024cb]1068 for(int i=0;i<getAtomCount();i++)
[920c70]1069 SonList[i] = NULL;
1070
[e138de]1071// Log() << Verbose(1) << "Begin of StoreFragmentFromKeyset." << endl;
[5034e1]1072 StoreFragmentFromKeySet_Init(this, Leaf, Leaflet, SonList);
1073 // create the bonds between all: Make it an induced subgraph and add hydrogen
[e138de]1074// Log() << Verbose(2) << "Creating bonds from father graph (i.e. induced subgraph creation)." << endl;
1075 CreateInducedSubgraphOfFragment(this, Leaf, SonList, IsAngstroem);
[5034e1]1076
[cee0b57]1077 //Leaflet->Leaf->ScanForPeriodicCorrection(out);
[920c70]1078 delete[](SonList);
[e138de]1079// Log() << Verbose(1) << "End of StoreFragmentFromKeyset." << endl;
[cee0b57]1080 return Leaf;
1081};
1082
[d2943b]1083
1084/** Clears the touched list
1085 * \param *out output stream for debugging
1086 * \param verbosity verbosity level
1087 * \param *&TouchedList touched list
1088 * \param SubOrder current suborder
1089 * \param TouchedIndex currently touched
1090 */
[e138de]1091void SPFragmentGenerator_ClearingTouched(int verbosity, int *&TouchedList, int SubOrder, int &TouchedIndex)
[d2943b]1092{
[e138de]1093 Log() << Verbose(1+verbosity) << "Clearing touched list." << endl;
[d2943b]1094 for (TouchedIndex=SubOrder+1;TouchedIndex--;) // empty touched list
1095 TouchedList[TouchedIndex] = -1;
1096 TouchedIndex = 0;
1097
1098}
1099
1100/** Adds the current combination of the power set to the snake stack.
1101 * \param *out output stream for debugging
1102 * \param verbosity verbosity level
1103 * \param CurrentCombination
1104 * \param SetDimension maximum number of bits in power set
1105 * \param *FragmentSet snake stack to remove from
[03c77c]1106 * \param &BondsSet set of bonds
[d2943b]1107 * \param *&TouchedList touched list
1108 * \param TouchedIndex currently touched
1109 * \return number of set bits
1110 */
[03c77c]1111int AddPowersetToSnakeStack(int verbosity, int CurrentCombination, int SetDimension, KeySet *FragmentSet, std::vector<bond *> &BondsSet, int *&TouchedList, int &TouchedIndex)
[d2943b]1112{
1113 atom *OtherWalker = NULL;
1114 bool bit = false;
1115 KeySetTestPair TestKeySetInsert;
1116
1117 int Added = 0;
1118 for (int j=0;j<SetDimension;j++) { // pull out every bit by shifting
1119 bit = ((CurrentCombination & (1 << j)) != 0); // mask the bit for the j-th bond
1120 if (bit) { // if bit is set, we add this bond partner
1121 OtherWalker = BondsSet[j]->rightatom; // rightatom is always the one more distant, i.e. the one to add
[e138de]1122 //Log() << Verbose(1+verbosity) << "Current Bond is " << BondsSet[j] << ", checking on " << *OtherWalker << "." << endl;
[a479fa]1123 Log() << Verbose(2+verbosity) << "Adding " << *OtherWalker << " with nr " << OtherWalker->ParticleInfo_nr << "." << endl;
1124 TestKeySetInsert = FragmentSet->insert(OtherWalker->ParticleInfo_nr);
[d2943b]1125 if (TestKeySetInsert.second) {
[a479fa]1126 TouchedList[TouchedIndex++] = OtherWalker->ParticleInfo_nr; // note as added
[d2943b]1127 Added++;
1128 } else {
[e138de]1129 Log() << Verbose(2+verbosity) << "This was item was already present in the keyset." << endl;
[d2943b]1130 }
1131 } else {
[e138de]1132 Log() << Verbose(2+verbosity) << "Not adding." << endl;
[d2943b]1133 }
1134 }
1135 return Added;
1136};
1137
1138/** Counts the number of elements in a power set.
[03c77c]1139 * \param SetFirst begin iterator first bond
1140 * \param SetLast end iterator
[d2943b]1141 * \param *&TouchedList touched list
1142 * \param TouchedIndex currently touched
1143 * \return number of elements
1144 */
[03c77c]1145int CountSetMembers(std::list<bond *>::const_iterator SetFirst, std::list<bond *>::const_iterator SetLast, int *&TouchedList, int TouchedIndex)
[d2943b]1146{
1147 int SetDimension = 0;
[03c77c]1148 for( std::list<bond *>::const_iterator Binder = SetFirst;
1149 Binder != SetLast;
1150 ++Binder) {
[d2943b]1151 for (int k=TouchedIndex;k--;) {
[03c77c]1152 if ((*Binder)->Contains(TouchedList[k])) // if we added this very endpiece
[d2943b]1153 SetDimension++;
1154 }
1155 }
1156 return SetDimension;
1157};
1158
[03c77c]1159/** Fills a list of bonds from another
1160 * \param *BondsList bonds array/vector to fill
1161 * \param SetFirst begin iterator first bond
1162 * \param SetLast end iterator
[d2943b]1163 * \param *&TouchedList touched list
1164 * \param TouchedIndex currently touched
1165 * \return number of elements
1166 */
[03c77c]1167int FillBondsList(std::vector<bond *> &BondsList, std::list<bond *>::const_iterator SetFirst, std::list<bond *>::const_iterator SetLast, int *&TouchedList, int TouchedIndex)
[d2943b]1168{
1169 int SetDimension = 0;
[03c77c]1170 for( std::list<bond *>::const_iterator Binder = SetFirst;
1171 Binder != SetLast;
1172 ++Binder) {
[d2943b]1173 for (int k=0;k<TouchedIndex;k++) {
[a479fa]1174 if ((*Binder)->leftatom->ParticleInfo_nr == TouchedList[k]) // leftatom is always the closer one
[03c77c]1175 BondsList[SetDimension++] = (*Binder);
[d2943b]1176 }
1177 }
1178 return SetDimension;
1179};
1180
1181/** Remove all items that were added on this SP level.
1182 * \param *out output stream for debugging
1183 * \param verbosity verbosity level
1184 * \param *FragmentSet snake stack to remove from
1185 * \param *&TouchedList touched list
1186 * \param TouchedIndex currently touched
1187 */
[e138de]1188void RemoveAllTouchedFromSnakeStack(int verbosity, KeySet *FragmentSet, int *&TouchedList, int &TouchedIndex)
[d2943b]1189{
1190 int Removal = 0;
1191 for(int j=0;j<TouchedIndex;j++) {
1192 Removal = TouchedList[j];
[e138de]1193 Log() << Verbose(2+verbosity) << "Removing item nr. " << Removal << " from snake stack." << endl;
[d2943b]1194 FragmentSet->erase(Removal);
1195 TouchedList[j] = -1;
1196 }
[a67d19]1197 DoLog(2) && (Log() << Verbose(2) << "Remaining local nr.s on snake stack are: ");
[d2943b]1198 for(KeySet::iterator runner = FragmentSet->begin(); runner != FragmentSet->end(); runner++)
[a67d19]1199 DoLog(0) && (Log() << Verbose(0) << (*runner) << " ");
1200 DoLog(0) && (Log() << Verbose(0) << endl);
[d2943b]1201 TouchedIndex = 0; // set Index to 0 for list of atoms added on this level
1202};
1203
[cee0b57]1204/** From a given set of Bond sorted by Shortest Path distance, create all possible fragments of size \a SetDimension.
1205 * -# loops over every possible combination (2^dimension of edge set)
1206 * -# inserts current set, if there's still space left
1207 * -# yes: calls SPFragmentGenerator with structure, created new edge list and size respective to root dist
1208ance+1
1209 * -# no: stores fragment into keyset list by calling InsertFragmentIntoGraph
1210 * -# removes all items added into the snake stack (in UniqueFragments structure) added during level (root
1211distance) and current set
1212 * \param FragmentSearch UniqueFragments structure with all values needed
1213 * \param RootDistance current shortest path level, whose set of edges is represented by **BondsSet
[03c77c]1214 * \param BondsSet array of bonds to check
[cee0b57]1215 * \param SetDimension Number of possible bonds on this level (i.e. size of the array BondsSet[])
1216 * \param SubOrder remaining number of allowed vertices to add
1217 */
[03c77c]1218void molecule::SPFragmentGenerator(struct UniqueFragments *FragmentSearch, int RootDistance, std::vector<bond *> &BondsSet, int SetDimension, int SubOrder)
[cee0b57]1219{
1220 int verbosity = 0; //FragmentSearch->ANOVAOrder-SubOrder;
1221 int NumCombinations;
1222 int bits, TouchedIndex, SubSetDimension, SP, Added;
1223 int SpaceLeft;
[920c70]1224 int *TouchedList = new int[SubOrder + 1];
[cee0b57]1225 KeySetTestPair TestKeySetInsert;
1226
1227 NumCombinations = 1 << SetDimension;
1228
[266237]1229 // here for all bonds of Walker all combinations of end pieces (from the bonds)
1230 // have to be added and for the remaining ANOVA order GraphCrawler be called
1231 // recursively for the next level
[cee0b57]1232
[e138de]1233 Log() << Verbose(1+verbosity) << "Begin of SPFragmentGenerator." << endl;
1234 Log() << Verbose(1+verbosity) << "We are " << RootDistance << " away from Root, which is " << *FragmentSearch->Root << ", SubOrder is " << SubOrder << ", SetDimension is " << SetDimension << " and this means " << NumCombinations-1 << " combination(s)." << endl;
[cee0b57]1235
1236 // initialised touched list (stores added atoms on this level)
[e138de]1237 SPFragmentGenerator_ClearingTouched(verbosity, TouchedList, SubOrder, TouchedIndex);
[cee0b57]1238
1239 // create every possible combination of the endpieces
[e138de]1240 Log() << Verbose(1+verbosity) << "Going through all combinations of the power set." << endl;
[cee0b57]1241 for (int i=1;i<NumCombinations;i++) { // sweep through all power set combinations (skip empty set!)
1242 // count the set bit of i
1243 bits = 0;
1244 for (int j=SetDimension;j--;)
1245 bits += (i & (1 << j)) >> j;
1246
[e138de]1247 Log() << Verbose(1+verbosity) << "Current set is " << Binary(i | (1 << SetDimension)) << ", number of bits is " << bits << "." << endl;
[cee0b57]1248 if (bits <= SubOrder) { // if not greater than additional atoms allowed on stack, continue
1249 // --1-- add this set of the power set of bond partners to the snake stack
[e138de]1250 Added = AddPowersetToSnakeStack(verbosity, i, SetDimension, FragmentSearch->FragmentSet, BondsSet, TouchedList, TouchedIndex);
[cee0b57]1251
1252 SpaceLeft = SubOrder - Added ;// SubOrder - bits; // due to item's maybe being already present, this does not work anymore
1253 if (SpaceLeft > 0) {
[e138de]1254 Log() << Verbose(1+verbosity) << "There's still some space left on stack: " << SpaceLeft << "." << endl;
[cee0b57]1255 if (SubOrder > 1) { // Due to Added above we have to check extra whether we're not already reaching beyond the desired Order
1256 // --2-- look at all added end pieces of this combination, construct bond subsets and sweep through a power set of these by recursion
1257 SP = RootDistance+1; // this is the next level
[d2943b]1258
[cee0b57]1259 // first count the members in the subset
[03c77c]1260 SubSetDimension = CountSetMembers(FragmentSearch->BondsPerSPList[SP].begin(), FragmentSearch->BondsPerSPList[SP].end(), TouchedList, TouchedIndex);
[d2943b]1261
[cee0b57]1262 // then allocate and fill the list
[03c77c]1263 std::vector<bond *> BondsList;
1264 BondsList.resize(SubSetDimension);
1265 SubSetDimension = FillBondsList(BondsList, FragmentSearch->BondsPerSPList[SP].begin(), FragmentSearch->BondsPerSPList[SP].end(), TouchedList, TouchedIndex);
[d2943b]1266
1267 // then iterate
[e138de]1268 Log() << Verbose(2+verbosity) << "Calling subset generator " << SP << " away from root " << *FragmentSearch->Root << " with sub set dimension " << SubSetDimension << "." << endl;
1269 SPFragmentGenerator(FragmentSearch, SP, BondsList, SubSetDimension, SubOrder-bits);
[cee0b57]1270 }
1271 } else {
1272 // --2-- otherwise store the complete fragment
[e138de]1273 Log() << Verbose(1+verbosity) << "Enough items on stack for a fragment!" << endl;
[cee0b57]1274 // store fragment as a KeySet
[a67d19]1275 DoLog(2) && (Log() << Verbose(2) << "Found a new fragment[" << FragmentSearch->FragmentCounter << "], local nr.s are: ");
[cee0b57]1276 for(KeySet::iterator runner = FragmentSearch->FragmentSet->begin(); runner != FragmentSearch->FragmentSet->end(); runner++)
[a67d19]1277 DoLog(0) && (Log() << Verbose(0) << (*runner) << " ");
1278 DoLog(0) && (Log() << Verbose(0) << endl);
[e138de]1279 //if (!CheckForConnectedSubgraph(FragmentSearch->FragmentSet))
[58ed4a]1280 //DoeLog(1) && (eLog()<< Verbose(1) << "The found fragment is not a connected subgraph!" << endl);
[e138de]1281 InsertFragmentIntoGraph(FragmentSearch);
[cee0b57]1282 }
1283
1284 // --3-- remove all added items in this level from snake stack
[e138de]1285 Log() << Verbose(1+verbosity) << "Removing all items that were added on this SP level " << RootDistance << "." << endl;
1286 RemoveAllTouchedFromSnakeStack(verbosity, FragmentSearch->FragmentSet, TouchedList, TouchedIndex);
[cee0b57]1287 } else {
[e138de]1288 Log() << Verbose(2+verbosity) << "More atoms to add for this set (" << bits << ") than space left on stack " << SubOrder << ", skipping this set." << endl;
[cee0b57]1289 }
1290 }
[920c70]1291 delete[](TouchedList);
[e138de]1292 Log() << Verbose(1+verbosity) << "End of SPFragmentGenerator, " << RootDistance << " away from Root " << *FragmentSearch->Root << " and SubOrder is " << SubOrder << "." << endl;
[cee0b57]1293};
1294
[407536]1295/** Allocates memory for UniqueFragments::BondsPerSPList.
1296 * \param *out output stream
1297 * \param Order bond order (limits BFS exploration and "number of digits" in power set generation
1298 * \param FragmentSearch UniqueFragments
1299 * \sa FreeSPList()
1300 */
[e138de]1301void InitialiseSPList(int Order, struct UniqueFragments &FragmentSearch)
[407536]1302{
[03c77c]1303 FragmentSearch.BondsPerSPList.resize(Order);
[920c70]1304 FragmentSearch.BondsPerSPCount = new int[Order];
[407536]1305 for (int i=Order;i--;) {
1306 FragmentSearch.BondsPerSPCount[i] = 0;
1307 }
1308};
1309
1310/** Free's memory for for UniqueFragments::BondsPerSPList.
1311 * \param *out output stream
1312 * \param Order bond order (limits BFS exploration and "number of digits" in power set generation
1313 * \param FragmentSearch UniqueFragments\
1314 * \sa InitialiseSPList()
1315 */
[e138de]1316void FreeSPList(int Order, struct UniqueFragments &FragmentSearch)
[407536]1317{
[920c70]1318 delete[](FragmentSearch.BondsPerSPCount);
[407536]1319};
1320
1321/** Sets FragmenSearch to initial value.
[14e73a]1322 * Sets UniqueFragments::ShortestPathList entries to zero, UniqueFragments::BondsPerSPCount to zero (except zero level to 1) and
1323 * adds initial bond UniqueFragments::Root to UniqueFragments::Root to UniqueFragments::BondsPerSPList
1324 * \param *out output stream
[cee0b57]1325 * \param Order bond order (limits BFS exploration and "number of digits" in power set generation
[14e73a]1326 * \param FragmentSearch UniqueFragments
1327 * \sa FreeSPList()
[cee0b57]1328 */
[e138de]1329void SetSPList(int Order, struct UniqueFragments &FragmentSearch)
[cee0b57]1330{
1331 // prepare Label and SP arrays of the BFS search
[a479fa]1332 FragmentSearch.ShortestPathList[FragmentSearch.Root->ParticleInfo_nr] = 0;
[cee0b57]1333
1334 // prepare root level (SP = 0) and a loop bond denoting Root
[93d120]1335 for (int i=Order;i--;)
[cee0b57]1336 FragmentSearch.BondsPerSPCount[i] = 0;
1337 FragmentSearch.BondsPerSPCount[0] = 1;
[14e73a]1338 bond *Binder = new bond(FragmentSearch.Root, FragmentSearch.Root);
[03c77c]1339 FragmentSearch.BondsPerSPList[0].push_back(Binder);
[14e73a]1340};
[cee0b57]1341
[14e73a]1342/** Resets UniqueFragments::ShortestPathList and cleans bonds from UniqueFragments::BondsPerSPList.
1343 * \param *out output stream
1344 * \param Order bond order (limits BFS exploration and "number of digits" in power set generation
1345 * \param FragmentSearch UniqueFragments
1346 * \sa InitialiseSPList()
1347 */
[e138de]1348void ResetSPList(int Order, struct UniqueFragments &FragmentSearch)
[14e73a]1349{
[a67d19]1350 DoLog(0) && (Log() << Verbose(0) << "Free'ing all found lists. and resetting index lists" << endl);
[14e73a]1351 for(int i=Order;i--;) {
[a67d19]1352 DoLog(1) && (Log() << Verbose(1) << "Current SP level is " << i << ": ");
[03c77c]1353 for (UniqueFragments::BondsPerSP::const_iterator iter = FragmentSearch.BondsPerSPList[i].begin();
1354 iter != FragmentSearch.BondsPerSPList[i].end();
1355 ++iter) {
[a479fa]1356 // Log() << Verbose(0) << "Removing atom " << Binder->leftatom->ParticleInfo_nr << " and " << Binder->rightatom->ParticleInfo_nr << "." << endl; // make sure numbers are local
1357 FragmentSearch.ShortestPathList[(*iter)->leftatom->ParticleInfo_nr] = -1;
1358 FragmentSearch.ShortestPathList[(*iter)->rightatom->ParticleInfo_nr] = -1;
[14e73a]1359 }
1360 // delete added bonds
[03c77c]1361 for (UniqueFragments::BondsPerSP::iterator iter = FragmentSearch.BondsPerSPList[i].begin();
1362 iter != FragmentSearch.BondsPerSPList[i].end();
1363 ++iter) {
1364 delete(*iter);
1365 }
1366 FragmentSearch.BondsPerSPList[i].clear();
[14e73a]1367 // also start and end node
[a67d19]1368 DoLog(0) && (Log() << Verbose(0) << "cleaned." << endl);
[14e73a]1369 }
1370};
1371
1372
1373/** Fills the Bonds per Shortest Path List and set the vertex labels.
1374 * \param *out output stream
1375 * \param Order bond order (limits BFS exploration and "number of digits" in power set generation
1376 * \param FragmentSearch UniqueFragments
1377 * \param *mol molecule with atoms and bonds
1378 * \param RestrictedKeySet Restricted vertex set to use in context of molecule
1379 */
[e138de]1380void FillSPListandLabelVertices(int Order, struct UniqueFragments &FragmentSearch, molecule *mol, KeySet RestrictedKeySet)
[14e73a]1381{
[cee0b57]1382 // Actually, we should construct a spanning tree vom the root atom and select all edges therefrom and put them into
1383 // according shortest path lists. However, we don't. Rather we fill these lists right away, as they do form a spanning
1384 // tree already sorted into various SP levels. That's why we just do loops over the depth (CurrentSP) and breadth
1385 // (EdgeinSPLevel) of this tree ...
1386 // In another picture, the bonds always contain a direction by rightatom being the one more distant from root and hence
1387 // naturally leftatom forming its predecessor, preventing the BFS"seeker" from continuing in the wrong direction.
[14e73a]1388 int AtomKeyNr = -1;
1389 atom *Walker = NULL;
1390 atom *OtherWalker = NULL;
1391 atom *Predecessor = NULL;
[266237]1392 bond *Binder = NULL;
[a479fa]1393 int RootKeyNr = FragmentSearch.Root->GetTrueFather()->ParticleInfo_nr;
[14e73a]1394 int RemainingWalkers = -1;
1395 int SP = -1;
1396
[a67d19]1397 DoLog(0) && (Log() << Verbose(0) << "Starting BFS analysis ..." << endl);
[cee0b57]1398 for (SP = 0; SP < (Order-1); SP++) {
[a67d19]1399 DoLog(1) && (Log() << Verbose(1) << "New SP level reached: " << SP << ", creating new SP list with " << FragmentSearch.BondsPerSPCount[SP] << " item(s)");
[cee0b57]1400 if (SP > 0) {
[a67d19]1401 DoLog(0) && (Log() << Verbose(0) << ", old level closed with " << FragmentSearch.BondsPerSPCount[SP-1] << " item(s)." << endl);
[cee0b57]1402 FragmentSearch.BondsPerSPCount[SP] = 0;
1403 } else
[a67d19]1404 DoLog(0) && (Log() << Verbose(0) << "." << endl);
[cee0b57]1405
1406 RemainingWalkers = FragmentSearch.BondsPerSPCount[SP];
[03c77c]1407 for (UniqueFragments::BondsPerSP::const_iterator CurrentEdge = FragmentSearch.BondsPerSPList[SP].begin();
1408 CurrentEdge != FragmentSearch.BondsPerSPList[SP].end();
1409 ++CurrentEdge) { /// start till end of this SP level's list
[cee0b57]1410 RemainingWalkers--;
[03c77c]1411 Walker = (*CurrentEdge)->rightatom; // rightatom is always the one more distant
1412 Predecessor = (*CurrentEdge)->leftatom; // ... and leftatom is predecessor
[a479fa]1413 AtomKeyNr = Walker->ParticleInfo_nr;
1414 DoLog(0) && (Log() << Verbose(0) << "Current Walker is: " << *Walker << " with nr " << Walker->ParticleInfo_nr << " and SP of " << SP << ", with " << RemainingWalkers << " remaining walkers on this level." << endl);
[cee0b57]1415 // check for new sp level
1416 // go through all its bonds
[a67d19]1417 DoLog(1) && (Log() << Verbose(1) << "Going through all bonds of Walker." << endl);
[9d83b6]1418 const BondList& ListOfBonds = Walker->getListOfBonds();
1419 for (BondList::const_iterator Runner = ListOfBonds.begin();
1420 Runner != ListOfBonds.end();
1421 ++Runner) {
[266237]1422 OtherWalker = (*Runner)->GetOtherAtom(Walker);
[a479fa]1423 if ((RestrictedKeySet.find(OtherWalker->ParticleInfo_nr) != RestrictedKeySet.end())
[cee0b57]1424 #ifdef ADDHYDROGEN
[83f176]1425 && (OtherWalker->getType()->getAtomicNumber() != 1)
[cee0b57]1426 #endif
1427 ) { // skip hydrogens and restrict to fragment
[a479fa]1428 DoLog(2) && (Log() << Verbose(2) << "Current partner is " << *OtherWalker << " with nr " << OtherWalker->ParticleInfo_nr << " in bond " << *(*Runner) << "." << endl);
[cee0b57]1429 // set the label if not set (and push on root stack as well)
[a479fa]1430 if ((OtherWalker != Predecessor) && (OtherWalker->GetTrueFather()->ParticleInfo_nr > RootKeyNr)) { // only pass through those with label bigger than Root's
1431 FragmentSearch.ShortestPathList[OtherWalker->ParticleInfo_nr] = SP+1;
1432 DoLog(3) && (Log() << Verbose(3) << "Set Shortest Path to " << FragmentSearch.ShortestPathList[OtherWalker->ParticleInfo_nr] << "." << endl);
[cee0b57]1433 // add the bond in between to the SP list
1434 Binder = new bond(Walker, OtherWalker); // create a new bond in such a manner, that bond::rightatom is always the one more distant
[03c77c]1435 FragmentSearch.BondsPerSPList[SP+1].push_back(Binder);
[cee0b57]1436 FragmentSearch.BondsPerSPCount[SP+1]++;
[a67d19]1437 DoLog(3) && (Log() << Verbose(3) << "Added its bond to SP list, having now " << FragmentSearch.BondsPerSPCount[SP+1] << " item(s)." << endl);
[cee0b57]1438 } else {
1439 if (OtherWalker != Predecessor)
[a479fa]1440 DoLog(3) && (Log() << Verbose(3) << "Not passing on, as index of " << *OtherWalker << " " << OtherWalker->GetTrueFather()->ParticleInfo_nr << " is smaller than that of Root " << RootKeyNr << "." << endl);
[cee0b57]1441 else
[a67d19]1442 DoLog(3) && (Log() << Verbose(3) << "This is my predecessor " << *Predecessor << "." << endl);
[cee0b57]1443 }
[e138de]1444 } else Log() << Verbose(2) << "Is not in the restricted keyset or skipping hydrogen " << *OtherWalker << "." << endl;
[cee0b57]1445 }
1446 }
1447 }
[14e73a]1448};
[cee0b57]1449
[14e73a]1450/** prints the Bonds per Shortest Path list in UniqueFragments.
1451 * \param *out output stream
1452 * \param Order bond order (limits BFS exploration and "number of digits" in power set generation
1453 * \param FragmentSearch UniqueFragments
1454 */
[e138de]1455void OutputSPList(int Order, struct UniqueFragments &FragmentSearch)
[14e73a]1456{
[a67d19]1457 DoLog(0) && (Log() << Verbose(0) << "Printing all found lists." << endl);
[cee0b57]1458 for(int i=1;i<Order;i++) { // skip the root edge in the printing
[a67d19]1459 DoLog(1) && (Log() << Verbose(1) << "Current SP level is " << i << "." << endl);
[03c77c]1460 for (UniqueFragments::BondsPerSP::const_iterator Binder = FragmentSearch.BondsPerSPList[i].begin();
1461 Binder != FragmentSearch.BondsPerSPList[i].end();
1462 ++Binder) {
[a67d19]1463 DoLog(2) && (Log() << Verbose(2) << *Binder << endl);
[cee0b57]1464 }
1465 }
[14e73a]1466};
[cee0b57]1467
[14e73a]1468/** Simply counts all bonds in all UniqueFragments::BondsPerSPList lists.
1469 * \param *out output stream
1470 * \param Order bond order (limits BFS exploration and "number of digits" in power set generation
1471 * \param FragmentSearch UniqueFragments
1472 */
[e138de]1473int CountNumbersInBondsList(int Order, struct UniqueFragments &FragmentSearch)
[14e73a]1474{
1475 int SP = -1; // the Root <-> Root edge must be subtracted!
[cee0b57]1476 for(int i=Order;i--;) { // sum up all found edges
[03c77c]1477 for (UniqueFragments::BondsPerSP::const_iterator Binder = FragmentSearch.BondsPerSPList[i].begin();
1478 Binder != FragmentSearch.BondsPerSPList[i].end();
1479 ++Binder) {
[93d120]1480 SP++;
[cee0b57]1481 }
1482 }
[14e73a]1483 return SP;
1484};
1485
1486/** Creates a list of all unique fragments of certain vertex size from a given graph \a Fragment for a given root vertex in the context of \a this molecule.
1487 * -# initialises UniqueFragments structure
1488 * -# fills edge list via BFS
1489 * -# creates the fragment by calling recursive function SPFragmentGenerator with UniqueFragments structure, 0 as
1490 root distance, the edge set, its dimension and the current suborder
1491 * -# Free'ing structure
1492 * Note that we may use the fact that the atoms are SP-ordered on the atomstack. I.e. when popping always the last, we first get all
1493 * with SP of 2, then those with SP of 3, then those with SP of 4 and so on.
1494 * \param *out output stream for debugging
1495 * \param Order bond order (limits BFS exploration and "number of digits" in power set generation
1496 * \param FragmentSearch UniqueFragments structure containing TEFactor, root atom and so on
1497 * \param RestrictedKeySet Restricted vertex set to use in context of molecule
1498 * \return number of inserted fragments
1499 * \note ShortestPathList in FragmentSearch structure is probably due to NumberOfAtomsSPLevel and SP not needed anymore
1500 */
[e138de]1501int molecule::PowerSetGenerator(int Order, struct UniqueFragments &FragmentSearch, KeySet RestrictedKeySet)
[14e73a]1502{
1503 int Counter = FragmentSearch.FragmentCounter; // mark current value of counter
1504
[a67d19]1505 DoLog(0) && (Log() << Verbose(0) << endl);
1506 DoLog(0) && (Log() << Verbose(0) << "Begin of PowerSetGenerator with order " << Order << " at Root " << *FragmentSearch.Root << "." << endl);
[14e73a]1507
[e138de]1508 SetSPList(Order, FragmentSearch);
[14e73a]1509
1510 // do a BFS search to fill the SP lists and label the found vertices
[e138de]1511 FillSPListandLabelVertices(Order, FragmentSearch, this, RestrictedKeySet);
[14e73a]1512
1513 // outputting all list for debugging
[e138de]1514 OutputSPList(Order, FragmentSearch);
[14e73a]1515
1516 // creating fragments with the found edge sets (may be done in reverse order, faster)
[e138de]1517 int SP = CountNumbersInBondsList(Order, FragmentSearch);
[a67d19]1518 DoLog(0) && (Log() << Verbose(0) << "Total number of edges is " << SP << "." << endl);
[cee0b57]1519 if (SP >= (Order-1)) {
1520 // start with root (push on fragment stack)
[a479fa]1521 DoLog(0) && (Log() << Verbose(0) << "Starting fragment generation with " << *FragmentSearch.Root << ", local nr is " << FragmentSearch.Root->ParticleInfo_nr << "." << endl);
[cee0b57]1522 FragmentSearch.FragmentSet->clear();
[a67d19]1523 DoLog(0) && (Log() << Verbose(0) << "Preparing subset for this root and calling generator." << endl);
[14e73a]1524
[cee0b57]1525 // prepare the subset and call the generator
[03c77c]1526 std::vector<bond*> BondsList;
1527 BondsList.resize(FragmentSearch.BondsPerSPCount[0]);
1528 ASSERT(FragmentSearch.BondsPerSPList[0].size() != 0,
1529 "molecule::PowerSetGenerator() - FragmentSearch.BondsPerSPList[0] contains no root bond.");
1530 BondsList[0] = (*FragmentSearch.BondsPerSPList[0].begin()); // on SP level 0 there's only the root bond
[cee0b57]1531
[e138de]1532 SPFragmentGenerator(&FragmentSearch, 0, BondsList, FragmentSearch.BondsPerSPCount[0], Order);
[cee0b57]1533 } else {
[a67d19]1534 DoLog(0) && (Log() << Verbose(0) << "Not enough total number of edges to build " << Order << "-body fragments." << endl);
[cee0b57]1535 }
1536
1537 // as FragmentSearch structure is used only once, we don't have to clean it anymore
1538 // remove root from stack
[a67d19]1539 DoLog(0) && (Log() << Verbose(0) << "Removing root again from stack." << endl);
[a479fa]1540 FragmentSearch.FragmentSet->erase(FragmentSearch.Root->ParticleInfo_nr);
[cee0b57]1541
1542 // free'ing the bonds lists
[e138de]1543 ResetSPList(Order, FragmentSearch);
[cee0b57]1544
1545 // return list
[a67d19]1546 DoLog(0) && (Log() << Verbose(0) << "End of PowerSetGenerator." << endl);
[cee0b57]1547 return (FragmentSearch.FragmentCounter - Counter);
1548};
1549
1550bool KeyCompare::operator() (const KeySet SubgraphA, const KeySet SubgraphB) const
1551{
[e138de]1552 //Log() << Verbose(0) << "my check is used." << endl;
[cee0b57]1553 if (SubgraphA.size() < SubgraphB.size()) {
1554 return true;
1555 } else {
1556 if (SubgraphA.size() > SubgraphB.size()) {
1557 return false;
1558 } else {
1559 KeySet::iterator IteratorA = SubgraphA.begin();
1560 KeySet::iterator IteratorB = SubgraphB.begin();
1561 while ((IteratorA != SubgraphA.end()) && (IteratorB != SubgraphB.end())) {
1562 if ((*IteratorA) < (*IteratorB))
1563 return true;
1564 else if ((*IteratorA) > (*IteratorB)) {
1565 return false;
1566 } // else, go on to next index
1567 IteratorA++;
1568 IteratorB++;
1569 } // end of while loop
1570 }// end of check in case of equal sizes
1571 }
1572 return false; // if we reach this point, they are equal
1573};
1574
1575
[407536]1576/** Combines all KeySets from all orders into single ones (with just unique entries).
1577 * \param *out output stream for debugging
1578 * \param *&FragmentList list to fill
1579 * \param ***FragmentLowerOrdersList
1580 * \param &RootStack stack with all root candidates (unequal to each atom in complete molecule if adaptive scheme is applied)
1581 * \param *mol molecule with atoms and bonds
1582 */
[e138de]1583int CombineAllOrderListIntoOne(Graph *&FragmentList, Graph ***FragmentLowerOrdersList, KeyStack &RootStack, molecule *mol)
[407536]1584{
1585 int RootNr = 0;
1586 int RootKeyNr = 0;
[93d120]1587 int StartNr = 0;
[407536]1588 int counter = 0;
1589 int NumLevels = 0;
1590 atom *Walker = NULL;
1591
[a67d19]1592 DoLog(0) && (Log() << Verbose(0) << "Combining the lists of all orders per order and finally into a single one." << endl);
[407536]1593 if (FragmentList == NULL) {
1594 FragmentList = new Graph;
1595 counter = 0;
1596 } else {
1597 counter = FragmentList->size();
1598 }
[93d120]1599
1600 StartNr = RootStack.back();
1601 do {
[407536]1602 RootKeyNr = RootStack.front();
1603 RootStack.pop_front();
1604 Walker = mol->FindAtom(RootKeyNr);
1605 NumLevels = 1 << (Walker->AdaptiveOrder - 1);
1606 for(int i=0;i<NumLevels;i++) {
1607 if (FragmentLowerOrdersList[RootNr][i] != NULL) {
[e138de]1608 InsertGraphIntoGraph(*FragmentList, (*FragmentLowerOrdersList[RootNr][i]), &counter);
[407536]1609 }
1610 }
[a479fa]1611 RootStack.push_back(Walker->ParticleInfo_nr);
[407536]1612 RootNr++;
[93d120]1613 } while (RootKeyNr != StartNr);
[407536]1614 return counter;
1615};
1616
1617/** Free's memory allocated for all KeySets from all orders.
1618 * \param *out output stream for debugging
1619 * \param ***FragmentLowerOrdersList
1620 * \param &RootStack stack with all root candidates (unequal to each atom in complete molecule if adaptive scheme is applied)
1621 * \param *mol molecule with atoms and bonds
1622 */
[e138de]1623void FreeAllOrdersList(Graph ***FragmentLowerOrdersList, KeyStack &RootStack, molecule *mol)
[407536]1624{
[a67d19]1625 DoLog(1) && (Log() << Verbose(1) << "Free'ing the lists of all orders per order." << endl);
[407536]1626 int RootNr = 0;
1627 int RootKeyNr = 0;
1628 int NumLevels = 0;
1629 atom *Walker = NULL;
1630 while (!RootStack.empty()) {
1631 RootKeyNr = RootStack.front();
1632 RootStack.pop_front();
1633 Walker = mol->FindAtom(RootKeyNr);
1634 NumLevels = 1 << (Walker->AdaptiveOrder - 1);
1635 for(int i=0;i<NumLevels;i++) {
1636 if (FragmentLowerOrdersList[RootNr][i] != NULL) {
1637 delete(FragmentLowerOrdersList[RootNr][i]);
1638 }
1639 }
[920c70]1640 delete[](FragmentLowerOrdersList[RootNr]);
[407536]1641 RootNr++;
1642 }
[920c70]1643 delete[](FragmentLowerOrdersList);
[407536]1644};
1645
1646
[cee0b57]1647/** Performs BOSSANOVA decomposition at selected sites, increasing the cutoff by one at these sites.
1648 * -# constructs a complete keyset of the molecule
1649 * -# In a loop over all possible roots from the given rootstack
1650 * -# increases order of root site
1651 * -# calls PowerSetGenerator with this order, the complete keyset and the rootkeynr
1652 * -# for all consecutive lower levels PowerSetGenerator is called with the suborder, the higher order keyset
1653as the restricted one and each site in the set as the root)
1654 * -# these are merged into a fragment list of keysets
1655 * -# All fragment lists (for all orders, i.e. from all destination fields) are merged into one list for return
1656 * Important only is that we create all fragments, it is not important if we create them more than once
1657 * as these copies are filtered out via use of the hash table (KeySet).
1658 * \param *out output stream for debugging
1659 * \param Fragment&*List list of already present keystacks (adaptive scheme) or empty list
1660 * \param &RootStack stack with all root candidates (unequal to each atom in complete molecule if adaptive scheme is applied)
1661 * \param *MinimumRingSize minimum ring size for each atom (molecule::Atomcount)
1662 * \return pointer to Graph list
1663 */
[e138de]1664void molecule::FragmentBOSSANOVA(Graph *&FragmentList, KeyStack &RootStack, int *MinimumRingSize)
[cee0b57]1665{
1666 Graph ***FragmentLowerOrdersList = NULL;
[407536]1667 int NumLevels = 0;
1668 int NumMolecules = 0;
1669 int TotalNumMolecules = 0;
1670 int *NumMoleculesOfOrder = NULL;
1671 int Order = 0;
[cee0b57]1672 int UpgradeCount = RootStack.size();
1673 KeyStack FragmentRootStack;
[407536]1674 int RootKeyNr = 0;
1675 int RootNr = 0;
[cee0b57]1676 struct UniqueFragments FragmentSearch;
1677
[a67d19]1678 DoLog(0) && (Log() << Verbose(0) << "Begin of FragmentBOSSANOVA." << endl);
[cee0b57]1679
1680 // FragmentLowerOrdersList is a 2D-array of pointer to MoleculeListClass objects, one dimension represents the ANOVA expansion of a single order (i.e. 5)
1681 // with all needed lower orders that are subtracted, the other dimension is the BondOrder (i.e. from 1 to 5)
[920c70]1682 NumMoleculesOfOrder = new int[UpgradeCount];
1683 FragmentLowerOrdersList = new Graph**[UpgradeCount];
1684
1685 for(int i=0;i<UpgradeCount;i++) {
1686 NumMoleculesOfOrder[i] = 0;
1687 FragmentLowerOrdersList[i] = NULL;
1688 }
[cee0b57]1689
1690 // initialise the fragments structure
1691 FragmentSearch.FragmentCounter = 0;
1692 FragmentSearch.FragmentSet = new KeySet;
1693 FragmentSearch.Root = FindAtom(RootKeyNr);
[1024cb]1694 FragmentSearch.ShortestPathList = new int[getAtomCount()];
[ea7176]1695 for (int i=getAtomCount();i--;) {
[cee0b57]1696 FragmentSearch.ShortestPathList[i] = -1;
1697 }
1698
1699 // Construct the complete KeySet which we need for topmost level only (but for all Roots)
1700 KeySet CompleteMolecule;
[9879f6]1701 for (molecule::const_iterator iter = begin(); iter != end(); ++iter) {
[a479fa]1702 CompleteMolecule.insert((*iter)->GetTrueFather()->ParticleInfo_nr);
[cee0b57]1703 }
1704
1705 // this can easily be seen: if Order is 5, then the number of levels for each lower order is the total sum of the number of levels above, as
1706 // each has to be split up. E.g. for the second level we have one from 5th, one from 4th, two from 3th (which in turn is one from 5th, one from 4th),
1707 // hence we have overall four 2th order levels for splitting. This also allows for putting all into a single array (FragmentLowerOrdersList[])
1708 // with the order along the cells as this: 5433222211111111 for BondOrder 5 needing 16=pow(2,5-1) cells (only we use bit-shifting which is faster)
1709 RootNr = 0; // counts through the roots in RootStack
1710 while ((RootNr < UpgradeCount) && (!RootStack.empty())) {
1711 RootKeyNr = RootStack.front();
1712 RootStack.pop_front();
[9879f6]1713 atom *Walker = FindAtom(RootKeyNr);
[cee0b57]1714 // check cyclic lengths
[a479fa]1715 //if ((MinimumRingSize[Walker->GetTrueFather()->ParticleInfo_nr] != -1) && (Walker->GetTrueFather()->AdaptiveOrder+1 > MinimumRingSize[Walker->GetTrueFather()->ParticleInfo_nr])) {
[e138de]1716 // Log() << Verbose(0) << "Bond order " << Walker->GetTrueFather()->AdaptiveOrder << " of Root " << *Walker << " greater than or equal to Minimum Ring size of " << MinimumRingSize << " found is not allowed." << endl;
[cee0b57]1717 //} else
1718 {
1719 // increase adaptive order by one
1720 Walker->GetTrueFather()->AdaptiveOrder++;
1721 Order = Walker->AdaptiveOrder = Walker->GetTrueFather()->AdaptiveOrder;
1722
1723 // initialise Order-dependent entries of UniqueFragments structure
[e138de]1724 InitialiseSPList(Order, FragmentSearch);
[cee0b57]1725
1726 // allocate memory for all lower level orders in this 1D-array of ptrs
1727 NumLevels = 1 << (Order-1); // (int)pow(2,Order);
[920c70]1728 FragmentLowerOrdersList[RootNr] = new Graph*[NumLevels];
1729 for (int i=0;i<NumLevels;i++)
1730 FragmentLowerOrdersList[RootNr][i] = NULL;
[cee0b57]1731
1732 // create top order where nothing is reduced
[a67d19]1733 DoLog(0) && (Log() << Verbose(0) << "==============================================================================================================" << endl);
1734 DoLog(0) && (Log() << Verbose(0) << "Creating KeySets of Bond Order " << Order << " for " << *Walker << ", " << (RootStack.size()-RootNr) << " Roots remaining." << endl); // , NumLevels is " << NumLevels << "
[cee0b57]1735
1736 // Create list of Graphs of current Bond Order (i.e. F_{ij})
1737 FragmentLowerOrdersList[RootNr][0] = new Graph;
1738 FragmentSearch.TEFactor = 1.;
1739 FragmentSearch.Leaflet = FragmentLowerOrdersList[RootNr][0]; // set to insertion graph
1740 FragmentSearch.Root = Walker;
[e138de]1741 NumMoleculesOfOrder[RootNr] = PowerSetGenerator(Walker->AdaptiveOrder, FragmentSearch, CompleteMolecule);
[407536]1742
1743 // output resulting number
[a67d19]1744 DoLog(1) && (Log() << Verbose(1) << "Number of resulting KeySets is: " << NumMoleculesOfOrder[RootNr] << "." << endl);
[cee0b57]1745 if (NumMoleculesOfOrder[RootNr] != 0) {
1746 NumMolecules = 0;
1747 } else {
1748 Walker->GetTrueFather()->MaxOrder = true;
1749 }
1750 // now, we have completely filled each cell of FragmentLowerOrdersList[] for the current Walker->AdaptiveOrder
1751 //NumMoleculesOfOrder[Walker->AdaptiveOrder-1] = NumMolecules;
1752 TotalNumMolecules += NumMoleculesOfOrder[RootNr];
[e138de]1753// Log() << Verbose(1) << "Number of resulting molecules for Order " << (int)Walker->GetTrueFather()->AdaptiveOrder << " is: " << NumMoleculesOfOrder[RootNr] << "." << endl;
[cee0b57]1754 RootStack.push_back(RootKeyNr); // put back on stack
1755 RootNr++;
1756
1757 // free Order-dependent entries of UniqueFragments structure for next loop cycle
[e138de]1758 FreeSPList(Order, FragmentSearch);
[cee0b57]1759 }
1760 }
[a67d19]1761 DoLog(0) && (Log() << Verbose(0) << "==============================================================================================================" << endl);
1762 DoLog(1) && (Log() << Verbose(1) << "Total number of resulting molecules is: " << TotalNumMolecules << "." << endl);
1763 DoLog(0) && (Log() << Verbose(0) << "==============================================================================================================" << endl);
[cee0b57]1764
1765 // cleanup FragmentSearch structure
[920c70]1766 delete[](FragmentSearch.ShortestPathList);
[cee0b57]1767 delete(FragmentSearch.FragmentSet);
1768
1769 // now, FragmentLowerOrdersList is complete, it looks - for BondOrder 5 - as this (number is the ANOVA Order of the terms therein)
1770 // 5433222211111111
1771 // 43221111
1772 // 3211
1773 // 21
1774 // 1
1775
1776 // Subsequently, we combine all into a single list (FragmentList)
[e138de]1777 CombineAllOrderListIntoOne(FragmentList, FragmentLowerOrdersList, RootStack, this);
1778 FreeAllOrdersList(FragmentLowerOrdersList, RootStack, this);
[920c70]1779 delete[](NumMoleculesOfOrder);
[cee0b57]1780
[a67d19]1781 DoLog(0) && (Log() << Verbose(0) << "End of FragmentBOSSANOVA." << endl);
[cee0b57]1782};
1783
1784/** Corrects the nuclei position if the fragment was created over the cell borders.
1785 * Scans all bonds, checks the distance, if greater than typical, we have a candidate for the correction.
1786 * We remove the bond whereafter the graph probably separates. Then, we translate the one component periodically
1787 * and re-add the bond. Looping on the distance check.
1788 * \param *out ofstream for debugging messages
1789 */
[3c58f8]1790bool molecule::ScanForPeriodicCorrection()
[cee0b57]1791{
1792 bond *Binder = NULL;
[03c77c]1793 //bond *OtherBinder = NULL;
[cee0b57]1794 atom *Walker = NULL;
1795 atom *OtherWalker = NULL;
[cca9ef]1796 RealSpaceMatrix matrix = World::getInstance().getDomain().getM();
[cee0b57]1797 enum Shading *ColorList = NULL;
1798 double tmp;
[03c77c]1799 //bool LastBond = true; // only needed to due list construct
[cee0b57]1800 Vector Translationvector;
[a564be]1801 //std::deque<atom *> *CompStack = NULL;
1802 std::deque<atom *> *AtomStack = new std::deque<atom *>; // (getAtomCount());
[cee0b57]1803 bool flag = true;
1804
[a67d19]1805 DoLog(2) && (Log() << Verbose(2) << "Begin of ScanForPeriodicCorrection." << endl);
[cee0b57]1806
[1024cb]1807 ColorList = new enum Shading[getAtomCount()];
1808 for (int i=0;i<getAtomCount();i++)
[920c70]1809 ColorList[i] = (enum Shading)0;
[3c58f8]1810 if (flag) {
[cee0b57]1811 // remove bonds that are beyond bonddistance
[d4c9ae]1812 Translationvector.Zero();
[cee0b57]1813 // scan all bonds
1814 flag = false;
[9d83b6]1815 for(molecule::iterator AtomRunner = begin(); (!flag) && (AtomRunner != end()); ++AtomRunner) {
1816 const BondList& ListOfBonds = (*AtomRunner)->getListOfBonds();
1817 for(BondList::const_iterator BondRunner = ListOfBonds.begin();
1818 (!flag) && (BondRunner != ListOfBonds.end());
1819 ++BondRunner) {
[e08c46]1820 Binder = (*BondRunner);
1821 for (int i=NDIM;i--;) {
[d74077]1822 tmp = fabs(Binder->leftatom->at(i) - Binder->rightatom->at(i));
[e08c46]1823 //Log() << Verbose(3) << "Checking " << i << "th distance of " << *Binder->leftatom << " to " << *Binder->rightatom << ": " << tmp << "." << endl;
1824 if (tmp > BondDistance) {
1825 DoLog(2) && (Log() << Verbose(2) << "Correcting at bond " << *Binder << "." << endl);
1826 flag = true;
1827 break;
1828 }
[cee0b57]1829 }
1830 }
[9d83b6]1831 }
[3c58f8]1832 //if (flag) {
1833 if (0) {
[cee0b57]1834 // create translation vector from their periodically modified distance
1835 for (int i=NDIM;i--;) {
[d74077]1836 tmp = Binder->leftatom->at(i) - Binder->rightatom->at(i);
[cee0b57]1837 if (fabs(tmp) > BondDistance)
[0a4f7f]1838 Translationvector[i] = (tmp < 0) ? +1. : -1.;
[cee0b57]1839 }
[5108e1]1840 Translationvector *= matrix;
[e138de]1841 //Log() << Verbose(3) << "Translation vector is ";
[0a4f7f]1842 Log() << Verbose(0) << Translationvector << endl;
[cee0b57]1843 // apply to all atoms of first component via BFS
[ea7176]1844 for (int i=getAtomCount();i--;)
[cee0b57]1845 ColorList[i] = white;
[a564be]1846 AtomStack->push_front(Binder->leftatom);
1847 while (!AtomStack->empty()) {
1848 Walker = AtomStack->front();
1849 AtomStack->pop_front();
[e138de]1850 //Log() << Verbose (3) << "Current Walker is: " << *Walker << "." << endl;
[a479fa]1851 ColorList[Walker->ParticleInfo_nr] = black; // mark as explored
[d74077]1852 *Walker += Translationvector; // translate
[9d83b6]1853 const BondList& ListOfBonds = Walker->getListOfBonds();
1854 for (BondList::const_iterator Runner = ListOfBonds.begin();
1855 Runner != ListOfBonds.end();
1856 ++Runner) {
[266237]1857 if ((*Runner) != Binder) {
1858 OtherWalker = (*Runner)->GetOtherAtom(Walker);
[a479fa]1859 if (ColorList[OtherWalker->ParticleInfo_nr] == white) {
[a564be]1860 AtomStack->push_front(OtherWalker); // push if yet unexplored
[cee0b57]1861 }
1862 }
1863 }
1864 }
[03c77c]1865// // re-add bond
1866// if (OtherBinder == NULL) { // is the only bond?
1867// //Do nothing
1868// } else {
1869// if (!LastBond) {
1870// link(Binder, OtherBinder); // no more implemented bond::previous ...
1871// } else {
1872// link(OtherBinder, Binder); // no more implemented bond::previous ...
1873// }
1874// }
[cee0b57]1875 } else {
[a67d19]1876 DoLog(3) && (Log() << Verbose(3) << "No corrections for this fragment." << endl);
[cee0b57]1877 }
1878 //delete(CompStack);
1879 }
1880 // free allocated space from ReturnFullMatrixforSymmetric()
1881 delete(AtomStack);
[920c70]1882 delete[](ColorList);
[a67d19]1883 DoLog(2) && (Log() << Verbose(2) << "End of ScanForPeriodicCorrection." << endl);
[3c58f8]1884
1885 return flag;
[cee0b57]1886};
Note: See TracBrowser for help on using the repository browser.