| [13a953] | 1 | /*
 | 
|---|
 | 2 |  * Project: MoleCuilder
 | 
|---|
 | 3 |  * Description: creates and alters molecular systems
 | 
|---|
| [0aa122] | 4 |  * Copyright (C)  2010-2012 University of Bonn. All rights reserved.
 | 
|---|
| [94d5ac6] | 5 |  * 
 | 
|---|
 | 6 |  *
 | 
|---|
 | 7 |  *   This file is part of MoleCuilder.
 | 
|---|
 | 8 |  *
 | 
|---|
 | 9 |  *    MoleCuilder is free software: you can redistribute it and/or modify
 | 
|---|
 | 10 |  *    it under the terms of the GNU General Public License as published by
 | 
|---|
 | 11 |  *    the Free Software Foundation, either version 2 of the License, or
 | 
|---|
 | 12 |  *    (at your option) any later version.
 | 
|---|
 | 13 |  *
 | 
|---|
 | 14 |  *    MoleCuilder is distributed in the hope that it will be useful,
 | 
|---|
 | 15 |  *    but WITHOUT ANY WARRANTY; without even the implied warranty of
 | 
|---|
 | 16 |  *    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | 
|---|
 | 17 |  *    GNU General Public License for more details.
 | 
|---|
 | 18 |  *
 | 
|---|
 | 19 |  *    You should have received a copy of the GNU General Public License
 | 
|---|
 | 20 |  *    along with MoleCuilder.  If not, see <http://www.gnu.org/licenses/>.
 | 
|---|
| [13a953] | 21 |  */
 | 
|---|
 | 22 | 
 | 
|---|
 | 23 | /*
 | 
|---|
 | 24 |  * CheckAgainstAdjacencyFile.cpp
 | 
|---|
 | 25 |  *
 | 
|---|
 | 26 |  *  Created on: Mar 3, 2011
 | 
|---|
 | 27 |  *      Author: heber
 | 
|---|
 | 28 |  */
 | 
|---|
 | 29 | 
 | 
|---|
 | 30 | // include config.h
 | 
|---|
 | 31 | #ifdef HAVE_CONFIG_H
 | 
|---|
 | 32 | #include <config.h>
 | 
|---|
 | 33 | #endif
 | 
|---|
 | 34 | 
 | 
|---|
 | 35 | #include "CodePatterns/MemDebug.hpp"
 | 
|---|
 | 36 | 
 | 
|---|
#include <iostream>
#include <map>
#include <set>
#include <sstream>
#include <string>
#include <utility>
 | 
|---|
| [13a953] | 41 | 
 | 
|---|
 | 42 | #include "CheckAgainstAdjacencyFile.hpp"
 | 
|---|
 | 43 | 
 | 
|---|
| [6f0841] | 44 | #include "Atom/atom.hpp"
 | 
|---|
| [13a953] | 45 | #include "Bond/bond.hpp"
 | 
|---|
 | 46 | #include "CodePatterns/Assert.hpp"
 | 
|---|
| [255829] | 47 | #include "CodePatterns/Log.hpp"
 | 
|---|
| [ec87e4] | 48 | #include "CodePatterns/Range.hpp"
 | 
|---|
 | 49 | #include "Descriptors/AtomIdDescriptor.hpp"
 | 
|---|
| [255829] | 50 | #include "Helpers/defs.hpp"
 | 
|---|
| [ec87e4] | 51 | #include "World.hpp"
 | 
|---|
| [13a953] | 52 | 
 | 
|---|
| [3501d2] | 53 | /** Constructor of class CheckAgainstAdjacencyFile.
 | 
|---|
 | 54 |  *
 | 
|---|
 | 55 |  * \param File file to parser
 | 
|---|
 | 56 |  */
 | 
|---|
 | 57 | CheckAgainstAdjacencyFile::CheckAgainstAdjacencyFile(std::istream &File) :
 | 
|---|
| [13a953] | 58 |   NonMatchNumber(0)
 | 
|---|
 | 59 | {
 | 
|---|
| [06f41f3] | 60 |   bool status = ParseInInternalMap(File);
 | 
|---|
 | 61 |   if (!status) // remove map if failed to parse
 | 
|---|
 | 62 |     InternalAtomBondMap.clear();
 | 
|---|
| [13a953] | 63 | }
 | 
|---|
 | 64 | 
 | 
|---|
 | 65 | CheckAgainstAdjacencyFile::~CheckAgainstAdjacencyFile()
 | 
|---|
| [06f41f3] | 66 | {}
 | 
|---|
| [13a953] | 67 | 
 | 
|---|
| [ec87e4] | 68 | /** Parses the bond partners of each atom from an external file into \a AtomBondMap.
 | 
|---|
 | 69 |  *
 | 
|---|
 | 70 |  * @param File file to parse
 | 
|---|
 | 71 |  * @return true - everything ok, false - error while parsing
 | 
|---|
| [13a953] | 72 |  */
 | 
|---|
| [06f41f3] | 73 | bool CheckAgainstAdjacencyFile::ParseInInternalMap(std::istream &File)
 | 
|---|
| [13a953] | 74 | {
 | 
|---|
 | 75 |   if (File.fail()) {
 | 
|---|
 | 76 |     LOG(1, "STATUS: Adjacency file not found." << endl);
 | 
|---|
 | 77 |     return false;
 | 
|---|
 | 78 |   }
 | 
|---|
 | 79 | 
 | 
|---|
| [06f41f3] | 80 |   InternalAtomBondMap.clear();
 | 
|---|
| [13a953] | 81 |   char buffer[MAXSTRINGSIZE];
 | 
|---|
 | 82 |   int tmp;
 | 
|---|
 | 83 |   // Parse the file line by line and count the bonds
 | 
|---|
 | 84 |   while (!File.eof()) {
 | 
|---|
 | 85 |     File.getline(buffer, MAXSTRINGSIZE);
 | 
|---|
 | 86 |     stringstream line;
 | 
|---|
 | 87 |     line.str(buffer);
 | 
|---|
 | 88 |     int AtomNr = -1;
 | 
|---|
 | 89 |     line >> AtomNr;
 | 
|---|
 | 90 |     // parse into structure
 | 
|---|
| [52ed5b] | 91 |     if (AtomNr > 0) {
 | 
|---|
 | 92 |       const atom *Walker = World::getInstance().getAtom(AtomById(AtomNr-1));
 | 
|---|
| [ec87e4] | 93 |       if (Walker == NULL)
 | 
|---|
 | 94 |         return false;
 | 
|---|
| [06f41f3] | 95 |       const atomId_t WalkerId = Walker->getId();
 | 
|---|
| [ec87e4] | 96 |       // parse bond partner ids associated to AtomNr
 | 
|---|
| [13a953] | 97 |       while (line >> ws >> tmp) {
 | 
|---|
| [06f41f3] | 98 |         LOG(3, "INFO: Recognized bond partner " << tmp-1 << " for " << WalkerId << ".");
 | 
|---|
 | 99 |         InternalAtomBondMap.insert( std::make_pair(WalkerId, tmp-1) );
 | 
|---|
| [13a953] | 100 |       }
 | 
|---|
 | 101 |     } else {
 | 
|---|
| [ec87e4] | 102 |       if (AtomNr != -1) {
 | 
|---|
| [13a953] | 103 |         ELOG(2, AtomNr << " is negative.");
 | 
|---|
| [ec87e4] | 104 |         return false;
 | 
|---|
 | 105 |       }
 | 
|---|
 | 106 |     }
 | 
|---|
 | 107 |   }
 | 
|---|
 | 108 |   return true;
 | 
|---|
 | 109 | }
 | 
|---|
 | 110 | 
 | 
|---|
 | 111 | /** Fills the InternalAtomBondMap from the atoms given by the two iterators.
 | 
|---|
 | 112 |  *
 | 
|---|
| [06f41f3] | 113 |  * @param atomids set of atomic ids to check (must be global ids, i.e. from atom::getId())
 | 
|---|
| [ec87e4] | 114 |  */
 | 
|---|
| [06f41f3] | 115 | void CheckAgainstAdjacencyFile::CreateExternalMap(const atomids_t &atomids)
 | 
|---|
| [ec87e4] | 116 | {
 | 
|---|
| [06f41f3] | 117 |   ExternalAtomBondMap.clear();
 | 
|---|
| [ec87e4] | 118 |   // go through each atom in the list
 | 
|---|
| [06f41f3] | 119 |   for (atomids_t::const_iterator iter = atomids.begin(); iter != atomids.end(); ++iter) {
 | 
|---|
 | 120 |     const atomId_t WalkerId = *iter;
 | 
|---|
| [ec87e4] | 121 |     ASSERT(WalkerId != (size_t)-1,
 | 
|---|
| [06f41f3] | 122 |         "CheckAgainstAdjacencyFile::CreateExternalMap() - Walker has no id.");
 | 
|---|
 | 123 |     const atom *Walker = World::getInstance().getAtom(AtomById(WalkerId));
 | 
|---|
 | 124 |     ASSERT( Walker != NULL,
 | 
|---|
 | 125 |         "CheckAgainstAdjacencyFile::CreateExternalMap() - Walker id "+toString(*iter)
 | 
|---|
 | 126 |         +" is not associated to any of World's atoms.");
 | 
|---|
| [ec87e4] | 127 |     const BondList& ListOfBonds = Walker->getListOfBonds();
 | 
|---|
 | 128 |     // go through each of its bonds
 | 
|---|
 | 129 |     for (BondList::const_iterator Runner = ListOfBonds.begin();
 | 
|---|
 | 130 |         Runner != ListOfBonds.end();
 | 
|---|
 | 131 |         ++Runner) {
 | 
|---|
 | 132 |       const atomId_t id = (*Runner)->GetOtherAtom(Walker)->getId();
 | 
|---|
 | 133 |       ASSERT(id != (size_t)-1,
 | 
|---|
| [06f41f3] | 134 |           "CheckAgainstAdjacencyFile::CreateExternalMap() - OtherAtom has not id.");
 | 
|---|
 | 135 |       ExternalAtomBondMap.insert( std::make_pair(WalkerId, id) );
 | 
|---|
| [13a953] | 136 |     }
 | 
|---|
 | 137 |   }
 | 
|---|
| [ec87e4] | 138 | }
 | 
|---|
 | 139 | 
 | 
|---|
 | 140 | /** Checks contents of adjacency file against bond structure in structure molecule.
 | 
|---|
 | 141 |  * \return true - structure is equal, false - not equivalence
 | 
|---|
 | 142 |  */
 | 
|---|
| [06f41f3] | 143 | bool CheckAgainstAdjacencyFile::operator()(const atomids_t &atomids)
 | 
|---|
| [ec87e4] | 144 | {
 | 
|---|
| [06f41f3] | 145 |   LOG(0, "STATUS: Looking at bond structure of given ids and comparing against stored in adjacency file... ");
 | 
|---|
| [ec87e4] | 146 | 
 | 
|---|
| [06f41f3] | 147 |   // parse in external map
 | 
|---|
 | 148 |   CreateExternalMap(atomids);
 | 
|---|
| [13a953] | 149 | 
 | 
|---|
| [06f41f3] | 150 |   bool status = CompareInternalExternalMap();
 | 
|---|
| [13a953] | 151 |   if (status) { // if equal we parse the KeySetFile
 | 
|---|
 | 152 |     LOG(0, "STATUS: Equal.");
 | 
|---|
 | 153 |   } else
 | 
|---|
 | 154 |     LOG(0, "STATUS: Not equal by " << NonMatchNumber << " atoms.");
 | 
|---|
 | 155 |   return status;
 | 
|---|
 | 156 | }
 | 
|---|
| [ec87e4] | 157 | 
 | 
|---|
| [42c9e2] | 158 | CheckAgainstAdjacencyFile::KeysSet CheckAgainstAdjacencyFile::getKeys(const CheckAgainstAdjacencyFile::AtomBondRange &_range) const
 | 
|---|
| [ec87e4] | 159 | {
 | 
|---|
| [42c9e2] | 160 |   KeysSet Keys;
 | 
|---|
 | 161 |   for (AtomBondMap::const_iterator iter = _range.first;
 | 
|---|
| [ec87e4] | 162 |       iter != _range.second;
 | 
|---|
 | 163 |       ++iter) {
 | 
|---|
 | 164 |     Keys.insert( iter->first );
 | 
|---|
 | 165 |   }
 | 
|---|
 | 166 |   return Keys;
 | 
|---|
 | 167 | }
 | 
|---|
 | 168 | 
 | 
|---|
| [42c9e2] | 169 | CheckAgainstAdjacencyFile::ValuesSet CheckAgainstAdjacencyFile::getValues(const CheckAgainstAdjacencyFile::AtomBondRange&_range) const
 | 
|---|
| [ec87e4] | 170 | {
 | 
|---|
| [42c9e2] | 171 |   ValuesSet Values;
 | 
|---|
 | 172 |   for (AtomBondMap::const_iterator iter = _range.first;
 | 
|---|
| [ec87e4] | 173 |       iter != _range.second;
 | 
|---|
 | 174 |       ++iter) {
 | 
|---|
 | 175 |     Values.insert( iter->second );
 | 
|---|
 | 176 |   }
 | 
|---|
 | 177 |   return Values;
 | 
|---|
 | 178 | }
 | 
|---|
 | 179 | 
 | 
|---|
/** Counts the number of items in the first set that are not present in the second set.
 *
 * Both containers are walked in parallel, hence this takes a number of steps
 * linear in the sum of both sizes.
 *
 * \note We assume that both sets are sorted in ascending order.
 *
 * @param firstset check set
 * @param secondset reference set
 * @return number of items in the first set that are missing in the second
 */
template <class T>
size_t getMissingItems(const T &firstset, const T &secondset)
{
  size_t Mismatch = 0;
  typename T::const_iterator firstiter = firstset.begin();
  typename T::const_iterator seconditer = secondset.begin();
  while ((firstiter != firstset.end()) && (seconditer != secondset.end())) {
    if (*firstiter > *seconditer) {
      // reference item is smaller: it cannot match any remaining check item
      ++seconditer;
    } else {
      // a smaller check item has no partner in the reference set, an equal one has
      if (*firstiter < *seconditer)
        ++Mismatch;
      ++firstiter;
    }
  }
  // Reference set is exhausted: every check item still left is larger than
  // all reference items and therefore missing as well.
  for (; firstiter != firstset.end(); ++firstiter)
    ++Mismatch;
  return Mismatch;
}
 | 
|---|
 | 205 | 
 | 
|---|
 | 206 | /** Compares InternalAtomBondMap and ExternalAtomBondMap and sets NonMatchNumber.
 | 
|---|
 | 207 |  *
 | 
|---|
 | 208 |  * @return true - both maps are the same, false - both maps diverge by NonMatchNumber counts.
 | 
|---|
 | 209 |  */
 | 
|---|
 | 210 | bool CheckAgainstAdjacencyFile::CompareInternalExternalMap()
 | 
|---|
 | 211 | {
 | 
|---|
 | 212 |   NonMatchNumber = 0;
 | 
|---|
 | 213 |   // extract keys and check whether they match
 | 
|---|
 | 214 |   const AtomBondRange Intrange(InternalAtomBondMap.begin(), InternalAtomBondMap.end());
 | 
|---|
 | 215 |   const AtomBondRange Extrange(ExternalAtomBondMap.begin(), ExternalAtomBondMap.end());
 | 
|---|
| [42c9e2] | 216 |   KeysSet InternalKeys( getKeys(Intrange) );
 | 
|---|
 | 217 |   KeysSet ExternalKeys( getKeys(Extrange) );
 | 
|---|
| [ec87e4] | 218 | 
 | 
|---|
 | 219 | //  std::cout << "InternalKeys: " << InternalKeys << std::endl;
 | 
|---|
 | 220 | //  std::cout << "ExternalKeys: " << ExternalKeys << std::endl;
 | 
|---|
 | 221 | 
 | 
|---|
 | 222 |   // check for same amount of keys
 | 
|---|
| [06f41f3] | 223 |   if (ExternalKeys.size() > InternalKeys.size()) {
 | 
|---|
 | 224 |     NonMatchNumber = (int)ExternalKeys.size() - (int)InternalKeys.size();
 | 
|---|
 | 225 |     LOG(2, "INFO: Number of external keys exceeds internal one by " << NonMatchNumber << ".");
 | 
|---|
| [ec87e4] | 226 |     return false;
 | 
|---|
 | 227 |   }
 | 
|---|
 | 228 | 
 | 
|---|
| [06f41f3] | 229 |   // check which keys are missing in the internal set
 | 
|---|
 | 230 |   NonMatchNumber = getMissingItems(ExternalKeys, InternalKeys);
 | 
|---|
| [ec87e4] | 231 | 
 | 
|---|
 | 232 |   if (NonMatchNumber != 0) {
 | 
|---|
 | 233 |     LOG(2, "INFO: " << NonMatchNumber << " keys are not the same.");
 | 
|---|
 | 234 |     return false;
 | 
|---|
 | 235 |   }
 | 
|---|
 | 236 | 
 | 
|---|
 | 237 |   // now check each map per key
 | 
|---|
| [06f41f3] | 238 |   for (KeysSet::const_iterator keyIter = ExternalKeys.begin();
 | 
|---|
 | 239 |       keyIter != ExternalKeys.end();
 | 
|---|
| [ec87e4] | 240 |       ++keyIter) {
 | 
|---|
 | 241 | //    std::cout << "Current key is " << *keyIter << std::endl;
 | 
|---|
 | 242 |     const AtomBondRange IntRange( InternalAtomBondMap.equal_range(*keyIter) );
 | 
|---|
 | 243 |     const AtomBondRange ExtRange( ExternalAtomBondMap.equal_range(*keyIter) );
 | 
|---|
| [42c9e2] | 244 |     ValuesSet InternalValues( getValues(IntRange) );
 | 
|---|
 | 245 |     ValuesSet ExternalValues( getValues(ExtRange) );
 | 
|---|
| [06f41f3] | 246 |     // throw out all values not present in ExternalKeys
 | 
|---|
 | 247 |     ValuesSet ExternalValues_temp( ExternalValues );
 | 
|---|
 | 248 |     for(KeysSet::const_iterator iter = ExternalKeys.begin();
 | 
|---|
 | 249 |         iter != ExternalKeys.end(); ++iter)
 | 
|---|
 | 250 |       ExternalValues_temp.erase(*iter);
 | 
|---|
 | 251 |     // all remaining values must be masked out
 | 
|---|
 | 252 |     for (ValuesSet::const_iterator iter = ExternalValues_temp.begin();
 | 
|---|
 | 253 |         iter != ExternalValues_temp.end(); ++iter)
 | 
|---|
 | 254 |       ExternalValues.erase(*iter);
 | 
|---|
| [ec87e4] | 255 | //    std::cout << "InternalValues: " << InternalValues << std::endl;
 | 
|---|
 | 256 | //    std::cout << "ExternalValues: " << ExternalValues << std::endl;
 | 
|---|
| [06f41f3] | 257 |     NonMatchNumber += getMissingItems(ExternalValues, InternalValues);
 | 
|---|
| [ec87e4] | 258 |   }
 | 
|---|
 | 259 |   if (NonMatchNumber != 0) {
 | 
|---|
 | 260 |     LOG(2, "INFO: " << NonMatchNumber << " keys are not the same.");
 | 
|---|
 | 261 |     return false;
 | 
|---|
 | 262 |   } else {
 | 
|---|
 | 263 |     LOG(2, "INFO: All keys are the same.");
 | 
|---|
 | 264 |     return true;
 | 
|---|
 | 265 |   }
 | 
|---|
 | 266 | }
 | 
|---|