1 | /*
|
---|
2 | * Project: MoleCuilder
|
---|
3 | * Description: creates and alters molecular systems
|
---|
4 | * Copyright (C) 2012 University of Bonn. All rights reserved.
|
---|
5 | *
|
---|
6 | *
|
---|
7 | * This file is part of MoleCuilder.
|
---|
8 | *
|
---|
9 | * MoleCuilder is free software: you can redistribute it and/or modify
|
---|
10 | * it under the terms of the GNU General Public License as published by
|
---|
11 | * the Free Software Foundation, either version 2 of the License, or
|
---|
12 | * (at your option) any later version.
|
---|
13 | *
|
---|
14 | * MoleCuilder is distributed in the hope that it will be useful,
|
---|
15 | * but WITHOUT ANY WARRANTY; without even the implied warranty of
|
---|
16 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
---|
17 | * GNU General Public License for more details.
|
---|
18 | *
|
---|
19 | * You should have received a copy of the GNU General Public License
|
---|
20 | * along with MoleCuilder. If not, see <http://www.gnu.org/licenses/>.
|
---|
21 | */
|
---|
22 |
|
---|
23 | /*
|
---|
24 | * SubsetMap.cpp
|
---|
25 | *
|
---|
26 | * Created on: Jul 3, 2012
|
---|
27 | * Author: heber
|
---|
28 | */
|
---|
29 |
|
---|
30 |
|
---|
31 | // include config.h
|
---|
32 | #ifdef HAVE_CONFIG_H
|
---|
33 | #include <config.h>
|
---|
34 | #endif
|
---|
35 |
|
---|
36 | #include "CodePatterns/MemDebug.hpp"
|
---|
37 |
|
---|
38 | #include "SubsetMap.hpp"
|
---|
39 |
|
---|
40 | #include <boost/bind.hpp>
|
---|
41 | #include <boost/foreach.hpp>
|
---|
42 | #include <algorithm>
|
---|
43 | #include <bitset>
|
---|
44 | #include <set>
|
---|
45 |
|
---|
46 | #include "CodePatterns/Log.hpp"
|
---|
47 |
|
---|
48 | SubsetMap::SubsetMap(IndexSetContainer &_container) :
|
---|
49 | tempset(new IndexSet())
|
---|
50 | {
|
---|
51 | const IndexSetContainer::Container_t &container = _container.getContainer();
|
---|
52 |
|
---|
53 | // we don't need this level-wise sorting as this is automatically achieved by specific sorting
|
---|
54 | // /// place in level-wise multimap
|
---|
55 | // typedef size_t level_t;
|
---|
56 | // // note: We use an IndexSetContainer as it is not accessed while filling it
|
---|
57 | // // also, as insert uses push_back, the IndexSetContainer is actually created
|
---|
58 | // // as sorted. Hence, the call to sort() just needs linear time (and does
|
---|
59 | // // nothing)
|
---|
60 | // typedef std::map<level_t, IndexSetContainer > IndexSetPerLevel_t;
|
---|
61 | // IndexSetPerLevel_t IndexSetPerLevel;
|
---|
62 | // for(IndexSetContainer::Container_t::const_iterator iter = container.begin();
|
---|
63 | // iter != container.end(); ++iter) {
|
---|
64 | // // key present in map?
|
---|
65 | // const size_t level = (*iter)->size();
|
---|
66 | // LOG(1, "INFO: Current set is " << **iter << " with size " << level << ".");
|
---|
67 | // IndexSetPerLevel_t::iterator leveliter = IndexSetPerLevel.find(level);
|
---|
68 | // // we have to explicitly copy the shared_ptr for insertion due to const container
|
---|
69 | // IndexSet_ptr ptr(*iter);
|
---|
70 | // if (leveliter == IndexSetPerLevel.end()) {
|
---|
71 | // LOG(2, "DEBUG: Level not present in Lookup, creating new container");
|
---|
72 | // IndexSetPerLevel.insert( std::make_pair( level, IndexSetContainer(ptr)) );
|
---|
73 | // } else {
|
---|
74 | // LOG(2, "DEBUG: Level present in Lookup, appending to container");
|
---|
75 | // leveliter->second.insert(ptr);
|
---|
76 | // }
|
---|
77 | // }
|
---|
78 |
|
---|
79 | /// go through all IndexSets
|
---|
80 | std::for_each( container.begin(), container.end(),
|
---|
81 | boost::bind(&SubsetMap::gatherSubsets, this, _1));
|
---|
82 | }
|
---|
83 |
|
---|
84 | void SubsetMap::gatherSubsets(const IndexSet_ptr &ptr) {
|
---|
85 | // get the sets size and the size of the power sets
|
---|
86 | const size_t SetSize = ptr->size();
|
---|
87 | LOG(1, "INFO: Current set to gather all subsets for is " << *ptr << " with size " << SetSize << ".");
|
---|
88 | const size_t NoPowerSubsets = getNoPowerSets(SetSize);
|
---|
89 | LOG(1, "INFO: There are " << NoPowerSubsets << " sets to check for containment.");
|
---|
90 | std::vector<IndexSet> returnsets;
|
---|
91 | // sets is the number of possible subsets to check: NotContained means still
|
---|
92 | // needs check or is not contained; Contained means is contained, or has
|
---|
93 | // already been treated via a super(sub)set.
|
---|
94 | typedef std::vector<enum ContainedState> StateOfSubsets;
|
---|
95 | StateOfSubsets sets( NoPowerSubsets, NotContained);
|
---|
96 | // we have to traverse backwards, i.e. from greatest subsets to smallest to
|
---|
97 | // make the best possible use of the subset knowledge we already have for these
|
---|
98 | // subsets of the subset.
|
---|
99 | // WARNING: last set is the set itself which must not be in IndexSetContainer due to
|
---|
100 | // cyclic structure which shared_ptr cannot resolve.
|
---|
101 | StateOfSubsets::reverse_iterator iter = sets.rbegin()+1;
|
---|
102 | for (;iter != sets.rend(); iter = std::find(iter+1, sets.rend(), NotContained)) {
|
---|
103 | // get IndexSet (get index via distance)
|
---|
104 | // NOTE: reverse iterator naturally give reverse distance, hence flip both arguments
|
---|
105 | // also, reverse iterator is off by one, see ASSERT
|
---|
106 | const size_t index = std::distance(iter, sets.rend())-1;
|
---|
107 | ASSERT( sets.at(index) == *iter,
|
---|
108 | "SubsetMap::gatherSubsets() - distance from begin to iterator is not correct.");
|
---|
109 | *tempset = getSubset(*ptr, index );
|
---|
110 | LOG(2, "INFO: Current subset is " << *tempset << " at " << index << ".");
|
---|
111 | // check whether IndexSet is contained and known
|
---|
112 | if (ptr->contains(*tempset)) {
|
---|
113 | // mark as contained
|
---|
114 | *iter = Contained;
|
---|
115 | LOG(3, "DEBUG: Marking subset as Contained.");
|
---|
116 | if (Lookup.count(tempset)) {
|
---|
117 | LOG(2, "DEBUG: Subset is present in Lookup, adding.");
|
---|
118 | returnsets.push_back(*tempset);
|
---|
119 | // if so, also add its contained sets and mark them out
|
---|
120 | const IndexSetContainer::Container_t &container = getSubsets(tempset)->getContainer();
|
---|
121 | if (container.size()) {
|
---|
122 | LOG(2, "DEBUG: Subset is also present in Lookup, adding all its subsets");
|
---|
123 | for(IndexSetContainer::Container_t::const_iterator containeriter = container.begin();
|
---|
124 | containeriter != container.end();
|
---|
125 | ++containeriter) {
|
---|
126 | const size_t subindex = getPowerSetIndex(ptr, **containeriter);
|
---|
127 | LOG(4, "INFO: Current subset of subset is " << **containeriter << " at " << subindex << ".");
|
---|
128 | if (sets[subindex] != Contained) {
|
---|
129 | LOG(5, "DEBUG: Setting power subset to Contained.");
|
---|
130 | sets[subindex] = Contained;
|
---|
131 | returnsets.push_back(**containeriter);
|
---|
132 | }
|
---|
133 | }
|
---|
134 | }
|
---|
135 | }
|
---|
136 | }
|
---|
137 | }
|
---|
138 | LOG(1, "INFO: Adding " << returnsets.size() << " sets to Lookup for set " << *ptr << ".");
|
---|
139 | Lookup.insert( std::make_pair(ptr, IndexSetContainer::ptr(new IndexSetContainer(returnsets))) );
|
---|
140 | }
|
---|
141 |
|
---|
142 | const size_t SubsetMap::getPowerSetIndex(const IndexSet_ptr &ptr, const IndexSet &subset) {
|
---|
143 | ASSERT( (ptr->size() < MAX_SETSIZE) && (subset.size() < MAX_SETSIZE),
|
---|
144 | "SubsetMap::getPowerSetIndex() - power sets of subsets must not be bigger than "
|
---|
145 | +toString((int)MAX_SETSIZE)+".");
|
---|
146 | ASSERT( ptr->contains(subset),
|
---|
147 | "SubsetMap::getPowerSetIndex() - "+(toString(*ptr))+" does not contain "
|
---|
148 | +toString(subset)+".");
|
---|
149 | std::bitset<MAX_SETSIZE> bits(0);
|
---|
150 | // go through each and search for indices present in both
|
---|
151 | IndexSet::iterator indexiter = ptr->begin();
|
---|
152 | IndexSet::iterator subindexiter = subset.begin();
|
---|
153 | for (; subindexiter != subset.end();) {
|
---|
154 | if (*indexiter == *subindexiter) {
|
---|
155 | // if matching, set bit and advance both iterators
|
---|
156 | bits.set( (size_t)std::distance(ptr->begin(), indexiter) );
|
---|
157 | ++indexiter;
|
---|
158 | ++subindexiter;
|
---|
159 | // if not, advance the iterator lacking behind
|
---|
160 | } else if ( *indexiter < *subindexiter) {
|
---|
161 | ++indexiter;
|
---|
162 | } else {
|
---|
163 | ++subindexiter;
|
---|
164 | }
|
---|
165 | }
|
---|
166 | return bits.to_ulong();
|
---|
167 | }
|
---|
168 |
|
---|
169 | IndexSet SubsetMap::getSubset(const IndexSet &_set, size_t PowerSetNo) {
|
---|
170 | ASSERT( _set.size() < MAX_SETSIZE,
|
---|
171 | "SubsetMap::getSubset() - power sets of subsets must not be bigger than "
|
---|
172 | +toString((int)MAX_SETSIZE)+".");
|
---|
173 | ASSERT((PowerSetNo >= 0) && (PowerSetNo < getNoPowerSets(_set.size())),
|
---|
174 | "SubsetMap::getSubset() - Power set index "+toString(PowerSetNo)+" is out of range.");
|
---|
175 | std::bitset<MAX_SETSIZE> bits(PowerSetNo);
|
---|
176 | // place index into container with random access
|
---|
177 | std::vector<IndexSet::value_type> indices(_set.begin(), _set.end());
|
---|
178 | IndexSet indexset;
|
---|
179 | // go through each bit and insert if 1, not if 0
|
---|
180 | for (size_t index=0; index < indices.size(); ++index)
|
---|
181 | if (bits[index])
|
---|
182 | indexset.insert(indices[index]);
|
---|
183 | return indexset;
|
---|
184 | }
|
---|
185 |
|
---|
186 | size_t SubsetMap::getMaximumSubsetLevel() const
|
---|
187 | {
|
---|
188 | // last one is super set, hence, the one before has largest subset size
|
---|
189 | Lookup_t::const_iterator iter = --Lookup.end();
|
---|
190 | --iter;
|
---|
191 | return iter->first->size();
|
---|
192 | }
|
---|
193 |
|
---|
194 | size_t SubsetMap::getMaximumSetLevel() const
|
---|
195 | {
|
---|
196 | // last one is super set
|
---|
197 | Lookup_t::const_iterator iter = --Lookup.end();
|
---|
198 | return iter->first->size();
|
---|
199 | }
|
---|