SoPlex Doxygen Documentation
datahashtable.h
Go to the documentation of this file.
1 /* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
2 /* */
3 /* This file is part of the class library */
4 /* SoPlex --- the Sequential object-oriented simPlex. */
5 /* */
6 /* Copyright (C) 1996-2012 Konrad-Zuse-Zentrum */
7 /* fuer Informationstechnik Berlin */
8 /* */
9 /* SoPlex is distributed under the terms of the ZIB Academic Licence. */
10 /* */
11 /* You should have received a copy of the ZIB Academic License */
12 /* along with SoPlex; see the file COPYING. If not email to soplex@zib.de. */
13 /* */
14 /* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
15 
16 /**@file datahashtable.h
17  * @brief Generic hash table for data objects.
18  */
19 #ifndef _DATAHASHTABLE_H_
20 #define _DATAHASHTABLE_H_
21 
22 #include <iostream>
23 #include <assert.h>
24 
25 #include "spxdefines.h"
26 
27 namespace soplex
28 {
29 /**@brief Generic hash table for data objects.
30  @ingroup Elementary
31 
32  Class DataHashTable provides a generic hash table for
33  \ref DataObjects "Data Objects",
34  i.e., a map that maps arguments called \a HashItems to values called \a Infos.
35  HashItem and Info types are passed as template arguments. HashItems
36  must provide a comparison operator==(). Furthermore, both the HashItem and
37  Info must be data objects in the sense that the assignment operator is
38  equivalent to a <tt>memcpy()</tt> of the structure and no destructor is
39  required.
40 
41  The construction of a DataHashTable requires a \em hash \em function that
42  assigns an integer value to every HashItem. Provided this, pairs of a
43  HashItem and a Info can be added to the DataHashTable. No more
44  than one Info can be assigned to the same HashItem at a time. The Info
45  to a HashItem can be accessed through the subscript operator[]() with
46  the Info object as a subscript.
47 
48  The maximum number of elemens a DataHashTable can hold can be
49  specified upon construction and may be reset with reMax() later on.
50  Further, a value hash size value is required. This value must be less then
51  the maximum number of elements and must not have a common dominator with
52  the maximum number of elements. If not specified explicitely, it
53  is set automatically to a reasonable value.
54 
55  The implementation relies on an array of DataHashTable::Element%s, from
56  now on referred to as elements. Upon construction, all elements are
57  marked as \c FREE. When an entry is added
58  to the DataHashTable, the hash value is computed by calling #m_hashfun
59  for its HashItem. If this array element is unused, it is
60  taken right away. Otherwise, the array index is incremented by
61  the hash size (modulo the element array size()) until an unused element
62  is found.
63 
64  Removing elements is simply done by marking it as \c RELEASED. Hence,
65  when searching for an element, the search loop may not stop, when a
66  \c RELEASED element is encountered. However, such an element may be
67  reused when adding a new element to the DataHashTable.
68 
69  Further, memory management with resizing of the element array is
70  straight forward.
71 */
72 template < class HashItem, class Info >
74 {
75 private:
76 
77  //-----------------------------------
78  /**@name Types */
79  //@{
80  /// template class for elements stored in the hash table
81  template < class ElemHashItem, class ElemInfo >
82  class Element
83  {
84  public:
85  ///
86  ElemHashItem item;
87  ///
88  ElemInfo info;
89  /// States of an element
90  enum states
91  {
92  FREE, ///< element has never been used
93  RELEASED, ///< element had been used, but released
94  USED ///< element is in use
95  } stat;
96  };
97  typedef Element< HashItem, Info > Elem;
98  //@}
99 
100  //-----------------------------------
101  /**@name Data */
102  //@{
103  /// stores all elements of the hash table
105  /// increment added to hash index, if allready used
107  /// current number of entries in the hash table
108  int m_used;
109  /// pointer to hash function (mapping: \a HashItem -> int)
110  int (*m_hashfun) (const HashItem*);
111  /// memory is \ref soplex::DataHashTable::reMax() "reMax()"ed by this factor if a new element does't fit
113  //@}
114 
115 public:
116 
117  //-----------------------------------
118  /**@name Access / modification */
119  //@{
120  /// Is item \p h present in DataHashTable?
121  bool has(const HashItem& h) const
122  {
123  return index(h) >= 0;
124  }
125 
126  /// returns const pointer to \a Info of \a HashItem \p h or 0,
127  /// if item is not found.
128  /** Returns a pointer to \a Info component of hash element \p h or a zero
129  * pointer if element \p h is not in the table.
130  */
131  const Info* get(const HashItem& h) const
132  {
133  int i = index(h);
134 
135  return (i >= 0) ? &m_elem[i].info : 0;
136  }
137  /// references \a Info of \a HashItem \p h.
138  /** Index operator for accessing the \a Info associated to
139  * \a HashItem \p h. It is required that \p h belongs to the
140  * DataHashTable, otherwise it core dumps. Methods has() or
141  * get() can be used for inquiring wheater \p h belongs to the
142  * DataHashTable or not.
143  */
144  const Info& operator[](const HashItem& h) const
145  {
146  assert(has(h));
147 
148  return m_elem[index(h)].info;
149  }
150  /// adds a new entry to the hash table.
151  /** Adds a new entry consisting of \a HashItem \p h and \a Info \p info to the
152  * DataHashTable. No entry with HashItem \p h must be in the
153  * DataHashTable yet. After completion, \p info may be accessed via get() or
154  * operator[]() with \p h as parameter. The DataHashTable is #reMax()%ed
155  * if it becomes neccessary.
156  */
157  void add(const HashItem& h, const Info& info)
158  {
159  assert(!has(h));
160 
161  if (m_used >= m_elem.size())
162  reMax(int(m_memfactor * m_used) + 1);
163 
164  assert(m_used < m_elem.size());
165 
166  int i;
167 
168  for(i = (*m_hashfun)(&h) % m_elem.size();
169  m_elem[i].stat == Elem::USED;
170  i = (i + m_hashsize) % m_elem.size())
171  ;
172 
173  assert(m_elem[i].stat != Elem::USED);
174 
175  m_elem[i].stat = Elem::USED;
176  m_elem[i].info = info;
177  m_elem[i].item = h;
178 
179  m_used++;
180 
181  assert(has(h));
182  }
183 
184  /// remove \a HashItem \p h from the DataHashTable.
185  void remove(const HashItem& h)
186  {
187  assert(has(h));
188  m_elem[index(h)].stat = Elem::RELEASED;
189  m_used--;
190  assert(!has(h));
191  }
192 
193  /// remove all entries from DataHashTable.
194  void clear()
195  {
196  for(int i = 0; i < m_elem.size(); i++)
197  m_elem[i].stat = Elem::FREE;
198  m_used = 0;
199  }
200  /// reset size of the DataHashTable.
201  /** Reset the maximum number of elements of a DataHashTable to \p newSize.
202  * However, if \p newSize < #m_used, it is resized to #m_used only.
203  * If \p newHashSize < 1, a new hash size is computed automatically.
204  * Otherwise, the specified value will be taken.
205  */
206  void reMax (int newSize = -1, int newHashSize = 0)
207  {
209 
210  m_elem.reSize(newSize < m_used ? m_used : newSize);
211 
212  clear();
213 
214  m_hashsize = (newHashSize < 1) ? autoHashSize() : newHashSize;
215 
216  for(int i = 0; i < save.size(); i++)
217  if (save[i].stat == Elem::USED)
218  add(save[i].item, save[i].info);
219  }
220  //@}
221 
222  //-----------------------------------
223  /**@name Debugging */
224  //@{
225  /// checks whether DataHashTable is consistent
226  bool isConsistent() const
227  {
228 #ifdef ENABLE_CONSISTENCY_CHECKS
229  int total = 0;
230 
231  for(int i = 0; i < m_elem.size(); i++)
232  {
233  if (m_elem[i].stat == Elem::USED)
234  {
235  total++;
236  if (!has(m_elem[i].item))
237  return MSGinconsistent("DataHashTable");
238  }
239  }
240  if (total != m_used)
241  return MSGinconsistent("DataHashTable");
242 
243  return m_elem.isConsistent();
244 #else
245  return true;
246 #endif
247  }
248  //@}
249 
250  //-----------------------------------
251  /**@name Construction / destruction */
252  //@{
253  /// default constructor.
254  /** Allocates a DataHashTable for \p maxsize entries using \p hashfun
255  * as hash function. If \p hashsize > 0, #m_hashsize is set to the
256  * specified value, otherwise a suitable hash size is computed
257  * automatically. Parameter \p factor is used for memory management:
258  * If more than \p maxsize entries are added to the DataHashTable, it
259  * will automatically be #reMax()%ed by a factor of \p factor.
260  *
261  * @param hashfun pointer to hash function.
262  * @param maxsize maximum number of hash elements.
263  * @param hashsize hash size.
264  * @param factor factor for increasing data block.
265  */
266  explicit DataHashTable(
267  int (*hashfun)(const HashItem*),
268  int maxsize = 256,
269  int hashsize = 0,
270  Real factor = 2.0)
271  : m_elem(maxsize)
272  , m_hashfun(hashfun)
273  , m_memfactor(factor)
274  {
275  clear();
276 
277  m_hashsize = (hashsize < 1) ? autoHashSize() : hashsize;
278 
279  assert(m_memfactor > 1.0);
280  assert(isConsistent());
281  }
282 
283  /// assignment operator.
285  {
286  m_elem = base.m_elem;
287  m_hashfun = base.m_hashfun;
288  m_memfactor = base.m_memfactor;
289  m_used = base.m_used;
290  m_hashsize = base.m_hashsize;
291 
292  assert(m_memfactor > 1.0);
293  assert(isConsistent());
294  return *this;
295  }
296 
297  /// copy constructor.
299  : m_elem(base.m_elem)
300  , m_hashfun(base.m_hashfun)
301  , m_memfactor(base.m_memfactor)
302  , m_used(base.m_used)
303  , m_hashsize(base.m_hashsize)
304  {
305  assert(m_memfactor > 1.0);
306  assert(isConsistent());
307  }
308  //@}
309 
310 private:
311 
312  //-----------------------------------
313  /**@name Helpers */
314  //@{
315  /// automatically computes a good \ref soplex::DataHashTable::m_hashsize "m_hashsize".
316  /** Computes a good #m_hashsize as the product of all prime numbers
317  * not divisors of the number of elements that are <=
318  * the maximum divisor of the number of elemens.
319  * @return good value for #m_hashsize
320  */
321  int autoHashSize() const
322  {
323  DataArray< bool > prime(m_elem.size());
324  int hashsize = 1;
325  int maxsize = m_elem.size();
326  int i;
327 
328  for (i = 2; i < maxsize; i++)
329  prime[i] = true;
330 
331  for (i = 2; i < maxsize; ++i)
332  {
333  if (prime[i])
334  {
335  for (int j = i; j < maxsize; j += i)
336  prime[j] = false;
337 
338  if (m_elem.size() % i != 0)
339  {
340  hashsize *= i;
341 
342  if (hashsize > maxsize)
343  {
344  hashsize /= i;
345  break;
346  }
347  }
348  }
349  }
350  return hashsize;
351  }
352 
353  /// returns hash index of \a HashItem \p h or -1, if \p h is not present.
354  /** Using the hash function #m_hashfun, the hash value of \p h
355  * is calculated.
356  * Starting with this hash index, every #m_hashsize%-th element is
357  * compared with \p h until \p h is found or all elements have been checked.
358  *
359  * @param h \a HashItem, for which the hash index should be calculated
360  * @return hash index of \p h or -1,
361  * if \p h is not a member of the hash table
362  */
363  int index(const HashItem& h) const
364  {
365  if (m_used == 0)
366  return -1;
367 
368  assert(m_elem.size() > 0);
369 
370  int i = (*m_hashfun)(&h) % m_elem.size();
371  int j = i;
372 
373  while(m_elem[i].stat != Elem::FREE)
374  {
375  if ( (m_elem[i].stat == Elem::USED)
376  && (m_elem[i].item == h))
377  return i;
378 
379  i = (i + m_hashsize) % m_elem.size();
380 
381  if (i == j)
382  break;
383  }
384  return -1;
385  }
386  //@}
387 
388 };
389 } // namespace soplex
390 #endif // _DATAHASHTABLE_H_
391 
392 //-----------------------------------------------------------------------------
393 //Emacs Local Variables:
394 //Emacs mode:c++
395 //Emacs c-basic-offset:3
396 //Emacs tab-width:8
397 //Emacs indent-tabs-mode:nil
398 //Emacs End:
399 //-----------------------------------------------------------------------------
400 
401 
402 
403 
404