Home | History | Annotate | Download | only in include
      1 
      2 /*--------------------------------------------------------------------*/
      3 /*--- OSet: a fast data structure with no dups.    pub_tool_oset.h ---*/
      4 /*--------------------------------------------------------------------*/
      5 
      6 /*
      7    This file is part of Valgrind, a dynamic binary instrumentation
      8    framework.
      9 
     10    Copyright (C) 2005-2013 Nicholas Nethercote
     11       njn (at) valgrind.org
     12 
     13    This program is free software; you can redistribute it and/or
     14    modify it under the terms of the GNU General Public License as
     15    published by the Free Software Foundation; either version 2 of the
     16    License, or (at your option) any later version.
     17 
     18    This program is distributed in the hope that it will be useful, but
     19    WITHOUT ANY WARRANTY; without even the implied warranty of
     20    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
     21    General Public License for more details.
     22 
     23    You should have received a copy of the GNU General Public License
     24    along with this program; if not, write to the Free Software
     25    Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
     26    02111-1307, USA.
     27 
     28    The GNU General Public License is contained in the file COPYING.
     29 */
     30 
     31 #ifndef __PUB_TOOL_OSET_H
     32 #define __PUB_TOOL_OSET_H
     33 
     34 #include "pub_tool_basics.h"   // Word
     35 
     36 // This module implements an ordered set, a data structure with fast
     37 // (eg. amortised log(n) or better) insertion, lookup and deletion of
     38 // elements.  It does not allow duplicates, and will assert if you insert a
     39 // duplicate to an OSet.
     40 //
     41 // It has two interfaces.
     42 //
     43 // - The "OSetWord_" interface provides an easier-to-use interface for the
     44 //   case where you just want to store UWord-sized values.  The user
     45 //   provides the allocation and deallocation functions, and possibly a
     46 //   comparison function.
     47 //
     48 // - The "OSetGen_" interface provides a totally generic interface, which
     49 //   allows any kind of structure to be put into the set.  The user provides
     50 //   the allocation and deallocation functions.  Also, each element has a
     51 //   key, which the lookup is done with.  The key may be the whole element
     52 //   (eg. in an OSet of integers, each integer serves both as an element and
     53 //   a key), or it may be only part of it (eg. if the key is a single field
     54 //   in a struct).  The user can provide a function that compares an element
     55 //   with a key;  this is very flexible, and with the right comparison
     56 //   function even a (non-overlapping) interval list can be created.  But
     57 //   the cost of calling a function for every comparison can be high during
     58 //   lookup.  If no comparison function is provided, we assume that keys are
     59 //   unsigned words, and that the key is the first word in each
     60 //   element.  This fast comparison is suitable for an OSet containing
     61 //   structs where the first element is an Addr, for example.
     62 //   Do not assume fast comparison works properly with signed words.
     63 //   A.o. iterating over the values will not return them in the correct
     64 //   order.
     65 //
     66 // Each OSet interface also has an iterator, which makes it simple to
     67 // traverse all the nodes in order.  Note that the iterator maintains state
     68 // and so is non-reentrant.
     69 //
     70 // Note that once you insert an element into an OSet, if you modify any part
     71 // of it looked at by your cmp() function, this may cause incorrect
     72 // behaviour as the sorted order maintained will be wrong.
     73 
     74 /*--------------------------------------------------------------------*/
     75 /*--- Types                                                        ---*/
     76 /*--------------------------------------------------------------------*/
     77 
     78 typedef struct _OSet     OSet;
     79 
     80 // - Cmp:   returns -1, 0 or 1 if key is <, == or > elem.
     81 // - Alloc: allocates a chunk of memory.
     82 // - Free:  frees a chunk of memory allocated with Alloc.
     83 
     84 typedef Word  (*OSetCmp_t)         ( const void* key, const void* elem );
     85 typedef void* (*OSetAlloc_t)       ( const HChar* cc, SizeT szB );
     86 typedef void  (*OSetFree_t)        ( void* p );
     87 
     88 /*--------------------------------------------------------------------*/
     89 /*--- Creating and destroying OSets (UWord)                        ---*/
     90 /*--------------------------------------------------------------------*/
     91 
     92 // * Create: allocates and initialises the OSet.  Never returns NULL.
     93 //   Parameters:
     94 //   - alloc_fn  The allocation function used internally for allocating the
     95 //               OSet and all its nodes. It must not return NULL (that is,
     96 //               if it returns it must have succeeded.)
     97 //   - cc        Cost centre string used by 'alloc'.
     98 //   - free_fn   The deallocation function used internally for freeing nodes
     99 //               called by VG_(OSetWord_Destroy)().
    100 //
    101 // * Destroy: frees all nodes in the table, plus the memory used by
    102 //   the table itself.  The passed-in function is called on each node first
    103 //   to allow the destruction of any attached resources;  if NULL it is not
    104 //   called.
    105 
    106 extern OSet* VG_(OSetWord_Create) ( OSetAlloc_t alloc_fn, const HChar* cc,
    107                                     OSetFree_t free_fn );
    108 extern void  VG_(OSetWord_Destroy) ( OSet* os );
    109 
    110 /*--------------------------------------------------------------------*/
    111 /*--- Operations on OSets (UWord)                                  ---*/
    112 /*--------------------------------------------------------------------*/
    113 
    114 // In everything that follows, the parameter 'key' is always the *address*
    115 // of the key, and 'elem' is *address* of the elem, as are the return values
    116 // of the functions that return elems.
    117 //
    118 // * Size: The number of elements in the set.
    119 //
    120 // * Contains: Determines if the value is in the set.
    121 //
    122 // * Insert: Inserts a new element into the set.  Duplicates are forbidden,
    123 //   and will cause assertion failures.
    124 //
    125 // * Remove: Removes the value from the set, if present.  Returns a Bool
    126 //   indicating if the value was removed.
    127 //
    128 // * ResetIter: Each OSet has an iterator.  This resets it to point to the
    129 //   first element in the OSet.
    130 //
    131 // * Next: Copies the next value according to the OSet's iterator into &val,
    132 //   advances the iterator by one, and returns True;  the elements are
    133 //   visited in increasing order of unsigned words (UWord).  Or, returns
    134 //   False if the iterator has reached the set's end.
    135 //
    136 //   You can thus iterate in order through a set like this:
    137 //
    138 //     Word val;
    139 //     VG_(OSetWord_ResetIter)(oset);
    140 //     while ( VG_(OSetWord_Next)(oset, &val) ) {
    141 //        ... do stuff with 'val' ...
    142 //     }
    143 //
    144 //   Note that iterators are cleared any time an element is inserted or
    145 //   removed from the OSet, to avoid possible mayhem caused by the iterator
    146 //   getting out of sync with the OSet's contents.  "Cleared" means that
    147 //   they will return False if VG_(OSetWord_Next)() is called without an
    148 //   intervening call to VG_(OSetWord_ResetIter)().
    149 
    150 extern Word  VG_(OSetWord_Size)         ( const OSet* os );
    151 extern void  VG_(OSetWord_Insert)       ( OSet* os, UWord val );
    152 extern Bool  VG_(OSetWord_Contains)     ( const OSet* os, UWord val );
    153 extern Bool  VG_(OSetWord_Remove)       ( OSet* os, UWord val );
    154 extern void  VG_(OSetWord_ResetIter)    ( OSet* os );
    155 extern Bool  VG_(OSetWord_Next)         ( OSet* os, /*OUT*/UWord* val );
    156 
    157 
    158 /*--------------------------------------------------------------------*/
    159 /*--- Creating and destroying OSets and OSet members (Gen)         ---*/
    160 /*--------------------------------------------------------------------*/
    161 
    162 // * Create: allocates and initialises the OSet. Never returns NULL.
    163 //   Parameters:
    164 //   - keyOff    The offset of the key within the element.
    165 //   - cmp       The comparison function between keys and elements, or NULL
    166 //               if the OSet should use fast comparisons.
    167 //   - alloc_fn  The allocation function used for allocating the OSet itself;
    168 //               It must not return NULL (that is, if it returns it must
    169 //               have succeeded.)
    170 //               If a pool allocator is used, it's called to allocate pool of
    171 //               nodes.
    172 //               If no pool allocator is used, it's called for each
    173 //               invocation of VG_(OSetGen_AllocNode)().
    174 //   - cc        Cost centre string used by 'alloc'.
    175 //   - free_fn   If no pool allocator is used, this is the deallocation
    176 //               function used by VG_(OSetGen_FreeNode)() and
    177 //               VG_(OSetGen_Destroy)().
    178 //               If a pool allocator is used, the memory used by the nodes is
    179 //               deallocated when the pool is deleted.
    180 //   (for more details about pool allocators, see pub_tool_poolalloc.h).
    181 //
    182 //
    183 //   If cmp is NULL, keyOff must be zero.  This is checked.
    184 //
    185 // * Destroy: frees all nodes in the table, plus the memory used by
    186 //   the table itself.  The passed-in function is called on each node first
    187 //   to allow the destruction of any attached resources;  if NULL it is not
    188 //   called.
    189 //
    190 // * AllocNode: Allocate and zero memory for a node to go into the OSet.
    191 //   If a pool allocator is used, it uses the pool allocator to allocate a node.
    192 //   Otherwise, uses the alloc function given to VG_(OSetGen_Create)() to
    193 //   allocate a node which is big enough for both an element and the OSet
    194 //   metadata.
    195 //   Not all elements in one OSet have to be the same size.
    196 //   However, if a pool allocator is used, elements will all have a size equal
    197 //   to the max user data size given at creation + the node meta data size.
    198 //
    199 //   Note that the element allocated will be at most word-aligned, which may
    200 //   be less aligned than the element type would normally be.
    201 //
    202 // * FreeNode: Deallocate a node allocated with OSetGen_AllocNode().  Using
    203 //   a deallocation function (such as VG_(free)()) directly will likely
    204 //   lead to assertions in Valgrind's allocator.
    205 
    206 extern OSet* VG_(OSetGen_Create)    ( PtrdiffT keyOff, OSetCmp_t cmp,
    207                                       OSetAlloc_t alloc_fn, const HChar* cc,
    208                                       OSetFree_t free_fn);
    209 
    210 
    211 extern OSet* VG_(OSetGen_Create_With_Pool)    ( PtrdiffT keyOff, OSetCmp_t cmp,
    212                                                 OSetAlloc_t alloc_fn,
    213                                                 const HChar* cc,
    214                                                 OSetFree_t free_fn,
    215                                                 SizeT poolSize,
    216                                                 SizeT maxEltSize);
    217 // Same as VG_(OSetGen_Create) but created OSet will use a pool allocator to
    218 // allocate the nodes.
    219 // The node size is the sum of a fixed small meta data size needed for OSet
    220 // + the size of the user data element.
    221 // The maximum size for the user data element is specified by maxEltSize.
    222 // (if poolSize is 0, maxEltSize is not relevant for the OSet).
    223 // It is interesting to use a pool allocator when an OSet has many elements,
    224 // and these elements have a small fixed size, or have a variable size, but
    225 // always <= than a (small) maximum value.
    226 // In such a case, allocating the nodes in pools reduces significantly
    227 // the memory overhead needed by each node.
    228 // When a node is freed (i.e. OSetGen_Freenode is called), the node is
    229 // put back in the pool allocator free list (for sub-sequent re-use by
    230 // OSetGen_AllocNode). Note that the pool memory is only released when
    231 // the pool is destroyed : calls to VG_(OSetGen_Free) do not cause
    232 // any calls to OSetFree_t _free function.
    233 // If there are several OSet managing similar such elements, it might be
    234 // interesting to use a shared pool for these OSet.
    235 // To have multiple OSets sharing a pool allocator, create the first OSet
    236 // with VG_(OSetGen_Create_With_Pool). Create subsequent OSet with
    237 // VG_(OSetGen_EmptyClone).
    238 
    239 extern void  VG_(OSetGen_Destroy)   ( OSet* os );
    240 extern void* VG_(OSetGen_AllocNode) ( const OSet* os, SizeT elemSize );
    241 extern void  VG_(OSetGen_FreeNode)  ( const OSet* os, void* elem );
    242 
    243 extern OSet* VG_(OSetGen_EmptyClone) (const OSet* os);
    244 // Creates a new empty OSet.
    245 // The new OSet will have the same characteristics as os.
    246 // If os uses a pool allocator, this pool allocator will be shared with
    247 // the new OSet. A shared pool allocator is only deleted (and its memory is
    248 // released) when the last OSet using the shared pool is destroyed.
    249 
    250 /*-------------------------------------------------------------------*/
    251 /*--- Operations on OSets (Gen)                                    ---*/
    252 /*--------------------------------------------------------------------*/
    253 
    254 // In everything that follows, the parameter 'key' is always the *address*
    255 // of the key, and 'elem' is *address* of the elem, as are the return values
    256 // of the functions that return elems.
    257 //
    258 // * Size: The number of elements in the set.
    259 //
    260 // * Insert: Inserts a new element into the set.  Note that 'elem' must
    261 //   have been allocated using VG_(OSetGen_AllocNode)(), otherwise you will
    262 //   get assertion failures about "bad magic".  Duplicates are forbidden,
    263 //   and will also cause assertion failures.
    264 //
    265 // * Contains: Determines if any element in the OSet matches the key.
    266 //
    267 // * Lookup: Returns a pointer to the element matching the key, if there is
    268 //   one, otherwise returns NULL.
    269 //
    270 // * LookupWithCmp: Like Lookup, but you specify the comparison function,
    271 //   which overrides the OSet's normal one.
    272 //
    273 // * Remove: Removes the element matching the key, if there is one.  Returns
    274 //   NULL if no element matches the key.
    275 //
    276 // * ResetIter: Each OSet has an iterator.  This resets it to point to the
    277 //   first element in the OSet.
    278 //
    279 // * ResetIterAt: Like ResetIter, but instead of resetting the iterator to the
    280 //   smallest element, it resets the iterator to point to the smallest element
    281 //   in the set whose key is greater-than-or-equal to the given key.  (In many
    282 //   cases this will be the element whose key equals that of the given key.)
    283 //
    284 // * Next: Returns a pointer to the element pointed to by the OSet's
    285 //   iterator, and advances the iterator by one;  the elements are visited
    286 //   in order.  Or, returns NULL if the iterator has reached the OSet's end.
    287 //
    288 //   You can thus iterate in order through a set like this:
    289 //
    290 //     VG_(OSetGen_ResetIter)(oset);
    291 //     while ( (elem = VG_(OSetGen_Next)(oset)) ) {
    292 //        ... do stuff with 'elem' ...
    293 //     }
    294 //
    295 //   Note that iterators are cleared any time an element is inserted or
    296 //   removed from the OSet, to avoid possible mayhem caused by the iterator
    297 //   getting out of sync with the OSet's contents.  "Cleared" means that
    298 //   they will return NULL if VG_(OSetGen_Next)() is called without an
    299 //   intervening call to VG_(OSetGen_ResetIter)().
    300 
    301 extern Word  VG_(OSetGen_Size)         ( const OSet* os );
    302 extern void  VG_(OSetGen_Insert)       ( OSet* os, void* elem );
    303 extern Bool  VG_(OSetGen_Contains)     ( const OSet* os, const void* key );
    304 extern void* VG_(OSetGen_Lookup)       ( const OSet* os, const void* key );
    305 extern void* VG_(OSetGen_LookupWithCmp)( OSet* os,
    306                                          const void* key, OSetCmp_t cmp );
    307 extern void* VG_(OSetGen_Remove)       ( OSet* os, const void* key );
    308 extern void  VG_(OSetGen_ResetIter)    ( OSet* os );
    309 extern void  VG_(OSetGen_ResetIterAt)  ( OSet* os, const void* key );
    310 extern void* VG_(OSetGen_Next)         ( OSet* os );
    311 
    312 
    313 #endif   // __PUB_TOOL_OSET_H
    314 
    315 /*--------------------------------------------------------------------*/
    316 /*--- end                                                          ---*/
    317 /*--------------------------------------------------------------------*/
    318