helgrind/hg_wordset.c - platform/external/valgrind - Gitiles


 /*--------------------------------------------------------------------*/
 /*--- Sets of words, with unique set identifiers.                  ---*/
 /*---                                                 hg_wordset.c ---*/
 /*--------------------------------------------------------------------*/

 /*
    This file is part of Helgrind, a Valgrind tool for detecting errors
    in threaded programs.

    Copyright (C) 2007-2008 OpenWorks LLP
        info@open-works.co.uk

    This program is free software; you can redistribute it and/or
    modify it under the terms of the GNU General Public License as
    published by the Free Software Foundation; either version 2 of the
    License, or (at your option) any later version.

    This program is distributed in the hope that it will be useful, but
    WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
    General Public License for more details.

    You should have received a copy of the GNU General Public License
    along with this program; if not, write to the Free Software
    Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
    02111-1307, USA.

    The GNU General Public License is contained in the file COPYING.

    Neither the names of the U.S. Department of Energy nor the
    University of California nor the names of its contributors may be
    used to endorse or promote products derived from this software
    without prior written permission.
 */

 #include "pub_tool_basics.h"
 #include "pub_tool_libcassert.h"
 #include "pub_tool_libcbase.h"
 #include "pub_tool_libcprint.h"
 #include "pub_tool_threadstate.h"
 #include "pub_tool_wordfm.h"

 #include "hg_basics.h"
 #include "hg_wordset.h"     /* self */

 //------------------------------------------------------------------//
 //--- Word Cache                                                 ---//
 //------------------------------------------------------------------//

 typedef
    struct { UWord arg1; UWord arg2; UWord res; }
    WCacheEnt;

 /* Each cache is a fixed sized array of N_WCACHE_STAT_MAX entries.
    However only the first .dynMax are used.  This is because at some
    point, expanding the cache further overall gives a slowdown because
    searching more entries more than negates any performance advantage
    from caching those entries in the first place.  Hence use .dynMax
    to allow the size of the cache(s) to be set differently for each
    different WordSetU. */
 #define N_WCACHE_STAT_MAX 32
 typedef
    struct {
       WCacheEnt ent[N_WCACHE_STAT_MAX];
       UWord     dynMax; /* 1 .. N_WCACHE_STAT_MAX inclusive */
       UWord     inUse;  /* 0 .. dynMax inclusive */
    }
    WCache;

 #define WCache_INIT(_zzcache,_zzdynmax)                              \
    do {                                                              \
       tl_assert((_zzdynmax) >= 1);                                   \
       tl_assert((_zzdynmax) <= N_WCACHE_STAT_MAX);                   \
       (_zzcache).dynMax = (_zzdynmax);                               \
       (_zzcache).inUse = 0;                                          \
    } while (0)

 #define WCache_LOOKUP_AND_RETURN(_retty,_zzcache,_zzarg1,_zzarg2)    \
    do {                                                              \
       UWord   _i;                                                    \
       UWord   _arg1  = (UWord)(_zzarg1);                             \
       UWord   _arg2  = (UWord)(_zzarg2);                             \
       WCache* _cache = &(_zzcache);                                  \
       tl_assert(_cache->dynMax >= 1);                                \
       tl_assert(_cache->dynMax <= N_WCACHE_STAT_MAX);                \
       tl_assert(_cache->inUse >= 0);                                 \
       tl_assert(_cache->inUse <= _cache->dynMax);                    \
       if (_cache->inUse > 0) {                                       \
          if (_cache->ent[0].arg1 == _arg1                            \
              && _cache->ent[0].arg2 == _arg2)                        \
             return (_retty)_cache->ent[0].res;                       \
          for (_i = 1; _i < _cache->inUse; _i++) {                    \
             if (_cache->ent[_i].arg1 == _arg1                        \
                 && _cache->ent[_i].arg2 == _arg2) {                  \
                WCacheEnt tmp     = _cache->ent[_i-1];                \
                _cache->ent[_i-1] = _cache->ent[_i];                  \
                _cache->ent[_i]   = tmp;                              \
                return (_retty)_cache->ent[_i-1].res;                 \
             }                                                        \
          }                                                           \
       }                                                              \
    } while (0)

 #define WCache_UPDATE(_zzcache,_zzarg1,_zzarg2,_zzresult)            \
    do {                                                              \
       Word    _i;                                                    \
       UWord   _arg1  = (UWord)(_zzarg1);                             \
       UWord   _arg2  = (UWord)(_zzarg2);                             \
       UWord   _res   = (UWord)(_zzresult);                           \
       WCache* _cache = &(_zzcache);                                  \
       tl_assert(_cache->dynMax >= 1);                                \
       tl_assert(_cache->dynMax <= N_WCACHE_STAT_MAX);                \
       tl_assert(_cache->inUse >= 0);                                 \
       tl_assert(_cache->inUse <= _cache->dynMax);                    \
       if (_cache->inUse < _cache->dynMax)                            \
          _cache->inUse++;                                            \
       for (_i = _cache->inUse-1; _i >= 1; _i--)                      \
          _cache->ent[_i] = _cache->ent[_i-1];                        \
       _cache->ent[0].arg1 = _arg1;                                   \
       _cache->ent[0].arg2 = _arg2;                                   \
       _cache->ent[0].res  = _res;                                    \
    } while (0)


 //------------------------------------------------------------------//
 //---                          WordSet                           ---//
 //---                       Implementation                       ---//
 //------------------------------------------------------------------//

 typedef
    struct {
       WordSetU* owner; /* for sanity checking */
       UWord*    words;
       UWord     size; /* Really this should be SizeT */
    }
    WordVec;

 /* ix2vec[0 .. ix2vec_used-1] are pointers to the lock sets (WordVecs)
    really.  vec2ix is the inverse mapping, mapping WordVec* to the
    corresponding ix2vec entry number.  The two mappings are mutually
    redundant. */
 struct _WordSetU {
       void*     (*alloc)(HChar*,SizeT);
       HChar*    cc;
       void      (*dealloc)(void*);
       WordFM*   vec2ix; /* WordVec-to-WordSet mapping tree */
       WordVec** ix2vec; /* WordSet-to-WordVec mapping array */
       UWord     ix2vec_size;
       UWord     ix2vec_used;
       WordSet   empty; /* cached, for speed */
       /* Caches for some operations */
       WCache    cache_addTo;
       WCache    cache_delFrom;
       WCache    cache_intersect;
       WCache    cache_minus;
       /* Stats */
       UWord     n_add;
       UWord     n_add_uncached;
       UWord     n_del;
       UWord     n_del_uncached;
       UWord     n_union;
       UWord     n_intersect;
       UWord     n_intersect_uncached;
       UWord     n_minus;
       UWord     n_minus_uncached;
       UWord     n_elem;
       UWord     n_doubleton;
       UWord     n_isEmpty;
       UWord     n_isSingleton;
       UWord     n_anyElementOf;
       UWord     n_isSubsetOf;
    };

 /* Create a new WordVec of the given size. */

 static WordVec* new_WV_of_size ( WordSetU* wsu, UWord sz )
 {
    WordVec* wv;
    tl_assert(sz >= 0);
    wv = wsu->alloc( wsu->cc, sizeof(WordVec) );
    wv->owner = wsu;
    wv->words = NULL;
    wv->size = sz;
    if (sz > 0) {
      wv->words = wsu->alloc( wsu->cc, (SizeT)sz * sizeof(UWord) );
    }
    return wv;
 }

 static void delete_WV ( WordVec* wv )
 {
    void (*dealloc)(void*) = wv->owner->dealloc;
    if (wv->words) {
       dealloc(wv->words);
    }
    dealloc(wv);
 }
 static void delete_WV_for_FM ( UWord wv ) {
    delete_WV( (WordVec*)wv );
 }

 static Word cmp_WordVecs_for_FM ( UWord wv1W, UWord wv2W )
 {
    UWord    i;
    WordVec* wv1    = (WordVec*)wv1W;
    WordVec* wv2    = (WordVec*)wv2W;
    UWord    common = wv1->size < wv2->size ? wv1->size : wv2->size;
    for (i = 0; i < common; i++) {
       if (wv1->words[i] == wv2->words[i])
          continue;
       if (wv1->words[i] < wv2->words[i])
          return -1;
       if (wv1->words[i] > wv2->words[i])
          return 1;
       tl_assert(0);
    }
    /* Ok, the common sections are identical.  So now consider the
       tails.  Both sets are considered to finish in an implied
       sequence of -infinity. */
    if (wv1->size < wv2->size) {
       tl_assert(common == wv1->size);
       return -1; /* impliedly, wv1 contains some -infinitys in places
                     where wv2 doesn't. */
    }
    if (wv1->size > wv2->size) {
       tl_assert(common == wv2->size);
       return 1;
    }
    tl_assert(common == wv1->size);
    return 0; /* identical */
 }

 static void ensure_ix2vec_space ( WordSetU* wsu )
 {
    UInt      i, new_sz;
    WordVec** new_vec;
    tl_assert(wsu->ix2vec_used <= wsu->ix2vec_size);
    if (wsu->ix2vec_used < wsu->ix2vec_size)
       return;
    new_sz = 2 * wsu->ix2vec_size;
    if (new_sz == 0) new_sz = 2;
    new_vec = wsu->alloc( wsu->cc, new_sz * sizeof(WordVec*) );
    tl_assert(new_vec);
    for (i = 0; i < wsu->ix2vec_size; i++)
       new_vec[i] = wsu->ix2vec[i];
    if (wsu->ix2vec)
       wsu->dealloc(wsu->ix2vec);
    wsu->ix2vec = new_vec;
    wsu->ix2vec_size = new_sz;
 }

 /* Index into a WordSetU, doing the obvious range check.  Failure of
    the assertions marked XXX and YYY is an indication of passing the
    wrong WordSetU* in the public API of this module. */
 static WordVec* do_ix2vec ( WordSetU* wsu, WordSet ws )
 {
    WordVec* wv;
    tl_assert(wsu->ix2vec_used <= wsu->ix2vec_size);
    if (wsu->ix2vec_used > 0)
       tl_assert(wsu->ix2vec);
    /* If this assertion fails, it may mean you supplied a 'ws'
       that does not come from the 'wsu' universe. */
    tl_assert(ws < wsu->ix2vec_used); /* XXX */
    wv = wsu->ix2vec[ws];
    /* Make absolutely sure that 'ws' is a member of 'wsu'. */
    tl_assert(wv);
    tl_assert(wv->owner == wsu); /* YYY */
    return wv;
 }

 /* See if wv is contained within wsu.  If so, deallocate wv and return
    the index of the already-present copy.  If not, add wv to both the
    vec2ix and ix2vec mappings and return its index.
 */
 static WordSet add_or_dealloc_WordVec( WordSetU* wsu, WordVec* wv_new )
 {
    Bool     have;
    WordVec* wv_old;
    UWord/*Set*/ ix_old = -1;
    /* Really WordSet, but need something that can safely be casted to
       a Word* in the lookupFM.  Making it WordSet (which is 32 bits)
       causes failures on a 64-bit platform. */
    tl_assert(wv_new->owner == wsu);
    have = VG_(lookupFM)( wsu->vec2ix,
                          (Word*)&wv_old, (Word*)&ix_old,
                          (Word)wv_new );
    if (have) {
       tl_assert(wv_old != wv_new);
       tl_assert(wv_old);
       tl_assert(wv_old->owner == wsu);
       tl_assert(ix_old < wsu->ix2vec_used);
       tl_assert(wsu->ix2vec[ix_old] == wv_old);
       delete_WV( wv_new );
       return (WordSet)ix_old;
    } else {
       ensure_ix2vec_space( wsu );
       tl_assert(wsu->ix2vec);
       tl_assert(wsu->ix2vec_used < wsu->ix2vec_size);
       wsu->ix2vec[wsu->ix2vec_used] = wv_new;
       VG_(addToFM)( wsu->vec2ix, (Word)wv_new, (Word)wsu->ix2vec_used );
       if (0) VG_(printf)("aodW %d\n", (Int)wsu->ix2vec_used );
       wsu->ix2vec_used++;
       tl_assert(wsu->ix2vec_used <= wsu->ix2vec_size);
       return (WordSet)(wsu->ix2vec_used - 1);
    }
 }


 WordSetU* HG_(newWordSetU) ( void* (*alloc_nofail)( HChar*, SizeT ),
                              HChar* cc,
                              void  (*dealloc)(void*),
                              Word  cacheSize )
 {
    WordSetU* wsu;
    WordVec*  empty;

    wsu          = alloc_nofail( cc, sizeof(WordSetU) );
    VG_(memset)( wsu, 0, sizeof(WordSetU) );
    wsu->alloc   = alloc_nofail;
    wsu->cc      = cc;
    wsu->dealloc = dealloc;
    wsu->vec2ix  = VG_(newFM)( alloc_nofail, cc,
                               dealloc, cmp_WordVecs_for_FM );
    wsu->ix2vec_used = 0;
    wsu->ix2vec_size = 0;
    wsu->ix2vec      = NULL;
    WCache_INIT(wsu->cache_addTo,     cacheSize);
    WCache_INIT(wsu->cache_delFrom,   cacheSize);
    WCache_INIT(wsu->cache_intersect, cacheSize);
    WCache_INIT(wsu->cache_minus,     cacheSize);
    empty = new_WV_of_size( wsu, 0 );
    wsu->empty = add_or_dealloc_WordVec( wsu, empty );

    return wsu;
 }

 void HG_(deleteWordSetU) ( WordSetU* wsu )
 {
    void (*dealloc)(void*) = wsu->dealloc;
    tl_assert(wsu->vec2ix);
    VG_(deleteFM)( wsu->vec2ix, delete_WV_for_FM, NULL/*val-finalizer*/ );
    if (wsu->ix2vec)
       dealloc(wsu->ix2vec);
    dealloc(wsu);
 }

 WordSet HG_(emptyWS) ( WordSetU* wsu )
 {
    return wsu->empty;
 }

 Bool HG_(isEmptyWS) ( WordSetU* wsu, WordSet ws )
 {
    WordVec* wv = do_ix2vec( wsu, ws );
    wsu->n_isEmpty++;
    if (wv->size == 0) {
       tl_assert(ws == wsu->empty);
       return True;
    } else {
       tl_assert(ws != wsu->empty);
       return False;
    }
 }

 Bool HG_(isSingletonWS) ( WordSetU* wsu, WordSet ws, UWord w )
 {
    WordVec* wv;
    tl_assert(wsu);
    wsu->n_isSingleton++;
    wv = do_ix2vec( wsu, ws );
    return (Bool)(wv->size == 1 && wv->words[0] == w);
 }

 UWord HG_(cardinalityWS) ( WordSetU* wsu, WordSet ws )
 {
    WordVec* wv;
    tl_assert(wsu);
    wv = do_ix2vec( wsu, ws );
    tl_assert(wv->size >= 0);
    return wv->size;
 }

 UWord HG_(anyElementOfWS) ( WordSetU* wsu, WordSet ws )
 {
    WordVec* wv;
    tl_assert(wsu);
    wsu->n_anyElementOf++;
    wv = do_ix2vec( wsu, ws );
    tl_assert(wv->size >= 1);
    return wv->words[0];
 }

 UWord HG_(cardinalityWSU) ( WordSetU* wsu )
 {
    tl_assert(wsu);
    return wsu->ix2vec_used;
 }

 void HG_(getPayloadWS) ( /*OUT*/UWord** words, /*OUT*/UWord* nWords,
                          WordSetU* wsu, WordSet ws )
 {
    WordVec* wv;
    tl_assert(wsu);
    wv = do_ix2vec( wsu, ws );
    tl_assert(wv->size >= 0);
    *nWords = wv->size;
    *words  = wv->words;
 }

 Bool HG_(plausibleWS) ( WordSetU* wsu, WordSet ws )
 {
    if (wsu == NULL) return False;
    if (ws < 0 || ws >= wsu->ix2vec_used)
       return False;
    return True;
 }

 Bool HG_(saneWS_SLOW) ( WordSetU* wsu, WordSet ws )
 {
    WordVec* wv;
    UWord    i;
    if (wsu == NULL) return False;
    if (ws < 0 || ws >= wsu->ix2vec_used)
       return False;
    wv = do_ix2vec( wsu, ws );
    /* can never happen .. do_ix2vec will assert instead.  Oh well. */
    if (wv->owner != wsu) return False;
    if (wv->size < 0) return False;
    if (wv->size > 0) {
       for (i = 0; i < wv->size-1; i++) {
          if (wv->words[i] >= wv->words[i+1])
             return False;
       }
    }
    return True;
 }

 Bool HG_(elemWS) ( WordSetU* wsu, WordSet ws, UWord w )
 {
    UWord    i;
    WordVec* wv = do_ix2vec( wsu, ws );
    wsu->n_elem++;
    for (i = 0; i < wv->size; i++) {
       if (wv->words[i] == w)
          return True;
    }
    return False;
 }

 WordSet HG_(doubletonWS) ( WordSetU* wsu, UWord w1, UWord w2 )
 {
    WordVec* wv;
    wsu->n_doubleton++;
    if (w1 == w2) {
       wv = new_WV_of_size(wsu, 1);
       wv->words[0] = w1;
    }
    else if (w1 < w2) {
       wv = new_WV_of_size(wsu, 2);
       wv->words[0] = w1;
       wv->words[1] = w2;
    }
    else {
       tl_assert(w1 > w2);
       wv = new_WV_of_size(wsu, 2);
       wv->words[0] = w2;
       wv->words[1] = w1;
    }
    return add_or_dealloc_WordVec( wsu, wv );
 }

 WordSet HG_(singletonWS) ( WordSetU* wsu, UWord w )
 {
    return HG_(doubletonWS)( wsu, w, w );
 }

 WordSet HG_(isSubsetOf) ( WordSetU* wsu, WordSet small, WordSet big )
 {
    wsu->n_isSubsetOf++;
    return small == HG_(intersectWS)( wsu, small, big );
 }

 void HG_(ppWS) ( WordSetU* wsu, WordSet ws )
 {
    UWord    i;
    WordVec* wv;
    tl_assert(wsu);
    wv = do_ix2vec( wsu, ws );
    VG_(printf)("{");
    for (i = 0; i < wv->size; i++) {
       VG_(printf)("%p", (void*)wv->words[i]);
       if (i < wv->size-1)
          VG_(printf)(",");
    }
    VG_(printf)("}");
 }

 void HG_(ppWSUstats) ( WordSetU* wsu, HChar* name )
 {
    VG_(printf)("   WordSet \"%s\":\n", name);
    VG_(printf)("      addTo        %10lu (%lu uncached)\n",
                wsu->n_add, wsu->n_add_uncached);
    VG_(printf)("      delFrom      %10lu (%lu uncached)\n",
                wsu->n_del, wsu->n_del_uncached);
    VG_(printf)("      union        %10lu\n", wsu->n_union);
    VG_(printf)("      intersect    %10lu (%lu uncached) "
                "[nb. incl isSubsetOf]\n",
                wsu->n_intersect, wsu->n_intersect_uncached);
    VG_(printf)("      minus        %10lu (%lu uncached)\n",
                wsu->n_minus, wsu->n_minus_uncached);
    VG_(printf)("      elem         %10lu\n",   wsu->n_elem);
    VG_(printf)("      doubleton    %10lu\n",   wsu->n_doubleton);
    VG_(printf)("      isEmpty      %10lu\n",   wsu->n_isEmpty);
    VG_(printf)("      isSingleton  %10lu\n",   wsu->n_isSingleton);
    VG_(printf)("      anyElementOf %10lu\n",   wsu->n_anyElementOf);
    VG_(printf)("      isSubsetOf   %10lu\n",   wsu->n_isSubsetOf);
 }

 WordSet HG_(addToWS) ( WordSetU* wsu, WordSet ws, UWord w )
 {
    UWord    k, j;
    WordVec* wv_new;
    WordVec* wv;
    WordSet  result = (WordSet)(-1); /* bogus */

    wsu->n_add++;
    WCache_LOOKUP_AND_RETURN(WordSet, wsu->cache_addTo, ws, w);
    wsu->n_add_uncached++;

    /* If already present, this is a no-op. */
    wv = do_ix2vec( wsu, ws );
    for (k = 0; k < wv->size; k++) {
       if (wv->words[k] == w) {
          result = ws;
          goto out;
       }
    }
    /* Ok, not present.  Build a new one ... */
    wv_new = new_WV_of_size( wsu, wv->size + 1 );
    k = j = 0;
    for (; k < wv->size && wv->words[k] < w; k++) {
       wv_new->words[j++] = wv->words[k];
    }
    wv_new->words[j++] = w;
    for (; k < wv->size; k++) {
       tl_assert(wv->words[k] > w);
       wv_new->words[j++] = wv->words[k];
    }
    tl_assert(j == wv_new->size);

    /* Find any existing copy, or add the new one. */
    result = add_or_dealloc_WordVec( wsu, wv_new );
    tl_assert(result != (WordSet)(-1));

   out:
    WCache_UPDATE(wsu->cache_addTo, ws, w, result);
    return result;
 }

 WordSet HG_(delFromWS) ( WordSetU* wsu, WordSet ws, UWord w )
 {
    UWord    i, j, k;
    WordVec* wv_new;
    WordSet  result = (WordSet)(-1); /* bogus */
    WordVec* wv = do_ix2vec( wsu, ws );

    wsu->n_del++;

    /* special case empty set */
    if (wv->size == 0) {
       tl_assert(ws == wsu->empty);
       return ws;
    }

    WCache_LOOKUP_AND_RETURN(WordSet, wsu->cache_delFrom, ws, w);
    wsu->n_del_uncached++;

    /* If not already present, this is a no-op. */
    for (i = 0; i < wv->size; i++) {
       if (wv->words[i] == w)
          break;
    }
    if (i == wv->size) {
       result = ws;
       goto out;
    }
    /* So w is present in ws, and the new set will be one element
       smaller. */
    tl_assert(i >= 0 && i < wv->size);
    tl_assert(wv->size > 0);

    wv_new = new_WV_of_size( wsu, wv->size - 1 );
    j = k = 0;
    for (; j < wv->size; j++) {
       if (j == i)
          continue;
       wv_new->words[k++] = wv->words[j];
    }
    tl_assert(k == wv_new->size);

    result = add_or_dealloc_WordVec( wsu, wv_new );
    if (wv->size == 1) {
       tl_assert(result == wsu->empty);
    }

   out:
    WCache_UPDATE(wsu->cache_delFrom, ws, w, result);
    return result;
 }

 WordSet HG_(unionWS) ( WordSetU* wsu, WordSet ws1, WordSet ws2 )
 {
    UWord    i1, i2, k, sz;
    WordVec* wv_new;
    WordVec* wv1 = do_ix2vec( wsu, ws1 );
    WordVec* wv2 = do_ix2vec( wsu, ws2 );
    wsu->n_union++;
    sz = 0;
    i1 = i2 = 0;
    while (1) {
       if (i1 >= wv1->size || i2 >= wv2->size)
          break;
       sz++;
       if (wv1->words[i1] < wv2->words[i2]) {
          i1++;
       } else
       if (wv1->words[i1] > wv2->words[i2]) {
          i2++;
       } else {
          i1++;
          i2++;
       }
    }
    tl_assert(i1 <= wv1->size);
    tl_assert(i2 <= wv2->size);
    tl_assert(i1 == wv1->size || i2 == wv2->size);
    if (i1 == wv1->size && i2 < wv2->size) {
       sz += (wv2->size - i2);
    }
    if (i2 == wv2->size && i1 < wv1->size) {
       sz += (wv1->size - i1);
    }

    wv_new = new_WV_of_size( wsu, sz );
    k = 0;

    i1 = i2 = 0;
    while (1) {
       if (i1 >= wv1->size || i2 >= wv2->size)
          break;
       if (wv1->words[i1] < wv2->words[i2]) {
          wv_new->words[k++] = wv1->words[i1];
          i1++;
       } else
       if (wv1->words[i1] > wv2->words[i2]) {
          wv_new->words[k++] = wv2->words[i2];
          i2++;
       } else {
          wv_new->words[k++] = wv1->words[i1];
          i1++;
          i2++;
       }
    }
    tl_assert(i1 <= wv1->size);
    tl_assert(i2 <= wv2->size);
    tl_assert(i1 == wv1->size || i2 == wv2->size);
    if (i1 == wv1->size && i2 < wv2->size) {
       while (i2 < wv2->size)
          wv_new->words[k++] = wv2->words[i2++];
    }
    if (i2 == wv2->size && i1 < wv1->size) {
       while (i1 < wv1->size)
          wv_new->words[k++] = wv1->words[i1++];
    }

    tl_assert(k == sz);

    return add_or_dealloc_WordVec( wsu, wv_new );
 }

 WordSet HG_(intersectWS) ( WordSetU* wsu, WordSet ws1, WordSet ws2 )
 {
    UWord    i1, i2, k, sz;
    WordSet  ws_new = (WordSet)(-1); /* bogus */
    WordVec* wv_new;
    WordVec* wv1;
    WordVec* wv2;

    wsu->n_intersect++;

    /* Deal with an obvious case fast. */
    if (ws1 == ws2)
       return ws1;

    /* Since intersect(x,y) == intersect(y,x), convert both variants to
       the same query.  This reduces the number of variants the cache
       has to deal with. */
    if (ws1 > ws2) {
       WordSet wst = ws1; ws1 = ws2; ws2 = wst;
    }

    WCache_LOOKUP_AND_RETURN(WordSet, wsu->cache_intersect, ws1, ws2);
    wsu->n_intersect_uncached++;

    wv1 = do_ix2vec( wsu, ws1 );
    wv2 = do_ix2vec( wsu, ws2 );
    sz = 0;
    i1 = i2 = 0;
    while (1) {
       if (i1 >= wv1->size || i2 >= wv2->size)
          break;
       if (wv1->words[i1] < wv2->words[i2]) {
          i1++;
       } else
       if (wv1->words[i1] > wv2->words[i2]) {
          i2++;
       } else {
          sz++;
          i1++;
          i2++;
       }
    }
    tl_assert(i1 <= wv1->size);
    tl_assert(i2 <= wv2->size);
    tl_assert(i1 == wv1->size || i2 == wv2->size);

    wv_new = new_WV_of_size( wsu, sz );
    k = 0;

    i1 = i2 = 0;
    while (1) {
       if (i1 >= wv1->size || i2 >= wv2->size)
          break;
       if (wv1->words[i1] < wv2->words[i2]) {
          i1++;
       } else
       if (wv1->words[i1] > wv2->words[i2]) {
          i2++;
       } else {
          wv_new->words[k++] = wv1->words[i1];
          i1++;
          i2++;
       }
    }
    tl_assert(i1 <= wv1->size);
    tl_assert(i2 <= wv2->size);
    tl_assert(i1 == wv1->size || i2 == wv2->size);

    tl_assert(k == sz);

    ws_new = add_or_dealloc_WordVec( wsu, wv_new );
    if (sz == 0) {
       tl_assert(ws_new == wsu->empty);
    }

    tl_assert(ws_new != (WordSet)(-1));
    WCache_UPDATE(wsu->cache_intersect, ws1, ws2, ws_new);

    return ws_new;
 }

 WordSet HG_(minusWS) ( WordSetU* wsu, WordSet ws1, WordSet ws2 )
 {
    UWord    i1, i2, k, sz;
    WordSet  ws_new = (WordSet)(-1); /* bogus */
    WordVec* wv_new;
    WordVec* wv1;
    WordVec* wv2;

    wsu->n_minus++;
    WCache_LOOKUP_AND_RETURN(WordSet, wsu->cache_minus, ws1, ws2);
    wsu->n_minus_uncached++;

    wv1 = do_ix2vec( wsu, ws1 );
    wv2 = do_ix2vec( wsu, ws2 );
    sz = 0;
    i1 = i2 = 0;
    while (1) {
       if (i1 >= wv1->size || i2 >= wv2->size)
          break;
       if (wv1->words[i1] < wv2->words[i2]) {
          sz++;
          i1++;
       } else
       if (wv1->words[i1] > wv2->words[i2]) {
          i2++;
       } else {
          i1++;
          i2++;
       }
    }
    tl_assert(i1 <= wv1->size);
    tl_assert(i2 <= wv2->size);
    tl_assert(i1 == wv1->size || i2 == wv2->size);
    if (i2 == wv2->size && i1 < wv1->size) {
       sz += (wv1->size - i1);
    }

    wv_new = new_WV_of_size( wsu, sz );
    k = 0;

    i1 = i2 = 0;
    while (1) {
       if (i1 >= wv1->size || i2 >= wv2->size)
          break;
       if (wv1->words[i1] < wv2->words[i2]) {
          wv_new->words[k++] = wv1->words[i1];
          i1++;
       } else
       if (wv1->words[i1] > wv2->words[i2]) {
          i2++;
       } else {
          i1++;
          i2++;
       }
    }
    tl_assert(i1 <= wv1->size);
    tl_assert(i2 <= wv2->size);
    tl_assert(i1 == wv1->size || i2 == wv2->size);
    if (i2 == wv2->size && i1 < wv1->size) {
       while (i1 < wv1->size)
          wv_new->words[k++] = wv1->words[i1++];
    }

    tl_assert(k == sz);

    ws_new = add_or_dealloc_WordVec( wsu, wv_new );
    if (sz == 0) {
       tl_assert(ws_new == wsu->empty);
    }

    tl_assert(ws_new != (WordSet)(-1));
    WCache_UPDATE(wsu->cache_minus, ws1, ws2, ws_new);

    return ws_new;
 }

 static __attribute__((unused))
 void show_WS ( WordSetU* wsu, WordSet ws )
 {
    UWord i;
    WordVec* wv = do_ix2vec( wsu, ws );
    VG_(printf)("#%u{", ws);
    for (i = 0; i < wv->size; i++) {
       VG_(printf)("%lu", wv->words[i]);
       if (i < wv->size-1)
          VG_(printf)(",");
    }
    VG_(printf)("}\n");
 }

 //------------------------------------------------------------------//
 //---                        end WordSet                         ---//
 //---                       Implementation                       ---//
 //------------------------------------------------------------------//

 /*--------------------------------------------------------------------*/
 /*--- end                                             hg_wordset.c ---*/
 /*--------------------------------------------------------------------*/

	/--------------------------------------------------------------------/
	/--- Sets of words, with unique set identifiers. ---/
	/--- hg_wordset.c ---/
	/--------------------------------------------------------------------/

	/*
	This file is part of Helgrind, a Valgrind tool for detecting errors
	in threaded programs.

	Copyright (C) 2007-2008 OpenWorks LLP
	info@open-works.co.uk

	This program is free software; you can redistribute it and/or
	modify it under the terms of the GNU General Public License as
	published by the Free Software Foundation; either version 2 of the
	License, or (at your option) any later version.

	This program is distributed in the hope that it will be useful, but
	WITHOUT ANY WARRANTY; without even the implied warranty of
	MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
	General Public License for more details.

	You should have received a copy of the GNU General Public License
	along with this program; if not, write to the Free Software
	Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
	02111-1307, USA.

	The GNU General Public License is contained in the file COPYING.

	Neither the names of the U.S. Department of Energy nor the
	University of California nor the names of its contributors may be
	used to endorse or promote products derived from this software
	without prior written permission.
	*/

	#include "pub_tool_basics.h"
	#include "pub_tool_libcassert.h"
	#include "pub_tool_libcbase.h"
	#include "pub_tool_libcprint.h"
	#include "pub_tool_threadstate.h"
	#include "pub_tool_wordfm.h"

	#include "hg_basics.h"
	#include "hg_wordset.h" /* self */

	//------------------------------------------------------------------//
	//--- Word Cache ---//
	//------------------------------------------------------------------//

	typedef
	struct { UWord arg1; UWord arg2; UWord res; }
	WCacheEnt;

	/* Each cache is a fixed sized array of N_WCACHE_STAT_MAX entries.
	However only the first .dynMax are used. This is because at some
	point, expanding the cache further overall gives a slowdown because
	searching more entries more than negates any performance advantage
	from caching those entries in the first place. Hence use .dynMax
	to allow the size of the cache(s) to be set differently for each
	different WordSetU. */
	#define N_WCACHE_STAT_MAX 32
	typedef
	struct {
	WCacheEnt ent[N_WCACHE_STAT_MAX];
	UWord dynMax; /* 1 .. N_WCACHE_STAT_MAX inclusive */
	UWord inUse; /* 0 .. dynMax inclusive */
	}
	WCache;

	#define WCache_INIT(_zzcache,_zzdynmax) \
	do { \
	tl_assert((_zzdynmax) >= 1); \
	tl_assert((_zzdynmax) <= N_WCACHE_STAT_MAX); \
	(_zzcache).dynMax = (_zzdynmax); \
	(_zzcache).inUse = 0; \
	} while (0)

	#define WCache_LOOKUP_AND_RETURN(_retty,_zzcache,_zzarg1,_zzarg2) \
	do { \
	UWord _i; \
	UWord _arg1 = (UWord)(_zzarg1); \
	UWord _arg2 = (UWord)(_zzarg2); \
	WCache* _cache = &(_zzcache); \
	tl_assert(_cache->dynMax >= 1); \
	tl_assert(_cache->dynMax <= N_WCACHE_STAT_MAX); \
	tl_assert(_cache->inUse >= 0); \
	tl_assert(_cache->inUse <= _cache->dynMax); \
	if (_cache->inUse > 0) { \
	if (_cache->ent[0].arg1 == _arg1 \
	&& _cache->ent[0].arg2 == _arg2) \
	return (_retty)_cache->ent[0].res; \
	for (_i = 1; _i < _cache->inUse; _i++) { \
	if (_cache->ent[_i].arg1 == _arg1 \
	&& _cache->ent[_i].arg2 == _arg2) { \
	WCacheEnt tmp = _cache->ent[_i-1]; \
	_cache->ent[_i-1] = _cache->ent[_i]; \
	_cache->ent[_i] = tmp; \
	return (_retty)_cache->ent[_i-1].res; \
	} \
	} \
	} \
	} while (0)

	#define WCache_UPDATE(_zzcache,_zzarg1,_zzarg2,_zzresult) \
	do { \
	Word _i; \
	UWord _arg1 = (UWord)(_zzarg1); \
	UWord _arg2 = (UWord)(_zzarg2); \
	UWord _res = (UWord)(_zzresult); \
	WCache* _cache = &(_zzcache); \
	tl_assert(_cache->dynMax >= 1); \
	tl_assert(_cache->dynMax <= N_WCACHE_STAT_MAX); \
	tl_assert(_cache->inUse >= 0); \
	tl_assert(_cache->inUse <= _cache->dynMax); \
	if (_cache->inUse < _cache->dynMax) \
	_cache->inUse++; \
	for (_i = _cache->inUse-1; _i >= 1; _i--) \
	_cache->ent[_i] = _cache->ent[_i-1]; \
	_cache->ent[0].arg1 = _arg1; \
	_cache->ent[0].arg2 = _arg2; \
	_cache->ent[0].res = _res; \
	} while (0)


	//------------------------------------------------------------------//
	//--- WordSet ---//
	//--- Implementation ---//
	//------------------------------------------------------------------//

	typedef
	struct {
	WordSetU* owner; /* for sanity checking */
	UWord* words;
	UWord size; /* Really this should be SizeT */
	}
	WordVec;

	/* ix2vec[0 .. ix2vec_used-1] are pointers to the lock sets (WordVecs)
	really. vec2ix is the inverse mapping, mapping WordVec* to the
	corresponding ix2vec entry number. The two mappings are mutually
	redundant. */
	struct _WordSetU {
	void* (alloc)(HChar,SizeT);
	HChar* cc;
	void (dealloc)(void);
	WordFM* vec2ix; /* WordVec-to-WordSet mapping tree */
	WordVec** ix2vec; /* WordSet-to-WordVec mapping array */
	UWord ix2vec_size;
	UWord ix2vec_used;
	WordSet empty; /* cached, for speed */
	/* Caches for some operations */
	WCache cache_addTo;
	WCache cache_delFrom;
	WCache cache_intersect;
	WCache cache_minus;
	/* Stats */
	UWord n_add;
	UWord n_add_uncached;
	UWord n_del;
	UWord n_del_uncached;
	UWord n_union;
	UWord n_intersect;
	UWord n_intersect_uncached;
	UWord n_minus;
	UWord n_minus_uncached;
	UWord n_elem;
	UWord n_doubleton;
	UWord n_isEmpty;
	UWord n_isSingleton;
	UWord n_anyElementOf;
	UWord n_isSubsetOf;
	};

	/* Create a new WordVec of the given size. */

	static WordVec* new_WV_of_size ( WordSetU* wsu, UWord sz )
	{
	WordVec* wv;
	tl_assert(sz >= 0);
	wv = wsu->alloc( wsu->cc, sizeof(WordVec) );
	wv->owner = wsu;
	wv->words = NULL;
	wv->size = sz;
	if (sz > 0) {
	wv->words = wsu->alloc( wsu->cc, (SizeT)sz * sizeof(UWord) );
	}
	return wv;
	}

	static void delete_WV ( WordVec* wv )
	{
	void (dealloc)(void) = wv->owner->dealloc;
	if (wv->words) {
	dealloc(wv->words);
	}
	dealloc(wv);
	}
	static void delete_WV_for_FM ( UWord wv ) {
	delete_WV( (WordVec*)wv );
	}

	static Word cmp_WordVecs_for_FM ( UWord wv1W, UWord wv2W )
	{
	UWord i;
	WordVec* wv1 = (WordVec*)wv1W;
	WordVec* wv2 = (WordVec*)wv2W;
	UWord common = wv1->size < wv2->size ? wv1->size : wv2->size;
	for (i = 0; i < common; i++) {
	if (wv1->words[i] == wv2->words[i])
	continue;
	if (wv1->words[i] < wv2->words[i])
	return -1;
	if (wv1->words[i] > wv2->words[i])
	return 1;
	tl_assert(0);
	}
	/* Ok, the common sections are identical. So now consider the
	tails. Both sets are considered to finish in an implied
	sequence of -infinity. */
	if (wv1->size < wv2->size) {
	tl_assert(common == wv1->size);
	return -1; /* impliedly, wv1 contains some -infinitys in places
	where wv2 doesn't. */
	}
	if (wv1->size > wv2->size) {
	tl_assert(common == wv2->size);
	return 1;
	}
	tl_assert(common == wv1->size);
	return 0; /* identical */
	}

	static void ensure_ix2vec_space ( WordSetU* wsu )
	{
	UInt i, new_sz;
	WordVec** new_vec;
	tl_assert(wsu->ix2vec_used <= wsu->ix2vec_size);
	if (wsu->ix2vec_used < wsu->ix2vec_size)
	return;
	new_sz = 2 * wsu->ix2vec_size;
	if (new_sz == 0) new_sz = 2;
	new_vec = wsu->alloc( wsu->cc, new_sz * sizeof(WordVec*) );
	tl_assert(new_vec);
	for (i = 0; i < wsu->ix2vec_size; i++)
	new_vec[i] = wsu->ix2vec[i];
	if (wsu->ix2vec)
	wsu->dealloc(wsu->ix2vec);
	wsu->ix2vec = new_vec;
	wsu->ix2vec_size = new_sz;
	}

	/* Index into a WordSetU, doing the obvious range check. Failure of
	the assertions marked XXX and YYY is an indication of passing the
	wrong WordSetU* in the public API of this module. */
	static WordVec* do_ix2vec ( WordSetU* wsu, WordSet ws )
	{
	WordVec* wv;
	tl_assert(wsu->ix2vec_used <= wsu->ix2vec_size);
	if (wsu->ix2vec_used > 0)
	tl_assert(wsu->ix2vec);
	/* If this assertion fails, it may mean you supplied a 'ws'
	that does not come from the 'wsu' universe. */
	tl_assert(ws < wsu->ix2vec_used); /* XXX */
	wv = wsu->ix2vec[ws];
	/* Make absolutely sure that 'ws' is a member of 'wsu'. */
	tl_assert(wv);
	tl_assert(wv->owner == wsu); /* YYY */
	return wv;
	}

	/* See if wv is contained within wsu. If so, deallocate wv and return
	the index of the already-present copy. If not, add wv to both the
	vec2ix and ix2vec mappings and return its index.
	*/
	static WordSet add_or_dealloc_WordVec( WordSetU* wsu, WordVec* wv_new )
	{
	Bool have;
	WordVec* wv_old;
	UWord/Set/ ix_old = -1;
	/* Really WordSet, but need something that can safely be casted to
	a Word* in the lookupFM. Making it WordSet (which is 32 bits)
	causes failures on a 64-bit platform. */
	tl_assert(wv_new->owner == wsu);
	have = VG_(lookupFM)( wsu->vec2ix,
	(Word)&wv_old, (Word)&ix_old,
	(Word)wv_new );
	if (have) {
	tl_assert(wv_old != wv_new);
	tl_assert(wv_old);
	tl_assert(wv_old->owner == wsu);
	tl_assert(ix_old < wsu->ix2vec_used);
	tl_assert(wsu->ix2vec[ix_old] == wv_old);
	delete_WV( wv_new );
	return (WordSet)ix_old;
	} else {
	ensure_ix2vec_space( wsu );
	tl_assert(wsu->ix2vec);
	tl_assert(wsu->ix2vec_used < wsu->ix2vec_size);
	wsu->ix2vec[wsu->ix2vec_used] = wv_new;
	VG_(addToFM)( wsu->vec2ix, (Word)wv_new, (Word)wsu->ix2vec_used );
	if (0) VG_(printf)("aodW %d\n", (Int)wsu->ix2vec_used );
	wsu->ix2vec_used++;
	tl_assert(wsu->ix2vec_used <= wsu->ix2vec_size);
	return (WordSet)(wsu->ix2vec_used - 1);
	}
	}


	WordSetU* HG_(newWordSetU) ( void* (alloc_nofail)( HChar, SizeT ),
	HChar* cc,
	void (dealloc)(void),
	Word cacheSize )
	{
	WordSetU* wsu;
	WordVec* empty;

	wsu = alloc_nofail( cc, sizeof(WordSetU) );
	VG_(memset)( wsu, 0, sizeof(WordSetU) );
	wsu->alloc = alloc_nofail;
	wsu->cc = cc;
	wsu->dealloc = dealloc;
	wsu->vec2ix = VG_(newFM)( alloc_nofail, cc,
	dealloc, cmp_WordVecs_for_FM );
	wsu->ix2vec_used = 0;
	wsu->ix2vec_size = 0;
	wsu->ix2vec = NULL;
	WCache_INIT(wsu->cache_addTo, cacheSize);
	WCache_INIT(wsu->cache_delFrom, cacheSize);
	WCache_INIT(wsu->cache_intersect, cacheSize);
	WCache_INIT(wsu->cache_minus, cacheSize);
	empty = new_WV_of_size( wsu, 0 );
	wsu->empty = add_or_dealloc_WordVec( wsu, empty );

	return wsu;
	}

	void HG_(deleteWordSetU) ( WordSetU* wsu )
	{
	void (dealloc)(void) = wsu->dealloc;
	tl_assert(wsu->vec2ix);
	VG_(deleteFM)( wsu->vec2ix, delete_WV_for_FM, NULL/val-finalizer/ );
	if (wsu->ix2vec)
	dealloc(wsu->ix2vec);
	dealloc(wsu);
	}

	WordSet HG_(emptyWS) ( WordSetU* wsu )
	{
	return wsu->empty;
	}

	Bool HG_(isEmptyWS) ( WordSetU* wsu, WordSet ws )
	{
	WordVec* wv = do_ix2vec( wsu, ws );
	wsu->n_isEmpty++;
	if (wv->size == 0) {
	tl_assert(ws == wsu->empty);
	return True;
	} else {
	tl_assert(ws != wsu->empty);
	return False;
	}
	}

	Bool HG_(isSingletonWS) ( WordSetU* wsu, WordSet ws, UWord w )
	{
	WordVec* wv;
	tl_assert(wsu);
	wsu->n_isSingleton++;
	wv = do_ix2vec( wsu, ws );
	return (Bool)(wv->size == 1 && wv->words[0] == w);
	}

	UWord HG_(cardinalityWS) ( WordSetU* wsu, WordSet ws )
	{
	WordVec* wv;
	tl_assert(wsu);
	wv = do_ix2vec( wsu, ws );
	tl_assert(wv->size >= 0);
	return wv->size;
	}

	UWord HG_(anyElementOfWS) ( WordSetU* wsu, WordSet ws )
	{
	WordVec* wv;
	tl_assert(wsu);
	wsu->n_anyElementOf++;
	wv = do_ix2vec( wsu, ws );
	tl_assert(wv->size >= 1);
	return wv->words[0];
	}

	UWord HG_(cardinalityWSU) ( WordSetU* wsu )
	{
	tl_assert(wsu);
	return wsu->ix2vec_used;
	}

	void HG_(getPayloadWS) ( /OUT/UWord** words, /OUT/UWord* nWords,
	WordSetU* wsu, WordSet ws )
	{
	WordVec* wv;
	tl_assert(wsu);
	wv = do_ix2vec( wsu, ws );
	tl_assert(wv->size >= 0);
	*nWords = wv->size;
	*words = wv->words;
	}

	Bool HG_(plausibleWS) ( WordSetU* wsu, WordSet ws )
	{
	if (wsu == NULL) return False;
	if (ws < 0 \|\| ws >= wsu->ix2vec_used)
	return False;
	return True;
	}

	Bool HG_(saneWS_SLOW) ( WordSetU* wsu, WordSet ws )
	{
	WordVec* wv;
	UWord i;
	if (wsu == NULL) return False;
	if (ws < 0 \|\| ws >= wsu->ix2vec_used)
	return False;
	wv = do_ix2vec( wsu, ws );
	/* can never happen .. do_ix2vec will assert instead. Oh well. */
	if (wv->owner != wsu) return False;
	if (wv->size < 0) return False;
	if (wv->size > 0) {
	for (i = 0; i < wv->size-1; i++) {
	if (wv->words[i] >= wv->words[i+1])
	return False;
	}
	}
	return True;
	}

	Bool HG_(elemWS) ( WordSetU* wsu, WordSet ws, UWord w )
	{
	UWord i;
	WordVec* wv = do_ix2vec( wsu, ws );
	wsu->n_elem++;
	for (i = 0; i < wv->size; i++) {
	if (wv->words[i] == w)
	return True;
	}
	return False;
	}

	WordSet HG_(doubletonWS) ( WordSetU* wsu, UWord w1, UWord w2 )
	{
	WordVec* wv;
	wsu->n_doubleton++;
	if (w1 == w2) {
	wv = new_WV_of_size(wsu, 1);
	wv->words[0] = w1;
	}
	else if (w1 < w2) {
	wv = new_WV_of_size(wsu, 2);
	wv->words[0] = w1;
	wv->words[1] = w2;
	}
	else {
	tl_assert(w1 > w2);
	wv = new_WV_of_size(wsu, 2);
	wv->words[0] = w2;
	wv->words[1] = w1;
	}
	return add_or_dealloc_WordVec( wsu, wv );
	}

	WordSet HG_(singletonWS) ( WordSetU* wsu, UWord w )
	{
	return HG_(doubletonWS)( wsu, w, w );
	}

	WordSet HG_(isSubsetOf) ( WordSetU* wsu, WordSet small, WordSet big )
	{
	wsu->n_isSubsetOf++;
	return small == HG_(intersectWS)( wsu, small, big );
	}

	void HG_(ppWS) ( WordSetU* wsu, WordSet ws )
	{
	UWord i;
	WordVec* wv;
	tl_assert(wsu);
	wv = do_ix2vec( wsu, ws );
	VG_(printf)("{");
	for (i = 0; i < wv->size; i++) {
	VG_(printf)("%p", (void*)wv->words[i]);
	if (i < wv->size-1)
	VG_(printf)(",");
	}
	VG_(printf)("}");
	}

	void HG_(ppWSUstats) ( WordSetU* wsu, HChar* name )
	{
	VG_(printf)(" WordSet \"%s\":\n", name);
	VG_(printf)(" addTo %10lu (%lu uncached)\n",
	wsu->n_add, wsu->n_add_uncached);
	VG_(printf)(" delFrom %10lu (%lu uncached)\n",
	wsu->n_del, wsu->n_del_uncached);
	VG_(printf)(" union %10lu\n", wsu->n_union);
	VG_(printf)(" intersect %10lu (%lu uncached) "
	"[nb. incl isSubsetOf]\n",
	wsu->n_intersect, wsu->n_intersect_uncached);
	VG_(printf)(" minus %10lu (%lu uncached)\n",
	wsu->n_minus, wsu->n_minus_uncached);
	VG_(printf)(" elem %10lu\n", wsu->n_elem);
	VG_(printf)(" doubleton %10lu\n", wsu->n_doubleton);
	VG_(printf)(" isEmpty %10lu\n", wsu->n_isEmpty);
	VG_(printf)(" isSingleton %10lu\n", wsu->n_isSingleton);
	VG_(printf)(" anyElementOf %10lu\n", wsu->n_anyElementOf);
	VG_(printf)(" isSubsetOf %10lu\n", wsu->n_isSubsetOf);
	}

	WordSet HG_(addToWS) ( WordSetU* wsu, WordSet ws, UWord w )
	{
	UWord k, j;
	WordVec* wv_new;
	WordVec* wv;
	WordSet result = (WordSet)(-1); /* bogus */

	wsu->n_add++;
	WCache_LOOKUP_AND_RETURN(WordSet, wsu->cache_addTo, ws, w);
	wsu->n_add_uncached++;

	/* If already present, this is a no-op. */
	wv = do_ix2vec( wsu, ws );
	for (k = 0; k < wv->size; k++) {
	if (wv->words[k] == w) {
	result = ws;
	goto out;
	}
	}
	/* Ok, not present. Build a new one ... */
	wv_new = new_WV_of_size( wsu, wv->size + 1 );
	k = j = 0;
	for (; k < wv->size && wv->words[k] < w; k++) {
	wv_new->words[j++] = wv->words[k];
	}
	wv_new->words[j++] = w;
	for (; k < wv->size; k++) {
	tl_assert(wv->words[k] > w);
	wv_new->words[j++] = wv->words[k];
	}
	tl_assert(j == wv_new->size);

	/* Find any existing copy, or add the new one. */
	result = add_or_dealloc_WordVec( wsu, wv_new );
	tl_assert(result != (WordSet)(-1));

	out:
	WCache_UPDATE(wsu->cache_addTo, ws, w, result);
	return result;
	}

	WordSet HG_(delFromWS) ( WordSetU* wsu, WordSet ws, UWord w )
	{
	UWord i, j, k;
	WordVec* wv_new;
	WordSet result = (WordSet)(-1); /* bogus */
	WordVec* wv = do_ix2vec( wsu, ws );

	wsu->n_del++;

	/* special case empty set */
	if (wv->size == 0) {
	tl_assert(ws == wsu->empty);
	return ws;
	}

	WCache_LOOKUP_AND_RETURN(WordSet, wsu->cache_delFrom, ws, w);
	wsu->n_del_uncached++;

	/* If not already present, this is a no-op. */
	for (i = 0; i < wv->size; i++) {
	if (wv->words[i] == w)
	break;
	}
	if (i == wv->size) {
	result = ws;
	goto out;
	}
	/* So w is present in ws, and the new set will be one element
	smaller. */
	tl_assert(i >= 0 && i < wv->size);
	tl_assert(wv->size > 0);

	wv_new = new_WV_of_size( wsu, wv->size - 1 );
	j = k = 0;
	for (; j < wv->size; j++) {
	if (j == i)
	continue;
	wv_new->words[k++] = wv->words[j];
	}
	tl_assert(k == wv_new->size);

	result = add_or_dealloc_WordVec( wsu, wv_new );
	if (wv->size == 1) {
	tl_assert(result == wsu->empty);
	}

	out:
	WCache_UPDATE(wsu->cache_delFrom, ws, w, result);
	return result;
	}

	WordSet HG_(unionWS) ( WordSetU* wsu, WordSet ws1, WordSet ws2 )
	{
	UWord i1, i2, k, sz;
	WordVec* wv_new;
	WordVec* wv1 = do_ix2vec( wsu, ws1 );
	WordVec* wv2 = do_ix2vec( wsu, ws2 );
	wsu->n_union++;
	sz = 0;
	i1 = i2 = 0;
	while (1) {
	if (i1 >= wv1->size \|\| i2 >= wv2->size)
	break;
	sz++;
	if (wv1->words[i1] < wv2->words[i2]) {
	i1++;
	} else
	if (wv1->words[i1] > wv2->words[i2]) {
	i2++;
	} else {
	i1++;
	i2++;
	}
	}
	tl_assert(i1 <= wv1->size);
	tl_assert(i2 <= wv2->size);
	tl_assert(i1 == wv1->size \|\| i2 == wv2->size);
	if (i1 == wv1->size && i2 < wv2->size) {
	sz += (wv2->size - i2);
	}
	if (i2 == wv2->size && i1 < wv1->size) {
	sz += (wv1->size - i1);
	}

	wv_new = new_WV_of_size( wsu, sz );
	k = 0;

	i1 = i2 = 0;
	while (1) {
	if (i1 >= wv1->size \|\| i2 >= wv2->size)
	break;
	if (wv1->words[i1] < wv2->words[i2]) {
	wv_new->words[k++] = wv1->words[i1];
	i1++;
	} else
	if (wv1->words[i1] > wv2->words[i2]) {
	wv_new->words[k++] = wv2->words[i2];
	i2++;
	} else {
	wv_new->words[k++] = wv1->words[i1];
	i1++;
	i2++;
	}
	}
	tl_assert(i1 <= wv1->size);
	tl_assert(i2 <= wv2->size);
	tl_assert(i1 == wv1->size \|\| i2 == wv2->size);
	if (i1 == wv1->size && i2 < wv2->size) {
	while (i2 < wv2->size)
	wv_new->words[k++] = wv2->words[i2++];
	}
	if (i2 == wv2->size && i1 < wv1->size) {
	while (i1 < wv1->size)
	wv_new->words[k++] = wv1->words[i1++];
	}

	tl_assert(k == sz);

	return add_or_dealloc_WordVec( wsu, wv_new );
	}

	WordSet HG_(intersectWS) ( WordSetU* wsu, WordSet ws1, WordSet ws2 )
	{
	UWord i1, i2, k, sz;
	WordSet ws_new = (WordSet)(-1); /* bogus */
	WordVec* wv_new;
	WordVec* wv1;
	WordVec* wv2;

	wsu->n_intersect++;

	/* Deal with an obvious case fast. */
	if (ws1 == ws2)
	return ws1;

	/* Since intersect(x,y) == intersect(y,x), convert both variants to
	the same query. This reduces the number of variants the cache
	has to deal with. */
	if (ws1 > ws2) {
	WordSet wst = ws1; ws1 = ws2; ws2 = wst;
	}

	WCache_LOOKUP_AND_RETURN(WordSet, wsu->cache_intersect, ws1, ws2);
	wsu->n_intersect_uncached++;

	wv1 = do_ix2vec( wsu, ws1 );
	wv2 = do_ix2vec( wsu, ws2 );
	sz = 0;
	i1 = i2 = 0;
	while (1) {
	if (i1 >= wv1->size \|\| i2 >= wv2->size)
	break;
	if (wv1->words[i1] < wv2->words[i2]) {
	i1++;
	} else
	if (wv1->words[i1] > wv2->words[i2]) {
	i2++;
	} else {
	sz++;
	i1++;
	i2++;
	}
	}
	tl_assert(i1 <= wv1->size);
	tl_assert(i2 <= wv2->size);
	tl_assert(i1 == wv1->size \|\| i2 == wv2->size);

	wv_new = new_WV_of_size( wsu, sz );
	k = 0;

	i1 = i2 = 0;
	while (1) {
	if (i1 >= wv1->size \|\| i2 >= wv2->size)
	break;
	if (wv1->words[i1] < wv2->words[i2]) {
	i1++;
	} else
	if (wv1->words[i1] > wv2->words[i2]) {
	i2++;
	} else {
	wv_new->words[k++] = wv1->words[i1];
	i1++;
	i2++;
	}
	}
	tl_assert(i1 <= wv1->size);
	tl_assert(i2 <= wv2->size);
	tl_assert(i1 == wv1->size \|\| i2 == wv2->size);

	tl_assert(k == sz);

	ws_new = add_or_dealloc_WordVec( wsu, wv_new );
	if (sz == 0) {
	tl_assert(ws_new == wsu->empty);
	}

	tl_assert(ws_new != (WordSet)(-1));
	WCache_UPDATE(wsu->cache_intersect, ws1, ws2, ws_new);

	return ws_new;
	}

	WordSet HG_(minusWS) ( WordSetU* wsu, WordSet ws1, WordSet ws2 )
	{
	UWord i1, i2, k, sz;
	WordSet ws_new = (WordSet)(-1); /* bogus */
	WordVec* wv_new;
	WordVec* wv1;
	WordVec* wv2;

	wsu->n_minus++;
	WCache_LOOKUP_AND_RETURN(WordSet, wsu->cache_minus, ws1, ws2);
	wsu->n_minus_uncached++;

	wv1 = do_ix2vec( wsu, ws1 );
	wv2 = do_ix2vec( wsu, ws2 );
	sz = 0;
	i1 = i2 = 0;
	while (1) {
	if (i1 >= wv1->size \|\| i2 >= wv2->size)
	break;
	if (wv1->words[i1] < wv2->words[i2]) {
	sz++;
	i1++;
	} else
	if (wv1->words[i1] > wv2->words[i2]) {
	i2++;
	} else {
	i1++;
	i2++;
	}
	}
	tl_assert(i1 <= wv1->size);
	tl_assert(i2 <= wv2->size);
	tl_assert(i1 == wv1->size \|\| i2 == wv2->size);
	if (i2 == wv2->size && i1 < wv1->size) {
	sz += (wv1->size - i1);
	}

	wv_new = new_WV_of_size( wsu, sz );
	k = 0;

	i1 = i2 = 0;
	while (1) {
	if (i1 >= wv1->size \|\| i2 >= wv2->size)
	break;
	if (wv1->words[i1] < wv2->words[i2]) {
	wv_new->words[k++] = wv1->words[i1];
	i1++;
	} else
	if (wv1->words[i1] > wv2->words[i2]) {
	i2++;
	} else {
	i1++;
	i2++;
	}
	}
	tl_assert(i1 <= wv1->size);
	tl_assert(i2 <= wv2->size);
	tl_assert(i1 == wv1->size \|\| i2 == wv2->size);
	if (i2 == wv2->size && i1 < wv1->size) {
	while (i1 < wv1->size)
	wv_new->words[k++] = wv1->words[i1++];
	}

	tl_assert(k == sz);

	ws_new = add_or_dealloc_WordVec( wsu, wv_new );
	if (sz == 0) {
	tl_assert(ws_new == wsu->empty);
	}

	tl_assert(ws_new != (WordSet)(-1));
	WCache_UPDATE(wsu->cache_minus, ws1, ws2, ws_new);

	return ws_new;
	}

	static __attribute__((unused))
	void show_WS ( WordSetU* wsu, WordSet ws )
	{
	UWord i;
	WordVec* wv = do_ix2vec( wsu, ws );
	VG_(printf)("#%u{", ws);
	for (i = 0; i < wv->size; i++) {
	VG_(printf)("%lu", wv->words[i]);
	if (i < wv->size-1)
	VG_(printf)(",");
	}
	VG_(printf)("}\n");
	}

	//------------------------------------------------------------------//
	//--- end WordSet ---//
	//--- Implementation ---//
	//------------------------------------------------------------------//

	/--------------------------------------------------------------------/
	/--- end hg_wordset.c ---/
	/--------------------------------------------------------------------/