1 /*--------------------------------------------------------------------*/
2 /*--- A pool (memory) allocator that avoids duplicated copies.     ---*/
3 /*---                                           m_deduppoolalloc.c ---*/
4 /*--------------------------------------------------------------------*/
5 /*
6    This file is part of Valgrind, a dynamic binary instrumentation
7    framework.
8 
9    Copyright (C) 2014-2014 Philippe Waroquiers philippe.waroquiers@skynet.be
10 
11    This program is free software; you can redistribute it and/or
12    modify it under the terms of the GNU General Public License as
13    published by the Free Software Foundation; either version 2 of the
14    License, or (at your option) any later version.
15 
16    This program is distributed in the hope that it will be useful, but
17    WITHOUT ANY WARRANTY; without even the implied warranty of
18    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
19    General Public License for more details.
20 
21    You should have received a copy of the GNU General Public License
22    along with this program; if not, write to the Free Software
23    Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
24    02111-1307, USA.
25 
26    The GNU General Public License is contained in the file COPYING.
27 */
28 
29 #include "pub_core_basics.h"
30 #include "pub_core_libcbase.h"
31 #include "pub_core_libcprint.h"
32 #include "pub_core_libcassert.h"
33 #include "pub_core_xarray.h"
34 #include "pub_core_deduppoolalloc.h" /* self */
35 #include "pub_core_hashtable.h"
36 #include "pub_core_poolalloc.h"
37 #include "pub_core_options.h"
38 #include "pub_core_mallocfree.h"
39 #include "pub_core_debuglog.h"
40 
41 struct _DedupPoolAlloc {
42    SizeT  poolSzB; /* Minimum size of a pool. */
43    SizeT  fixedSzb; /* If using VG_(allocFixedEltDedupPA), size of elements */
44    SizeT  eltAlign;
45    void*   (*alloc_fn)(const HChar*, SizeT); /* pool allocator */
46    const HChar*  cc; /* pool allocator's cost centre */
47    void    (*free_fn)(void*); /* pool allocator's deallocation function */
48    /* XArray of void* (pointers to pools).  The pools themselves.
49       Each element is a pointer to a block of size at least PoolSzB bytes.
50       The last block might be smaller due to a call to shrink_block. */
51    XArray *pools;
52 
53    /* hash table of pool elements, used to dedup.
54       If NULL, it means the DedupPoolAlloc is frozen. */
55    VgHashTable *ht_elements;
56 
57    /* Hash table nodes of pool_elements are allocated with a pool, to
58       decrease memory overhead during insertion in the DedupPoolAlloc. */
59    PoolAlloc *ht_node_pa;
60 
61    UChar *curpool;       /* last allocated pool. */
62    UChar *curpool_free;  /* Pos in current pool to allocate next elt.
63                             always aligned on eltAlign. */
64    UChar *curpool_limit; /* Last pos in current pool. */
65    /* Note that for a fixed size pool, we only have a single pool to allow
66       simple/fast indexing. This single pool is grown, which might change
67       the address of the already allocated elements. */
68 
69    /* Total nr of alloc calls, resulting in (we hope) a lot less
70       real (dedup) elements. */
71    ULong nr_alloc_calls;
72 };
73 
74 typedef
75    struct _ht_node {
76       struct _ht_node *next; // Read/Write by hashtable (pub_tool_hashtable.h)
77       UWord   key;           // Read by hashtable (pub_tool_hashtable.h)
78       SizeT   eltSzB;
79       const void *elt;
80    }
81    ht_node;
82 
VG_(newDedupPA)83 DedupPoolAlloc* VG_(newDedupPA) ( SizeT  poolSzB,
84                                   SizeT  eltAlign,
85                                   void*  (*alloc_fn)(const HChar*, SizeT),
86                                   const  HChar* cc,
87                                   void   (*free_fn)(void*) )
88 {
89    DedupPoolAlloc* ddpa;
90    vg_assert(poolSzB >= eltAlign);
91    vg_assert(poolSzB >= 100); /* let's say */
92    vg_assert(poolSzB >= 10*eltAlign); /* let's say */
93    vg_assert(alloc_fn);
94    vg_assert(cc);
95    vg_assert(free_fn);
96    ddpa = alloc_fn(cc, sizeof(*ddpa));
97    VG_(memset)(ddpa, 0, sizeof(*ddpa));
98    ddpa->poolSzB  = poolSzB;
99    ddpa->fixedSzb = 0;
100    ddpa->eltAlign = eltAlign;
101    ddpa->alloc_fn = alloc_fn;
102    ddpa->cc       = cc;
103    ddpa->free_fn  = free_fn;
104    ddpa->pools    = VG_(newXA)( alloc_fn, cc, free_fn, sizeof(void*) );
105 
106    ddpa->ht_elements = VG_(HT_construct) (cc);
107    ddpa->ht_node_pa = VG_(newPA) ( sizeof(ht_node),
108                                    1000,
109                                    alloc_fn,
110                                    cc,
111                                    free_fn);
112    ddpa->curpool = NULL;
113    ddpa->curpool_limit = NULL;
114    ddpa->curpool_free = NULL;
115 
116    return ddpa;
117 }
118 
VG_(deleteDedupPA)119 void VG_(deleteDedupPA) ( DedupPoolAlloc* ddpa)
120 {
121    Word i;
122    if (ddpa->ht_elements)
123       // Free data structures used for insertion.
124       VG_(freezeDedupPA) (ddpa, NULL);
125    for (i = 0; i < VG_(sizeXA) (ddpa->pools); i++)
126       ddpa->free_fn (*(UWord **)VG_(indexXA) ( ddpa->pools, i ));
127    VG_(deleteXA) (ddpa->pools);
128    ddpa->free_fn (ddpa);
129 }
130 
131 static __inline__
ddpa_align(DedupPoolAlloc * ddpa,UChar * c)132 UChar* ddpa_align ( DedupPoolAlloc* ddpa, UChar *c )
133 {
134    return (UChar*)VG_ROUNDUP(c, ddpa->eltAlign);
135 }
136 
137 /* Allocate a new pool or grow the (only) pool for a fixed size ddpa. */
138 __attribute__((noinline))
ddpa_add_new_pool_or_grow(DedupPoolAlloc * ddpa)139 static void ddpa_add_new_pool_or_grow ( DedupPoolAlloc* ddpa )
140 {
141    vg_assert(ddpa);
142 
143    if (ddpa->fixedSzb > 0 && ddpa->curpool != NULL) {
144       // Grow (* 2) the current (fixed elt) pool
145       UChar *curpool_align = ddpa_align(ddpa, ddpa->curpool);
146       SizeT curpool_used = ddpa->curpool_free - curpool_align;
147       SizeT curpool_size = ddpa->curpool_limit - ddpa->curpool + 1;
148       UChar *newpool = ddpa->alloc_fn (ddpa->cc, 2 * curpool_size);
149       UChar *newpool_free = ddpa_align (ddpa, newpool);
150       UChar *newpool_limit = newpool + 2 * curpool_size - 1;
151       Word reloc_offset = (Addr)newpool_free - (Addr)curpool_align;
152       ht_node *n;
153 
154       VG_(memcpy) (newpool_free, curpool_align, curpool_used);
155       /* We have reallocated the (only) pool. We need to relocate the pointers
156          in the hash table nodes. */
157       VG_(HT_ResetIter) (ddpa->ht_elements);
158       while ((n = VG_(HT_Next) (ddpa->ht_elements))) {
159         n->elt = (void*)((Addr)n->elt + reloc_offset);
160       }
161       newpool_free += curpool_used;
162 
163       VG_(dropHeadXA) (ddpa->pools, 1);
164       ddpa->free_fn (ddpa->curpool);
165       ddpa->curpool = newpool;
166       ddpa->curpool_free = newpool_free;
167       ddpa->curpool_limit = newpool_limit;
168       VG_(addToXA)( ddpa->pools, &ddpa->curpool);
169    } else {
170       /* Allocate a new pool, or allocate the first/only pool for a
171          fixed size ddpa. */
172       ddpa->curpool = ddpa->alloc_fn( ddpa->cc, ddpa->poolSzB);
173       ddpa->curpool_limit = ddpa->curpool + ddpa->poolSzB - 1;
174       ddpa->curpool_free = ddpa_align (ddpa, ddpa->curpool);
175       /* add to our collection of pools */
176       VG_(addToXA)( ddpa->pools, &ddpa->curpool );
177    }
178 }
179 
180 /* Compare function for 'gen' hash table. No need to compare the key
181    in this function, as the hash table already does it for us,
182    and that in any case, if the data is equal, the keys must also be
183    equal. */
cmp_pool_elt(const void * node1,const void * node2)184 static Word cmp_pool_elt (const void* node1, const void* node2 )
185 {
186    const ht_node* hnode1 = node1;
187    const ht_node* hnode2 = node2;
188 
189    /* As this function is called by hashtable, that has already checked
190       for key equality, it is likely that it is the 'good' element.
191       So, we handle the equal case first. */
192    if (hnode1->eltSzB == hnode2->eltSzB)
193       return VG_(memcmp) (hnode1->elt, hnode2->elt, hnode1->eltSzB);
194    else if (hnode1->eltSzB < hnode2->eltSzB)
195       return -1;
196    else
197       return 1;
198 }
199 
200 /* Print some stats. */
print_stats(DedupPoolAlloc * ddpa)201 static void print_stats (DedupPoolAlloc *ddpa)
202 {
203    VG_(message)(Vg_DebugMsg,
204                 "dedupPA:%s %ld allocs (%d uniq)"
205                 " %ld pools (%ld bytes free in last pool)\n",
206                 ddpa->cc,
207                 (long int) ddpa->nr_alloc_calls,
208                 VG_(HT_count_nodes)(ddpa->ht_elements),
209                 VG_(sizeXA)(ddpa->pools),
210                 ddpa->curpool ?
211                 (long int) (ddpa->curpool_limit - ddpa->curpool_free + 1) : 0);
212    VG_(HT_print_stats) (ddpa->ht_elements, cmp_pool_elt);
213 }
214 
215 /* Dummy free, as the ht elements are allocated in a pool, and
216    we will destroy the pool in one single operation. */
htelem_dummyfree(void * ht_elem)217 static void htelem_dummyfree(void* ht_elem)
218 {
219 }
220 
VG_(freezeDedupPA)221 void VG_(freezeDedupPA) (DedupPoolAlloc *ddpa,
222                          void (*shrink_block)(void*, SizeT))
223 {
224    if (VG_(clo_stats)
225        && (VG_(clo_verbosity) > 2 || VG_(debugLog_getLevel) () >= 2)) {
226       print_stats(ddpa);
227    }
228    vg_assert (!ddpa->fixedSzb || VG_(sizeXA) (ddpa->pools) == 1);
229    if (shrink_block && ddpa->curpool_limit > ddpa->curpool_free)
230       (*shrink_block)(ddpa->curpool, ddpa->curpool_free - ddpa->curpool);
231    VG_(HT_destruct) ( ddpa->ht_elements, htelem_dummyfree);
232    ddpa->ht_elements = NULL;
233    VG_(deletePA) (ddpa->ht_node_pa);
234    ddpa->ht_node_pa = NULL;
235 }
236 
237 
238 // hash function used by gawk and SDBM.
sdbm_hash(const UChar * buf,UInt len)239 static UInt sdbm_hash (const UChar* buf, UInt len )
240 {
241   UInt h;
242   UInt i;
243 
244   h = 0;
245   for (i = 0; i < len; i++)
246     h = *buf++ + (h<<6) + (h<<16) - h;
247   return h;
248 }
249 
VG_(allocEltDedupPA)250 const void* VG_(allocEltDedupPA) (DedupPoolAlloc *ddpa, SizeT eltSzB,
251                                   const void *elt)
252 {
253    ht_node ht_elt;
254    void* elt_ins;
255    ht_node *ht_ins;
256    vg_assert(ddpa);
257    vg_assert(ddpa->ht_elements);
258    vg_assert (eltSzB <= ddpa->poolSzB);
259 
260    ddpa->nr_alloc_calls++;
261 
262    ht_elt.key = sdbm_hash (elt, eltSzB);
263 
264    ht_elt.eltSzB = eltSzB;
265    ht_elt.elt = elt;
266 
267    ht_ins = VG_(HT_gen_lookup) (ddpa->ht_elements, &ht_elt, cmp_pool_elt);
268    if (ht_ins)
269       return ht_ins->elt;
270 
271    /* Not found -> we need to allocate a new element from the pool
272       and insert it in the hash table of inserted elements. */
273 
274    // Add a new pool or grow pool if not enough space in the current pool
275    if (UNLIKELY(ddpa->curpool_free == NULL
276                 || ddpa->curpool_free + eltSzB - 1 > ddpa->curpool_limit)) {
277       ddpa_add_new_pool_or_grow (ddpa);
278    }
279 
280    elt_ins = ddpa->curpool_free;
281    VG_(memcpy)(elt_ins, elt, eltSzB);
282    ddpa->curpool_free = ddpa_align(ddpa, ddpa->curpool_free + eltSzB);
283 
284    ht_ins = VG_(allocEltPA) (ddpa->ht_node_pa);
285    ht_ins->key = ht_elt.key;
286    ht_ins->eltSzB = eltSzB;
287    ht_ins->elt = elt_ins;
288    VG_(HT_add_node)(ddpa->ht_elements, ht_ins);
289    return elt_ins;
290 }
291 
292 static __inline__
elt2nr(DedupPoolAlloc * ddpa,const void * dedup_elt)293 UInt elt2nr (DedupPoolAlloc *ddpa, const void *dedup_elt)
294 {
295    vg_assert (dedup_elt >= (const void *)ddpa->curpool
296               && dedup_elt < (const void *)ddpa->curpool_free);
297    return 1 + ((const UChar*)dedup_elt - (const UChar *)ddpa->curpool)
298       / VG_ROUNDUP(ddpa->fixedSzb, ddpa->eltAlign);
299 }
300 
VG_(allocFixedEltDedupPA)301 UInt VG_(allocFixedEltDedupPA) (DedupPoolAlloc *ddpa,
302                                 SizeT eltSzB, const void *elt)
303 {
304    if (ddpa->fixedSzb == 0) {
305       // First insertion in this ddpa
306       vg_assert (ddpa->nr_alloc_calls == 0);
307       vg_assert (eltSzB > 0);
308       ddpa->fixedSzb = eltSzB;
309    }
310    vg_assert (ddpa->fixedSzb == eltSzB);
311    const void *dedup_elt = VG_(allocEltDedupPA) (ddpa, eltSzB, elt);
312    return elt2nr (ddpa, dedup_elt);
313 }
314 
VG_(indexEltNumber)315 void* VG_(indexEltNumber) (DedupPoolAlloc *ddpa,
316                            UInt eltNr)
317 {
318    void *dedup_elt;
319 
320    dedup_elt = ddpa->curpool
321       + (eltNr - 1) * VG_ROUNDUP(ddpa->fixedSzb, ddpa->eltAlign);
322 
323    vg_assert ((UChar*)dedup_elt >= ddpa->curpool
324               && (UChar*)dedup_elt < ddpa->curpool_free);
325 
326    return dedup_elt;
327 }
328 
VG_(sizeDedupPA)329 UInt VG_(sizeDedupPA) (DedupPoolAlloc *ddpa)
330 {
331    if (ddpa->curpool == NULL)
332       return 0;
333 
334    vg_assert (ddpa->fixedSzb);
335    return (ddpa->curpool_free - ddpa_align(ddpa, ddpa->curpool))
336       / VG_ROUNDUP(ddpa->fixedSzb, ddpa->eltAlign);
337 }
338