/* Generic string table handling. Copyright (C) 2000, 2001, 2002, 2005 Red Hat, Inc. This file is part of elfutils. Written by Ulrich Drepper , 2000. This file is free software; you can redistribute it and/or modify it under the terms of either * the GNU Lesser General Public License as published by the Free Software Foundation; either version 3 of the License, or (at your option) any later version or * the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version or both in parallel, as here. elfutils is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received copies of the GNU General Public License and the GNU Lesser General Public License along with this program. If not, see . */ #ifdef HAVE_CONFIG_H # include #endif #include #include #include #include #include #include #include #include #include "libebl.h" #ifndef MIN # define MIN(a, b) ((a) < (b) ? (a) : (b)) #endif struct Ebl_GStrent { const char *string; size_t len; struct Ebl_GStrent *next; struct Ebl_GStrent *left; struct Ebl_GStrent *right; size_t offset; unsigned int width; char reverse[0]; }; struct memoryblock { struct memoryblock *next; char memory[0]; }; struct Ebl_GStrtab { struct Ebl_GStrent *root; struct memoryblock *memory; char *backp; size_t left; size_t total; unsigned int width; bool nullstr; struct Ebl_GStrent null; }; /* Cache for the pagesize. We correct this value a bit so that `malloc' is not allocating more than a page. */ static size_t ps; struct Ebl_GStrtab * ebl_gstrtabinit (unsigned int width, bool nullstr) { struct Ebl_GStrtab *ret; if (ps == 0) { ps = sysconf (_SC_PAGESIZE) - 2 * sizeof (void *); assert (sizeof (struct memoryblock) < ps); } ret = (struct Ebl_GStrtab *) calloc (1, sizeof (struct Ebl_GStrtab)); if (ret != NULL) { ret->width = width; ret->nullstr = nullstr; if (nullstr) { ret->null.len = 1; ret->null.string = (char *) calloc (1, width); } } return ret; } static void morememory (struct Ebl_GStrtab *st, size_t len) { struct memoryblock *newmem; if (len < ps) len = ps; newmem = (struct memoryblock *) malloc (len); if (newmem == NULL) abort (); newmem->next = st->memory; st->memory = newmem; st->backp = newmem->memory; st->left = len - offsetof (struct memoryblock, memory); } void ebl_gstrtabfree (struct Ebl_GStrtab *st) { struct memoryblock *mb = st->memory; while (mb != NULL) { void *old = mb; mb = mb->next; free (old); } if (st->null.string != NULL) free ((char *) st->null.string); free (st); } static struct Ebl_GStrent * newstring (struct Ebl_GStrtab *st, const char *str, size_t len) { /* Compute the amount of padding needed to make the structure aligned. */ size_t align = ((__alignof__ (struct Ebl_GStrent) - (((uintptr_t) st->backp) & (__alignof__ (struct Ebl_GStrent) - 1))) & (__alignof__ (struct Ebl_GStrent) - 1)); /* Make sure there is enough room in the memory block. */ if (st->left < align + sizeof (struct Ebl_GStrent) + len * st->width) { morememory (st, sizeof (struct Ebl_GStrent) + len * st->width); align = 0; } /* Create the reserved string. */ struct Ebl_GStrent *newstr = (struct Ebl_GStrent *) (st->backp + align); newstr->string = str; newstr->len = len; newstr->width = st->width; newstr->next = NULL; newstr->left = NULL; newstr->right = NULL; newstr->offset = 0; for (int i = len - 2; i >= 0; --i) for (int j = st->width - 1; j >= 0; --j) newstr->reverse[i * st->width + j] = str[(len - 2 - i) * st->width + j]; for (size_t j = 0; j < st->width; ++j) newstr->reverse[(len - 1) * st->width + j] = '\0'; st->backp += align + sizeof (struct Ebl_GStrent) + len * st->width; st->left -= align + sizeof (struct Ebl_GStrent) + len * st->width; return newstr; } /* XXX This function should definitely be rewritten to use a balancing tree algorith (AVL, red-black trees). For now a simple, correct implementation is enough. */ static struct Ebl_GStrent ** searchstring (struct Ebl_GStrent **sep, struct Ebl_GStrent *newstr) { int cmpres; /* More strings? */ if (*sep == NULL) { *sep = newstr; return sep; } /* Compare the strings. */ cmpres = memcmp ((*sep)->reverse, newstr->reverse, (MIN ((*sep)->len, newstr->len) - 1) * (*sep)->width); if (cmpres == 0) /* We found a matching string. */ return sep; else if (cmpres > 0) return searchstring (&(*sep)->left, newstr); else return searchstring (&(*sep)->right, newstr); } /* Add new string. The actual string is assumed to be permanent. */ struct Ebl_GStrent * ebl_gstrtabadd (struct Ebl_GStrtab *st, const char *str, size_t len) { struct Ebl_GStrent *newstr; struct Ebl_GStrent **sep; /* Compute the string length if the caller doesn't know it. */ if (len == 0) { size_t j; do for (j = 0; j < st->width; ++j) if (str[len * st->width + j] != '\0') break; while (j == st->width && ++len); } /* Make sure all "" strings get offset 0 but only if the table was created with a special null entry in mind. */ if (len == 1 && st->null.string != NULL) return &st->null; /* Allocate memory for the new string and its associated information. */ newstr = newstring (st, str, len); /* Search in the array for the place to insert the string. If there is no string with matching prefix and no string with matching leading substring, create a new entry. */ sep = searchstring (&st->root, newstr); if (*sep != newstr) { /* This is not the same entry. This means we have a prefix match. */ if ((*sep)->len > newstr->len) { struct Ebl_GStrent *subs; /* Check whether we already know this string. */ for (subs = (*sep)->next; subs != NULL; subs = subs->next) if (subs->len == newstr->len) { /* We have an exact match with a substring. Free the memory we allocated. */ st->left += (st->backp - (char *) newstr) * st->width; st->backp = (char *) newstr; return subs; } /* We have a new substring. This means we don't need the reverse string of this entry anymore. */ st->backp -= newstr->len; st->left += newstr->len; newstr->next = (*sep)->next; (*sep)->next = newstr; } else if ((*sep)->len != newstr->len) { /* When we get here it means that the string we are about to add has a common prefix with a string we already have but it is longer. In this case we have to put it first. */ st->total += newstr->len - (*sep)->len; newstr->next = *sep; newstr->left = (*sep)->left; newstr->right = (*sep)->right; *sep = newstr; } else { /* We have an exact match. Free the memory we allocated. */ st->left += (st->backp - (char *) newstr) * st->width; st->backp = (char *) newstr; newstr = *sep; } } else st->total += newstr->len; return newstr; } static void copystrings (struct Ebl_GStrent *nodep, char **freep, size_t *offsetp) { struct Ebl_GStrent *subs; if (nodep->left != NULL) copystrings (nodep->left, freep, offsetp); /* Process the current node. */ nodep->offset = *offsetp; *freep = (char *) mempcpy (*freep, nodep->string, nodep->len * nodep->width); *offsetp += nodep->len * nodep->width; for (subs = nodep->next; subs != NULL; subs = subs->next) { assert (subs->len < nodep->len); subs->offset = nodep->offset + (nodep->len - subs->len) * nodep->width; assert (subs->offset != 0 || subs->string[0] == '\0'); } if (nodep->right != NULL) copystrings (nodep->right, freep, offsetp); } void ebl_gstrtabfinalize (struct Ebl_GStrtab *st, Elf_Data *data) { size_t copylen; char *endp; size_t nulllen = st->nullstr ? st->width : 0; /* Fill in the information. */ data->d_buf = malloc (st->total + nulllen); if (data->d_buf == NULL) abort (); /* The first byte must always be zero if we created the table with a null string. */ if (st->nullstr) memset (data->d_buf, '\0', st->width); data->d_type = ELF_T_BYTE; data->d_size = st->total + nulllen; data->d_off = 0; data->d_align = 1; data->d_version = EV_CURRENT; /* Now run through the tree and add all the string while also updating the offset members of the elfstrent records. */ endp = (char *) data->d_buf + nulllen; copylen = nulllen; copystrings (st->root, &endp, ©len); assert (copylen == st->total * st->width + nulllen); } size_t ebl_gstrtaboffset (struct Ebl_GStrent *se) { return se->offset; }