mirror of
https://github.com/bminor/binutils-gdb.git
synced 2025-11-16 12:34:43 +00:00
830 lines
24 KiB
C
830 lines
24 KiB
C
/* CTF string table management.
|
|
Copyright (C) 2019-2025 Free Software Foundation, Inc.
|
|
|
|
This file is part of libctf.
|
|
|
|
libctf is free software; you can redistribute it and/or modify it under
|
|
the terms of the GNU General Public License as published by the Free
|
|
Software Foundation; either version 3, or (at your option) any later
|
|
version.
|
|
|
|
This program is distributed in the hope that it will be useful, but
|
|
WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
|
|
See the GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with this program; see the file COPYING. If not see
|
|
<http://www.gnu.org/licenses/>. */
|
|
|
|
#include <assert.h>
|
|
#include <ctf-impl.h>
|
|
#include <string.h>
|
|
|
|
static ctf_str_atom_t *
|
|
ctf_str_add_ref_internal (ctf_dict_t *fp, const char *str,
|
|
int flags, uint32_t *ref);
|
|
|
|
/* Convert an encoded CTF string name into a pointer to a C string, possibly
|
|
using an explicit internal provisional strtab rather than the fp-based
|
|
one. */
|
|
const char *
|
|
ctf_strraw_explicit (ctf_dict_t *fp, uint32_t name, ctf_strs_t *strtab)
|
|
{
|
|
ctf_strs_t *ctsp = &fp->ctf_str[CTF_NAME_STID (name)];
|
|
|
|
if ((CTF_NAME_STID (name) == CTF_STRTAB_0) && (strtab != NULL))
|
|
ctsp = strtab;
|
|
|
|
/* If this name is in the external strtab, and there is a synthetic
|
|
strtab, use it in preference. (This is used to add the set of strings
|
|
-- symbol names, etc -- the linker knows about before the strtab is
|
|
written out.) */
|
|
|
|
if (CTF_NAME_STID (name) == CTF_STRTAB_1
|
|
&& fp->ctf_syn_ext_strtab != NULL)
|
|
return ctf_dynhash_lookup (fp->ctf_syn_ext_strtab,
|
|
(void *) (uintptr_t) name);
|
|
|
|
/* If the name is in the internal strtab, and the name offset is beyond
|
|
the end of the ctsp->cts_len but below the ctf_str_prov_offset, this is
|
|
a provisional string added by ctf_str_add*() but not yet built into a
|
|
real strtab: get the value out of the ctf_prov_strtab. */
|
|
|
|
if (CTF_NAME_STID (name) == CTF_STRTAB_0
|
|
&& name >= ctsp->cts_len && name < fp->ctf_str_prov_offset)
|
|
return ctf_dynhash_lookup (fp->ctf_prov_strtab,
|
|
(void *) (uintptr_t) name);
|
|
|
|
if (ctsp->cts_strs != NULL && CTF_NAME_OFFSET (name) < ctsp->cts_len)
|
|
return (ctsp->cts_strs + CTF_NAME_OFFSET (name));
|
|
|
|
/* String table not loaded or corrupt offset. */
|
|
return NULL;
|
|
}
|
|
|
|
/* Convert an encoded CTF string name into a pointer to a C string by looking
|
|
up the appropriate string table buffer and then adding the offset. */
|
|
const char *
|
|
ctf_strraw (ctf_dict_t *fp, uint32_t name)
|
|
{
|
|
return ctf_strraw_explicit (fp, name, NULL);
|
|
}
|
|
|
|
/* Return a guaranteed-non-NULL pointer to the string with the given CTF
|
|
name. */
|
|
const char *
|
|
ctf_strptr (ctf_dict_t *fp, uint32_t name)
|
|
{
|
|
const char *s = ctf_strraw (fp, name);
|
|
return (s != NULL ? s : "(?)");
|
|
}
|
|
|
|
/* As above, but return info on what is wrong in more detail.
|
|
(Used for type lookups.) */
|
|
|
|
const char *
|
|
ctf_strptr_validate (ctf_dict_t *fp, uint32_t name)
|
|
{
|
|
const char *str = ctf_strraw (fp, name);
|
|
|
|
if (str == NULL)
|
|
{
|
|
if (CTF_NAME_STID (name) == CTF_STRTAB_1
|
|
&& fp->ctf_syn_ext_strtab == NULL
|
|
&& fp->ctf_str[CTF_NAME_STID (name)].cts_strs == NULL)
|
|
{
|
|
ctf_set_errno (fp, ECTF_STRTAB);
|
|
return NULL;
|
|
}
|
|
|
|
ctf_set_errno (fp, ECTF_BADNAME);
|
|
return NULL;
|
|
}
|
|
return str;
|
|
}
|
|
|
|
/* Remove all refs to a given atom. */
|
|
static void
|
|
ctf_str_purge_atom_refs (ctf_str_atom_t *atom)
|
|
{
|
|
ctf_str_atom_ref_t *ref, *next;
|
|
ctf_str_atom_ref_movable_t *movref, *movnext;
|
|
|
|
for (ref = ctf_list_next (&atom->csa_refs); ref != NULL; ref = next)
|
|
{
|
|
next = ctf_list_next (ref);
|
|
ctf_list_delete (&atom->csa_refs, ref);
|
|
free (ref);
|
|
}
|
|
|
|
for (movref = ctf_list_next (&atom->csa_movable_refs);
|
|
movref != NULL; movref = movnext)
|
|
{
|
|
movnext = ctf_list_next (movref);
|
|
ctf_list_delete (&atom->csa_movable_refs, movref);
|
|
|
|
ctf_dynhash_remove (movref->caf_movable_refs, movref);
|
|
|
|
free (movref);
|
|
}
|
|
}
|
|
|
|
/* Free an atom. */
|
|
static void
|
|
ctf_str_free_atom (void *a)
|
|
{
|
|
ctf_str_atom_t *atom = a;
|
|
|
|
ctf_str_purge_atom_refs (atom);
|
|
|
|
if (atom->csa_flags & CTF_STR_ATOM_FREEABLE)
|
|
free (atom->csa_str);
|
|
|
|
free (atom);
|
|
}
|
|
|
|
/* Create the atoms table. There is always at least one atom in it, the null
|
|
string: but also pull in atoms from the internal strtab. (We rely on
|
|
calls to ctf_str_add_external to populate external strtab entries, since
|
|
these are often not quite the same as what appears in any external
|
|
strtab, and the external strtab is often huge and best not aggressively
|
|
pulled in.) */
|
|
int
|
|
ctf_str_create_atoms (ctf_dict_t *fp)
|
|
{
|
|
size_t i;
|
|
|
|
fp->ctf_str_atoms = ctf_dynhash_create (ctf_hash_string, ctf_hash_eq_string,
|
|
NULL, ctf_str_free_atom);
|
|
if (!fp->ctf_str_atoms)
|
|
return -ENOMEM;
|
|
|
|
if (!fp->ctf_prov_strtab)
|
|
fp->ctf_prov_strtab = ctf_dynhash_create (ctf_hash_integer,
|
|
ctf_hash_eq_integer,
|
|
NULL, NULL);
|
|
if (!fp->ctf_prov_strtab)
|
|
goto oom_prov_strtab;
|
|
|
|
fp->ctf_str_movable_refs = ctf_dynhash_create (ctf_hash_integer,
|
|
ctf_hash_eq_integer,
|
|
NULL, NULL);
|
|
if (!fp->ctf_str_movable_refs)
|
|
goto oom_movable_refs;
|
|
|
|
errno = 0;
|
|
ctf_str_add (fp, "");
|
|
if (errno == ENOMEM)
|
|
goto oom_str_add;
|
|
|
|
/* Pull in all the strings in the strtab as new atoms. The provisional
|
|
strtab must be empty at this point, so there is no need to populate
|
|
atoms from it as well. Types in this subset are frozen and readonly,
|
|
so the refs list and movable refs list need not be populated. */
|
|
|
|
for (i = 0; i < fp->ctf_str[CTF_STRTAB_0].cts_len;
|
|
i += strlen (&fp->ctf_str[CTF_STRTAB_0].cts_strs[i]) + 1)
|
|
{
|
|
ctf_str_atom_t *atom;
|
|
|
|
if (fp->ctf_str[CTF_STRTAB_0].cts_strs[i] == 0)
|
|
continue;
|
|
|
|
atom = ctf_str_add_ref_internal (fp, &fp->ctf_str[CTF_STRTAB_0].cts_strs[i],
|
|
0, 0);
|
|
|
|
if (!atom)
|
|
goto oom_str_add;
|
|
|
|
atom->csa_offset = i;
|
|
}
|
|
|
|
fp->ctf_str_prov_offset = fp->ctf_str[CTF_STRTAB_0].cts_len + 1;
|
|
|
|
return 0;
|
|
|
|
oom_str_add:
|
|
ctf_dynhash_destroy (fp->ctf_str_movable_refs);
|
|
fp->ctf_str_movable_refs = NULL;
|
|
oom_movable_refs:
|
|
ctf_dynhash_destroy (fp->ctf_prov_strtab);
|
|
fp->ctf_prov_strtab = NULL;
|
|
oom_prov_strtab:
|
|
ctf_dynhash_destroy (fp->ctf_str_atoms);
|
|
fp->ctf_str_atoms = NULL;
|
|
return -ENOMEM;
|
|
}
|
|
|
|
/* Destroy the atoms table and associated refs. */
|
|
void
|
|
ctf_str_free_atoms (ctf_dict_t *fp)
|
|
{
|
|
ctf_dynhash_destroy (fp->ctf_prov_strtab);
|
|
ctf_dynhash_destroy (fp->ctf_str_atoms);
|
|
ctf_dynhash_destroy (fp->ctf_str_movable_refs);
|
|
if (fp->ctf_dynstrtab)
|
|
{
|
|
free (fp->ctf_dynstrtab->cts_strs);
|
|
free (fp->ctf_dynstrtab);
|
|
}
|
|
}
|
|
|
|
#define CTF_STR_ADD_REF 0x1
|
|
#define CTF_STR_PROVISIONAL 0x2
|
|
#define CTF_STR_MOVABLE 0x4
|
|
|
|
/* Allocate a ref and bind it into a ref list. */
|
|
|
|
static ctf_str_atom_ref_t *
|
|
aref_create (ctf_dict_t *fp, ctf_str_atom_t *atom, uint32_t *ref, int flags)
|
|
{
|
|
ctf_str_atom_ref_t *aref;
|
|
size_t s = sizeof (struct ctf_str_atom_ref);
|
|
|
|
if (flags & CTF_STR_MOVABLE)
|
|
s = sizeof (struct ctf_str_atom_ref_movable);
|
|
|
|
aref = malloc (s);
|
|
|
|
if (!aref)
|
|
return NULL;
|
|
|
|
aref->caf_ref = ref;
|
|
|
|
/* Movable refs get a backpointer to them in ctf_str_movable_refs, and a
|
|
pointer to ctf_str_movable_refs itself in the ref, for use when freeing
|
|
refs: they can be moved later in batches via a call to
|
|
ctf_str_move_refs. */
|
|
|
|
if (flags & CTF_STR_MOVABLE)
|
|
{
|
|
ctf_str_atom_ref_movable_t *movref = (ctf_str_atom_ref_movable_t *) aref;
|
|
|
|
movref->caf_movable_refs = fp->ctf_str_movable_refs;
|
|
|
|
if (ctf_dynhash_insert (fp->ctf_str_movable_refs, ref, aref) < 0)
|
|
{
|
|
free (aref);
|
|
return NULL;
|
|
}
|
|
ctf_list_append (&atom->csa_movable_refs, movref);
|
|
}
|
|
else
|
|
ctf_list_append (&atom->csa_refs, aref);
|
|
|
|
return aref;
|
|
}
|
|
|
|
/* Add a string to the atoms table, copying the passed-in string if
|
|
necessary. Return the atom added. Return NULL only when out of memory
|
|
(and do not touch the passed-in string in that case).
|
|
|
|
Possibly add a provisional entry for this string to the provisional
|
|
strtab. If the string is in the provisional strtab, update its ref list
|
|
with the passed-in ref, causing the ref to be updated when the strtab is
|
|
written out. */
|
|
|
|
static ctf_str_atom_t *
|
|
ctf_str_add_ref_internal (ctf_dict_t *fp, const char *str,
|
|
int flags, uint32_t *ref)
|
|
{
|
|
char *newstr = NULL;
|
|
ctf_str_atom_t *atom = NULL;
|
|
int added = 0;
|
|
|
|
atom = ctf_dynhash_lookup (fp->ctf_str_atoms, str);
|
|
|
|
/* Existing atoms get refs added only if they are provisional:
|
|
non-provisional strings already have a fixed strtab offset, and just
|
|
get their ref updated immediately, since its value cannot change. */
|
|
|
|
if (atom)
|
|
{
|
|
if (!ctf_dynhash_lookup (fp->ctf_prov_strtab, (void *) (uintptr_t)
|
|
atom->csa_offset))
|
|
{
|
|
if (flags & CTF_STR_ADD_REF)
|
|
{
|
|
if (atom->csa_external_offset)
|
|
*ref = atom->csa_external_offset;
|
|
else
|
|
*ref = atom->csa_offset;
|
|
}
|
|
return atom;
|
|
}
|
|
|
|
if (flags & CTF_STR_ADD_REF)
|
|
{
|
|
if (!aref_create (fp, atom, ref, flags))
|
|
{
|
|
ctf_set_errno (fp, ENOMEM);
|
|
return NULL;
|
|
}
|
|
}
|
|
|
|
return atom;
|
|
}
|
|
|
|
/* New atom. */
|
|
|
|
if ((atom = malloc (sizeof (struct ctf_str_atom))) == NULL)
|
|
goto oom;
|
|
memset (atom, 0, sizeof (struct ctf_str_atom));
|
|
|
|
/* Don't allocate new strings if this string is within an mmapped
|
|
strtab. */
|
|
|
|
if ((unsigned char *) str < (unsigned char *) fp->ctf_data_mmapped
|
|
|| (unsigned char *) str > (unsigned char *) fp->ctf_data_mmapped + fp->ctf_data_mmapped_len)
|
|
{
|
|
if ((newstr = strdup (str)) == NULL)
|
|
goto oom;
|
|
atom->csa_flags |= CTF_STR_ATOM_FREEABLE;
|
|
atom->csa_str = newstr;
|
|
}
|
|
else
|
|
atom->csa_str = (char *) str;
|
|
|
|
if (ctf_dynhash_insert (fp->ctf_str_atoms, atom->csa_str, atom) < 0)
|
|
goto oom;
|
|
added = 1;
|
|
|
|
atom->csa_snapshot_id = fp->ctf_snapshots;
|
|
|
|
/* New atoms marked provisional go into the provisional strtab, and get a
|
|
ref added. */
|
|
|
|
if (flags & CTF_STR_PROVISIONAL)
|
|
{
|
|
atom->csa_offset = fp->ctf_str_prov_offset;
|
|
|
|
if (ctf_dynhash_insert (fp->ctf_prov_strtab, (void *) (uintptr_t)
|
|
atom->csa_offset, (void *) atom->csa_str) < 0)
|
|
goto oom;
|
|
|
|
fp->ctf_str_prov_offset += strlen (atom->csa_str) + 1;
|
|
|
|
if (flags & CTF_STR_ADD_REF)
|
|
{
|
|
if (!aref_create (fp, atom, ref, flags))
|
|
goto oom;
|
|
}
|
|
}
|
|
|
|
return atom;
|
|
|
|
oom:
|
|
if (added)
|
|
ctf_dynhash_remove (fp->ctf_str_atoms, atom->csa_str);
|
|
free (atom);
|
|
free (newstr);
|
|
ctf_set_errno (fp, ENOMEM);
|
|
return NULL;
|
|
}
|
|
|
|
/* Add a string to the atoms table, without augmenting the ref list for this
|
|
string: return a 'provisional offset' which can be used to return this string
|
|
until ctf_str_write_strtab is called, or 0 on failure. (Everywhere the
|
|
provisional offset is assigned to should be added as a ref using
|
|
ctf_str_add_ref() as well.) */
|
|
uint32_t
|
|
ctf_str_add (ctf_dict_t *fp, const char *str)
|
|
{
|
|
ctf_str_atom_t *atom;
|
|
|
|
if (!str)
|
|
str = "";
|
|
|
|
atom = ctf_str_add_ref_internal (fp, str, CTF_STR_PROVISIONAL, 0);
|
|
if (!atom)
|
|
return 0;
|
|
|
|
return atom->csa_offset;
|
|
}
|
|
|
|
/* Like ctf_str_add(), but additionally augment the atom's refs list with the
|
|
passed-in ref, whether or not the string is already present. There is no
|
|
attempt to deduplicate the refs list (but duplicates are harmless). */
|
|
uint32_t
|
|
ctf_str_add_ref (ctf_dict_t *fp, const char *str, uint32_t *ref)
|
|
{
|
|
ctf_str_atom_t *atom;
|
|
|
|
if (!str)
|
|
str = "";
|
|
|
|
atom = ctf_str_add_ref_internal (fp, str, CTF_STR_ADD_REF
|
|
| CTF_STR_PROVISIONAL, ref);
|
|
if (!atom)
|
|
return 0;
|
|
|
|
return atom->csa_offset;
|
|
}
|
|
|
|
/* Like ctf_str_add_ref(), but note that the ref may be moved later on. */
|
|
uint32_t
|
|
ctf_str_add_movable_ref (ctf_dict_t *fp, const char *str, uint32_t *ref)
|
|
{
|
|
ctf_str_atom_t *atom;
|
|
|
|
if (!str)
|
|
str = "";
|
|
|
|
atom = ctf_str_add_ref_internal (fp, str, CTF_STR_ADD_REF
|
|
| CTF_STR_PROVISIONAL
|
|
| CTF_STR_MOVABLE, ref);
|
|
if (!atom)
|
|
return 0;
|
|
|
|
return atom->csa_offset;
|
|
}
|
|
|
|
/* Add an external strtab reference at OFFSET. Returns zero if the addition
|
|
failed, nonzero otherwise. */
|
|
int
|
|
ctf_str_add_external (ctf_dict_t *fp, const char *str, uint32_t offset)
|
|
{
|
|
ctf_str_atom_t *atom;
|
|
|
|
if (!str)
|
|
str = "";
|
|
|
|
atom = ctf_str_add_ref_internal (fp, str, 0, 0);
|
|
if (!atom)
|
|
return 0;
|
|
|
|
atom->csa_external_offset = CTF_SET_STID (offset, CTF_STRTAB_1);
|
|
|
|
if (!fp->ctf_syn_ext_strtab)
|
|
fp->ctf_syn_ext_strtab = ctf_dynhash_create (ctf_hash_integer,
|
|
ctf_hash_eq_integer,
|
|
NULL, NULL);
|
|
if (!fp->ctf_syn_ext_strtab)
|
|
{
|
|
ctf_set_errno (fp, ENOMEM);
|
|
return 0;
|
|
}
|
|
|
|
if (ctf_dynhash_insert (fp->ctf_syn_ext_strtab,
|
|
(void *) (uintptr_t)
|
|
atom->csa_external_offset,
|
|
(void *) atom->csa_str) < 0)
|
|
{
|
|
/* No need to bother freeing the syn_ext_strtab: it will get freed at
|
|
ctf_str_write_strtab time if unreferenced. */
|
|
ctf_set_errno (fp, ENOMEM);
|
|
return 0;
|
|
}
|
|
|
|
return 1;
|
|
}
|
|
|
|
/* Note that refs have moved from (SRC, LEN) to DEST. We use the movable
|
|
refs backpointer for this, because it is done an amortized-constant
|
|
number of times during structure member and enumerand addition, and if we
|
|
did a linear search this would turn such addition into an O(n^2)
|
|
operation. Even this is not linear, but it's better than that. */
|
|
int
|
|
ctf_str_move_refs (ctf_dict_t *fp, void *src, size_t len, void *dest)
|
|
{
|
|
uintptr_t p;
|
|
|
|
if (src == dest)
|
|
return 0;
|
|
|
|
for (p = (uintptr_t) src; p - (uintptr_t) src < len; p++)
|
|
{
|
|
ctf_str_atom_ref_movable_t *ref;
|
|
|
|
if ((ref = ctf_dynhash_lookup (fp->ctf_str_movable_refs,
|
|
(ctf_str_atom_ref_t *) p)) != NULL)
|
|
{
|
|
int out_of_memory;
|
|
|
|
ref->caf_ref = (uint32_t *) (((uintptr_t) ref->caf_ref +
|
|
(uintptr_t) dest - (uintptr_t) src));
|
|
ctf_dynhash_remove (fp->ctf_str_movable_refs,
|
|
(ctf_str_atom_ref_t *) p);
|
|
out_of_memory = ctf_dynhash_insert (fp->ctf_str_movable_refs,
|
|
ref->caf_ref, ref);
|
|
assert (out_of_memory == 0);
|
|
}
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
/* Remove a single ref. */
|
|
void
|
|
ctf_str_remove_ref (ctf_dict_t *fp, const char *str, uint32_t *ref)
|
|
{
|
|
ctf_str_atom_ref_t *aref, *anext;
|
|
ctf_str_atom_ref_movable_t *amovref, *amovnext;
|
|
ctf_str_atom_t *atom = NULL;
|
|
|
|
atom = ctf_dynhash_lookup (fp->ctf_str_atoms, str);
|
|
if (!atom)
|
|
return;
|
|
|
|
for (aref = ctf_list_next (&atom->csa_refs); aref != NULL; aref = anext)
|
|
{
|
|
anext = ctf_list_next (aref);
|
|
if (aref->caf_ref == ref)
|
|
{
|
|
ctf_list_delete (&atom->csa_refs, aref);
|
|
free (aref);
|
|
}
|
|
}
|
|
|
|
for (amovref = ctf_list_next (&atom->csa_movable_refs);
|
|
amovref != NULL; amovref = amovnext)
|
|
{
|
|
amovnext = ctf_list_next (amovref);
|
|
if (amovref->caf_ref == ref)
|
|
{
|
|
ctf_list_delete (&atom->csa_movable_refs, amovref);
|
|
ctf_dynhash_remove (fp->ctf_str_movable_refs, ref);
|
|
free (amovref);
|
|
}
|
|
}
|
|
}
|
|
|
|
/* A ctf_dynhash_iter_remove() callback that removes atoms later than a given
|
|
snapshot ID. External atoms are never removed, because they came from the
|
|
linker string table and are still present even if you roll back type
|
|
additions. */
|
|
static int
|
|
ctf_str_rollback_atom (void *key _libctf_unused_, void *value, void *arg)
|
|
{
|
|
ctf_str_atom_t *atom = (ctf_str_atom_t *) value;
|
|
ctf_snapshot_id_t *id = (ctf_snapshot_id_t *) arg;
|
|
|
|
return (atom->csa_snapshot_id > id->snapshot_id)
|
|
&& (atom->csa_external_offset == 0);
|
|
}
|
|
|
|
/* Roll back, deleting all (internal) atoms created after a particular ID. */
|
|
void
|
|
ctf_str_rollback (ctf_dict_t *fp, ctf_snapshot_id_t id)
|
|
{
|
|
ctf_dynhash_iter_remove (fp->ctf_str_atoms, ctf_str_rollback_atom, &id);
|
|
}
|
|
|
|
/* An adaptor around ctf_purge_atom_refs. */
|
|
static void
|
|
ctf_str_purge_one_atom_refs (void *key _libctf_unused_, void *value,
|
|
void *arg _libctf_unused_)
|
|
{
|
|
ctf_str_atom_t *atom = (ctf_str_atom_t *) value;
|
|
|
|
ctf_str_purge_atom_refs (atom);
|
|
}
|
|
|
|
/* Remove all the recorded refs from the atoms table. */
|
|
static void
|
|
ctf_str_purge_refs (ctf_dict_t *fp)
|
|
{
|
|
ctf_dynhash_iter (fp->ctf_str_atoms, ctf_str_purge_one_atom_refs, NULL);
|
|
}
|
|
|
|
/* Update a list of refs to the specified value. */
|
|
static void
|
|
ctf_str_update_refs (ctf_str_atom_t *refs, uint32_t value)
|
|
{
|
|
ctf_str_atom_ref_t *ref;
|
|
ctf_str_atom_ref_movable_t *movref;
|
|
|
|
for (ref = ctf_list_next (&refs->csa_refs); ref != NULL;
|
|
ref = ctf_list_next (ref))
|
|
*(ref->caf_ref) = value;
|
|
|
|
for (movref = ctf_list_next (&refs->csa_movable_refs);
|
|
movref != NULL; movref = ctf_list_next (movref))
|
|
*(movref->caf_ref) = value;
|
|
}
|
|
|
|
/* Sort the strtab. */
|
|
static int
|
|
ctf_str_sort_strtab (const void *a, const void *b)
|
|
{
|
|
ctf_str_atom_t **one = (ctf_str_atom_t **) a;
|
|
ctf_str_atom_t **two = (ctf_str_atom_t **) b;
|
|
|
|
return (strcmp ((*one)->csa_str, (*two)->csa_str));
|
|
}
|
|
|
|
/* Write out and return a strtab containing all strings with recorded refs,
|
|
adjusting the refs to refer to the corresponding string. The returned
|
|
strtab is already assigned to strtab 0 in this dict, is owned by this
|
|
dict, and may be NULL on error. Also populate the synthetic strtab with
|
|
mappings from external strtab offsets to names, so we can look them up
|
|
with ctf_strptr(). Only external strtab offsets with references are
|
|
added.
|
|
|
|
As a side effect, replaces the strtab of the current dict with the newly-
|
|
generated strtab. This is an exception to the general rule that
|
|
serialization does not change the dict passed in, because the alternative
|
|
is to copy the entire atoms table on every reserialization just to avoid
|
|
modifying the original, which is excessively costly for minimal gain.
|
|
|
|
We use the lazy man's approach and double memory costs by always storing
|
|
atoms as individually allocated entities whenever they come from anywhere
|
|
but a freshly-opened, mmapped dict, even though after serialization there
|
|
is another copy in the strtab; this ensures that ctf_strptr()-returned
|
|
pointers to them remain valid for the lifetime of the dict.
|
|
|
|
This is all rendered more complex because if a dict is ctf_open()ed it
|
|
will have a bunch of strings in its strtab already, and their strtab
|
|
offsets can never change (without piles of complexity to rescan the
|
|
entire dict just to get all the offsets to all of them into the atoms
|
|
table). Entries below the existing strtab limit are just copied into the
|
|
new dict: entries above it are new, and are are sorted first, then
|
|
appended to it. The sorting is purely a compression-efficiency
|
|
improvement, and we get nearly as good an improvement from sorting big
|
|
chunks like this as we would from sorting the whole thing. */
|
|
|
|
const ctf_strs_writable_t *
|
|
ctf_str_write_strtab (ctf_dict_t *fp)
|
|
{
|
|
ctf_strs_writable_t *strtab;
|
|
size_t strtab_count = 0;
|
|
uint32_t cur_stroff = 0;
|
|
ctf_str_atom_t **sorttab;
|
|
ctf_next_t *it = NULL;
|
|
size_t i;
|
|
void *v;
|
|
int err;
|
|
int new_strtab = 0;
|
|
int any_external = 0;
|
|
|
|
strtab = calloc (1, sizeof (ctf_strs_writable_t));
|
|
if (!strtab)
|
|
return NULL;
|
|
|
|
/* The strtab contains the existing string table at its start: figure out
|
|
how many new strings we need to add. We only need to add new strings
|
|
that have no external offset, that have refs, and that are found in the
|
|
provisional strtab. If the existing strtab is empty we also need to
|
|
add the null string at its start. */
|
|
|
|
strtab->cts_len = fp->ctf_str[CTF_STRTAB_0].cts_len;
|
|
|
|
if (strtab->cts_len == 0)
|
|
{
|
|
new_strtab = 1;
|
|
strtab->cts_len++; /* For the \0. */
|
|
}
|
|
|
|
/* Count new entries in the strtab: i.e. entries in the provisional
|
|
strtab. Ignore any entry for \0, entries which ended up in the
|
|
external strtab, and unreferenced entries. */
|
|
|
|
while ((err = ctf_dynhash_next (fp->ctf_prov_strtab, &it, NULL, &v)) == 0)
|
|
{
|
|
const char *str = (const char *) v;
|
|
ctf_str_atom_t *atom;
|
|
|
|
atom = ctf_dynhash_lookup (fp->ctf_str_atoms, str);
|
|
if (!ctf_assert (fp, atom))
|
|
goto err_strtab;
|
|
|
|
if (atom->csa_str[0] == 0 || atom->csa_external_offset
|
|
|| (ctf_list_empty_p (&atom->csa_refs)
|
|
&& ctf_list_empty_p (&atom->csa_movable_refs)))
|
|
continue;
|
|
|
|
strtab->cts_len += strlen (atom->csa_str) + 1;
|
|
strtab_count++;
|
|
}
|
|
if (err != ECTF_NEXT_END)
|
|
{
|
|
ctf_dprintf ("ctf_str_write_strtab: error counting strtab entries: %s\n",
|
|
ctf_errmsg (err));
|
|
goto err_strtab;
|
|
}
|
|
|
|
ctf_dprintf ("%lu bytes of strings in strtab: %lu pre-existing.\n",
|
|
(unsigned long) strtab->cts_len,
|
|
(unsigned long) fp->ctf_str[CTF_STRTAB_0].cts_len);
|
|
|
|
/* Sort the new part of the strtab. */
|
|
|
|
sorttab = calloc (strtab_count, sizeof (ctf_str_atom_t *));
|
|
if (!sorttab)
|
|
{
|
|
ctf_set_errno (fp, ENOMEM);
|
|
goto err_strtab;
|
|
}
|
|
|
|
i = 0;
|
|
while ((err = ctf_dynhash_next (fp->ctf_prov_strtab, &it, NULL, &v)) == 0)
|
|
{
|
|
ctf_str_atom_t *atom;
|
|
|
|
atom = ctf_dynhash_lookup (fp->ctf_str_atoms, v);
|
|
if (!ctf_assert (fp, atom))
|
|
goto err_sorttab;
|
|
|
|
if (atom->csa_str[0] == 0 || atom->csa_external_offset
|
|
|| (ctf_list_empty_p (&atom->csa_refs)
|
|
&& ctf_list_empty_p (&atom->csa_movable_refs)))
|
|
continue;
|
|
|
|
sorttab[i++] = atom;
|
|
}
|
|
|
|
qsort (sorttab, strtab_count, sizeof (ctf_str_atom_t *),
|
|
ctf_str_sort_strtab);
|
|
|
|
if ((strtab->cts_strs = malloc (strtab->cts_len)) == NULL)
|
|
goto err_sorttab;
|
|
|
|
cur_stroff = fp->ctf_str[CTF_STRTAB_0].cts_len;
|
|
|
|
if (new_strtab)
|
|
{
|
|
strtab->cts_strs[0] = 0;
|
|
cur_stroff++;
|
|
}
|
|
else
|
|
memcpy (strtab->cts_strs, fp->ctf_str[CTF_STRTAB_0].cts_strs,
|
|
fp->ctf_str[CTF_STRTAB_0].cts_len);
|
|
|
|
/* Work over the sorttab, add its strings to the strtab, and remember
|
|
where they are in the csa_offset for the appropriate atom. No ref
|
|
updating is done at this point, because refs might well relate to
|
|
already-existing strings, or external strings, which do not need adding
|
|
to the strtab and may not be in the sorttab. */
|
|
|
|
for (i = 0; i < strtab_count; i++)
|
|
{
|
|
sorttab[i]->csa_offset = cur_stroff;
|
|
strcpy (&strtab->cts_strs[cur_stroff], sorttab[i]->csa_str);
|
|
cur_stroff += strlen (sorttab[i]->csa_str) + 1;
|
|
}
|
|
free (sorttab);
|
|
sorttab = NULL;
|
|
|
|
/* Update all refs, then purge them as no longer necessary: also update
|
|
the strtab appropriately. */
|
|
|
|
while ((err = ctf_dynhash_next (fp->ctf_str_atoms, &it, NULL, &v)) == 0)
|
|
{
|
|
ctf_str_atom_t *atom = (ctf_str_atom_t *) v;
|
|
uint32_t offset;
|
|
|
|
if (ctf_list_empty_p (&atom->csa_refs) &&
|
|
ctf_list_empty_p (&atom->csa_movable_refs))
|
|
continue;
|
|
|
|
if (atom->csa_external_offset)
|
|
{
|
|
any_external = 1;
|
|
offset = atom->csa_external_offset;
|
|
}
|
|
else
|
|
offset = atom->csa_offset;
|
|
ctf_str_update_refs (atom, offset);
|
|
}
|
|
if (err != ECTF_NEXT_END)
|
|
{
|
|
ctf_dprintf ("ctf_str_write_strtab: error iterating over atoms while updating refs: %s\n",
|
|
ctf_errmsg (err));
|
|
goto err_strtab;
|
|
}
|
|
ctf_str_purge_refs (fp);
|
|
|
|
if (!any_external)
|
|
{
|
|
ctf_dynhash_destroy (fp->ctf_syn_ext_strtab);
|
|
fp->ctf_syn_ext_strtab = NULL;
|
|
}
|
|
|
|
/* Replace the old strtab with the new one in this dict. */
|
|
|
|
if (fp->ctf_dynstrtab)
|
|
{
|
|
free (fp->ctf_dynstrtab->cts_strs);
|
|
free (fp->ctf_dynstrtab);
|
|
}
|
|
|
|
fp->ctf_dynstrtab = strtab;
|
|
fp->ctf_str[CTF_STRTAB_0].cts_strs = strtab->cts_strs;
|
|
fp->ctf_str[CTF_STRTAB_0].cts_len = strtab->cts_len;
|
|
|
|
/* All the provisional strtab entries are now real strtab entries, and
|
|
ctf_strptr() will find them there. The provisional offset now starts right
|
|
beyond the new end of the strtab. */
|
|
|
|
ctf_dynhash_empty (fp->ctf_prov_strtab);
|
|
fp->ctf_str_prov_offset = strtab->cts_len + 1;
|
|
return strtab;
|
|
|
|
err_sorttab:
|
|
free (sorttab);
|
|
err_strtab:
|
|
free (strtab);
|
|
return NULL;
|
|
}
|