|  | /* CTF string table management. | 
|  | Copyright (C) 2019-2025 Free Software Foundation, Inc. | 
|  |  | 
|  | This file is part of libctf. | 
|  |  | 
|  | libctf is free software; you can redistribute it and/or modify it under | 
|  | the terms of the GNU General Public License as published by the Free | 
|  | Software Foundation; either version 3, or (at your option) any later | 
|  | version. | 
|  |  | 
|  | This program is distributed in the hope that it will be useful, but | 
|  | WITHOUT ANY WARRANTY; without even the implied warranty of | 
|  | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. | 
|  | See the GNU General Public License for more details. | 
|  |  | 
|  | You should have received a copy of the GNU General Public License | 
|  | along with this program; see the file COPYING.  If not see | 
|  | <http://www.gnu.org/licenses/>.  */ | 
|  |  | 
|  | #include <assert.h> | 
|  | #include <ctf-impl.h> | 
|  | #include <string.h> | 
|  |  | 
|  | static ctf_str_atom_t * | 
|  | ctf_str_add_ref_internal (ctf_dict_t *fp, const char *str, | 
|  | int flags, uint32_t *ref); | 
|  |  | 
|  | /* Convert an encoded CTF string name into a pointer to a C string, possibly | 
|  | using an explicit internal provisional strtab rather than the fp-based | 
|  | one.  */ | 
|  | const char * | 
|  | ctf_strraw_explicit (ctf_dict_t *fp, uint32_t name, ctf_strs_t *strtab) | 
|  | { | 
|  | ctf_strs_t *ctsp = &fp->ctf_str[CTF_NAME_STID (name)]; | 
|  |  | 
|  | if ((CTF_NAME_STID (name) == CTF_STRTAB_0) && (strtab != NULL)) | 
|  | ctsp = strtab; | 
|  |  | 
|  | /* If this name is in the external strtab, and there is a synthetic | 
|  | strtab, use it in preference.  (This is used to add the set of strings | 
|  | -- symbol names, etc -- the linker knows about before the strtab is | 
|  | written out.)  */ | 
|  |  | 
|  | if (CTF_NAME_STID (name) == CTF_STRTAB_1 | 
|  | && fp->ctf_syn_ext_strtab != NULL) | 
|  | return ctf_dynhash_lookup (fp->ctf_syn_ext_strtab, | 
|  | (void *) (uintptr_t) name); | 
|  |  | 
|  | /* If the name is in the internal strtab, and the name offset is beyond | 
|  | the end of the ctsp->cts_len but below the ctf_str_prov_offset, this is | 
|  | a provisional string added by ctf_str_add*() but not yet built into a | 
|  | real strtab: get the value out of the ctf_prov_strtab.  */ | 
|  |  | 
|  | if (CTF_NAME_STID (name) == CTF_STRTAB_0 | 
|  | && name >= ctsp->cts_len && name < fp->ctf_str_prov_offset) | 
|  | return ctf_dynhash_lookup (fp->ctf_prov_strtab, | 
|  | (void *) (uintptr_t) name); | 
|  |  | 
|  | if (ctsp->cts_strs != NULL && CTF_NAME_OFFSET (name) < ctsp->cts_len) | 
|  | return (ctsp->cts_strs + CTF_NAME_OFFSET (name)); | 
|  |  | 
|  | /* String table not loaded or corrupt offset.  */ | 
|  | return NULL; | 
|  | } | 
|  |  | 
|  | /* Convert an encoded CTF string name into a pointer to a C string by looking | 
|  | up the appropriate string table buffer and then adding the offset.  */ | 
|  | const char * | 
|  | ctf_strraw (ctf_dict_t *fp, uint32_t name) | 
|  | { | 
|  | return ctf_strraw_explicit (fp, name, NULL); | 
|  | } | 
|  |  | 
|  | /* Return a guaranteed-non-NULL pointer to the string with the given CTF | 
|  | name.  */ | 
|  | const char * | 
|  | ctf_strptr (ctf_dict_t *fp, uint32_t name) | 
|  | { | 
|  | const char *s = ctf_strraw (fp, name); | 
|  | return (s != NULL ? s : "(?)"); | 
|  | } | 
|  |  | 
|  | /* As above, but return info on what is wrong in more detail. | 
|  | (Used for type lookups.) */ | 
|  |  | 
|  | const char * | 
|  | ctf_strptr_validate (ctf_dict_t *fp, uint32_t name) | 
|  | { | 
|  | const char *str = ctf_strraw (fp, name); | 
|  |  | 
|  | if (str == NULL) | 
|  | { | 
|  | if (CTF_NAME_STID (name) == CTF_STRTAB_1 | 
|  | && fp->ctf_syn_ext_strtab == NULL | 
|  | && fp->ctf_str[CTF_NAME_STID (name)].cts_strs == NULL) | 
|  | { | 
|  | ctf_set_errno (fp, ECTF_STRTAB); | 
|  | return NULL; | 
|  | } | 
|  |  | 
|  | ctf_set_errno (fp, ECTF_BADNAME); | 
|  | return NULL; | 
|  | } | 
|  | return str; | 
|  | } | 
|  |  | 
|  | /* Remove all refs to a given atom.  */ | 
|  | static void | 
|  | ctf_str_purge_atom_refs (ctf_str_atom_t *atom) | 
|  | { | 
|  | ctf_str_atom_ref_t *ref, *next; | 
|  | ctf_str_atom_ref_movable_t *movref, *movnext; | 
|  |  | 
|  | for (ref = ctf_list_next (&atom->csa_refs); ref != NULL; ref = next) | 
|  | { | 
|  | next = ctf_list_next (ref); | 
|  | ctf_list_delete (&atom->csa_refs, ref); | 
|  | free (ref); | 
|  | } | 
|  |  | 
|  | for (movref = ctf_list_next (&atom->csa_movable_refs); | 
|  | movref != NULL; movref = movnext) | 
|  | { | 
|  | movnext = ctf_list_next (movref); | 
|  | ctf_list_delete (&atom->csa_movable_refs, movref); | 
|  |  | 
|  | ctf_dynhash_remove (movref->caf_movable_refs, movref); | 
|  |  | 
|  | free (movref); | 
|  | } | 
|  | } | 
|  |  | 
|  | /* Free an atom.  */ | 
|  | static void | 
|  | ctf_str_free_atom (void *a) | 
|  | { | 
|  | ctf_str_atom_t *atom = a; | 
|  |  | 
|  | ctf_str_purge_atom_refs (atom); | 
|  |  | 
|  | if (atom->csa_flags & CTF_STR_ATOM_FREEABLE) | 
|  | free (atom->csa_str); | 
|  |  | 
|  | free (atom); | 
|  | } | 
|  |  | 
|  | /* Create the atoms table.  There is always at least one atom in it, the null | 
|  | string: but also pull in atoms from the internal strtab.  (We rely on | 
|  | calls to ctf_str_add_external to populate external strtab entries, since | 
|  | these are often not quite the same as what appears in any external | 
|  | strtab, and the external strtab is often huge and best not aggressively | 
|  | pulled in.)  */ | 
|  | int | 
|  | ctf_str_create_atoms (ctf_dict_t *fp) | 
|  | { | 
|  | size_t i; | 
|  |  | 
|  | fp->ctf_str_atoms = ctf_dynhash_create (ctf_hash_string, ctf_hash_eq_string, | 
|  | NULL, ctf_str_free_atom); | 
|  | if (!fp->ctf_str_atoms) | 
|  | return -ENOMEM; | 
|  |  | 
|  | if (!fp->ctf_prov_strtab) | 
|  | fp->ctf_prov_strtab = ctf_dynhash_create (ctf_hash_integer, | 
|  | ctf_hash_eq_integer, | 
|  | NULL, NULL); | 
|  | if (!fp->ctf_prov_strtab) | 
|  | goto oom_prov_strtab; | 
|  |  | 
|  | fp->ctf_str_movable_refs = ctf_dynhash_create (ctf_hash_integer, | 
|  | ctf_hash_eq_integer, | 
|  | NULL, NULL); | 
|  | if (!fp->ctf_str_movable_refs) | 
|  | goto oom_movable_refs; | 
|  |  | 
|  | errno = 0; | 
|  | ctf_str_add (fp, ""); | 
|  | if (errno == ENOMEM) | 
|  | goto oom_str_add; | 
|  |  | 
|  | /* Pull in all the strings in the strtab as new atoms.  The provisional | 
|  | strtab must be empty at this point, so there is no need to populate | 
|  | atoms from it as well.  Types in this subset are frozen and readonly, | 
|  | so the refs list and movable refs list need not be populated.  */ | 
|  |  | 
|  | for (i = 0; i < fp->ctf_str[CTF_STRTAB_0].cts_len; | 
|  | i += strlen (&fp->ctf_str[CTF_STRTAB_0].cts_strs[i]) + 1) | 
|  | { | 
|  | ctf_str_atom_t *atom; | 
|  |  | 
|  | if (fp->ctf_str[CTF_STRTAB_0].cts_strs[i] == 0) | 
|  | continue; | 
|  |  | 
|  | atom = ctf_str_add_ref_internal (fp, &fp->ctf_str[CTF_STRTAB_0].cts_strs[i], | 
|  | 0, 0); | 
|  |  | 
|  | if (!atom) | 
|  | goto oom_str_add; | 
|  |  | 
|  | atom->csa_offset = i; | 
|  | } | 
|  |  | 
|  | fp->ctf_str_prov_offset = fp->ctf_str[CTF_STRTAB_0].cts_len + 1; | 
|  |  | 
|  | return 0; | 
|  |  | 
|  | oom_str_add: | 
|  | ctf_dynhash_destroy (fp->ctf_str_movable_refs); | 
|  | fp->ctf_str_movable_refs = NULL; | 
|  | oom_movable_refs: | 
|  | ctf_dynhash_destroy (fp->ctf_prov_strtab); | 
|  | fp->ctf_prov_strtab = NULL; | 
|  | oom_prov_strtab: | 
|  | ctf_dynhash_destroy (fp->ctf_str_atoms); | 
|  | fp->ctf_str_atoms = NULL; | 
|  | return -ENOMEM; | 
|  | } | 
|  |  | 
|  | /* Destroy the atoms table and associated refs.  */ | 
|  | void | 
|  | ctf_str_free_atoms (ctf_dict_t *fp) | 
|  | { | 
|  | ctf_dynhash_destroy (fp->ctf_prov_strtab); | 
|  | ctf_dynhash_destroy (fp->ctf_str_atoms); | 
|  | ctf_dynhash_destroy (fp->ctf_str_movable_refs); | 
|  | if (fp->ctf_dynstrtab) | 
|  | { | 
|  | free (fp->ctf_dynstrtab->cts_strs); | 
|  | free (fp->ctf_dynstrtab); | 
|  | } | 
|  | } | 
|  |  | 
|  | #define CTF_STR_ADD_REF 0x1 | 
|  | #define CTF_STR_PROVISIONAL 0x2 | 
|  | #define CTF_STR_MOVABLE 0x4 | 
|  |  | 
|  | /* Allocate a ref and bind it into a ref list.  */ | 
|  |  | 
|  | static ctf_str_atom_ref_t * | 
|  | aref_create (ctf_dict_t *fp, ctf_str_atom_t *atom, uint32_t *ref, int flags) | 
|  | { | 
|  | ctf_str_atom_ref_t *aref; | 
|  | size_t s = sizeof (struct ctf_str_atom_ref); | 
|  |  | 
|  | if (flags & CTF_STR_MOVABLE) | 
|  | s = sizeof (struct ctf_str_atom_ref_movable); | 
|  |  | 
|  | aref = malloc (s); | 
|  |  | 
|  | if (!aref) | 
|  | return NULL; | 
|  |  | 
|  | aref->caf_ref = ref; | 
|  |  | 
|  | /* Movable refs get a backpointer to them in ctf_str_movable_refs, and a | 
|  | pointer to ctf_str_movable_refs itself in the ref, for use when freeing | 
|  | refs: they can be moved later in batches via a call to | 
|  | ctf_str_move_refs.  */ | 
|  |  | 
|  | if (flags & CTF_STR_MOVABLE) | 
|  | { | 
|  | ctf_str_atom_ref_movable_t *movref = (ctf_str_atom_ref_movable_t *) aref; | 
|  |  | 
|  | movref->caf_movable_refs = fp->ctf_str_movable_refs; | 
|  |  | 
|  | if (ctf_dynhash_insert (fp->ctf_str_movable_refs, ref, aref) < 0) | 
|  | { | 
|  | free (aref); | 
|  | return NULL; | 
|  | } | 
|  | ctf_list_append (&atom->csa_movable_refs, movref); | 
|  | } | 
|  | else | 
|  | ctf_list_append (&atom->csa_refs, aref); | 
|  |  | 
|  | return aref; | 
|  | } | 
|  |  | 
|  | /* Add a string to the atoms table, copying the passed-in string if | 
|  | necessary.  Return the atom added. Return NULL only when out of memory | 
|  | (and do not touch the passed-in string in that case). | 
|  |  | 
|  | Possibly add a provisional entry for this string to the provisional | 
|  | strtab.  If the string is in the provisional strtab, update its ref list | 
|  | with the passed-in ref, causing the ref to be updated when the strtab is | 
|  | written out.  */ | 
|  |  | 
|  | static ctf_str_atom_t * | 
|  | ctf_str_add_ref_internal (ctf_dict_t *fp, const char *str, | 
|  | int flags, uint32_t *ref) | 
|  | { | 
|  | char *newstr = NULL; | 
|  | ctf_str_atom_t *atom = NULL; | 
|  | int added = 0; | 
|  |  | 
|  | atom = ctf_dynhash_lookup (fp->ctf_str_atoms, str); | 
|  |  | 
|  | /* Existing atoms get refs added only if they are provisional: | 
|  | non-provisional strings already have a fixed strtab offset, and just | 
|  | get their ref updated immediately, since its value cannot change.  */ | 
|  |  | 
|  | if (atom) | 
|  | { | 
|  | if (!ctf_dynhash_lookup (fp->ctf_prov_strtab, (void *) (uintptr_t) | 
|  | atom->csa_offset)) | 
|  | { | 
|  | if (flags & CTF_STR_ADD_REF) | 
|  | { | 
|  | if (atom->csa_external_offset) | 
|  | *ref = atom->csa_external_offset; | 
|  | else | 
|  | *ref = atom->csa_offset; | 
|  | } | 
|  | return atom; | 
|  | } | 
|  |  | 
|  | if (flags & CTF_STR_ADD_REF) | 
|  | { | 
|  | if (!aref_create (fp, atom, ref, flags)) | 
|  | { | 
|  | ctf_set_errno (fp, ENOMEM); | 
|  | return NULL; | 
|  | } | 
|  | } | 
|  |  | 
|  | return atom; | 
|  | } | 
|  |  | 
|  | /* New atom.  */ | 
|  |  | 
|  | if ((atom = malloc (sizeof (struct ctf_str_atom))) == NULL) | 
|  | goto oom; | 
|  | memset (atom, 0, sizeof (struct ctf_str_atom)); | 
|  |  | 
|  | /* Don't allocate new strings if this string is within an mmapped | 
|  | strtab.  */ | 
|  |  | 
|  | if ((unsigned char *) str < (unsigned char *) fp->ctf_data_mmapped | 
|  | || (unsigned char *) str > (unsigned char *) fp->ctf_data_mmapped + fp->ctf_data_mmapped_len) | 
|  | { | 
|  | if ((newstr = strdup (str)) == NULL) | 
|  | goto oom; | 
|  | atom->csa_flags |= CTF_STR_ATOM_FREEABLE; | 
|  | atom->csa_str = newstr; | 
|  | } | 
|  | else | 
|  | atom->csa_str = (char *) str; | 
|  |  | 
|  | if (ctf_dynhash_insert (fp->ctf_str_atoms, atom->csa_str, atom) < 0) | 
|  | goto oom; | 
|  | added = 1; | 
|  |  | 
|  | atom->csa_snapshot_id = fp->ctf_snapshots; | 
|  |  | 
|  | /* New atoms marked provisional go into the provisional strtab, and get a | 
|  | ref added.  */ | 
|  |  | 
|  | if (flags & CTF_STR_PROVISIONAL) | 
|  | { | 
|  | atom->csa_offset = fp->ctf_str_prov_offset; | 
|  |  | 
|  | if (ctf_dynhash_insert (fp->ctf_prov_strtab, (void *) (uintptr_t) | 
|  | atom->csa_offset, (void *) atom->csa_str) < 0) | 
|  | goto oom; | 
|  |  | 
|  | fp->ctf_str_prov_offset += strlen (atom->csa_str) + 1; | 
|  |  | 
|  | if (flags & CTF_STR_ADD_REF) | 
|  | { | 
|  | if (!aref_create (fp, atom, ref, flags)) | 
|  | goto oom; | 
|  | } | 
|  | } | 
|  |  | 
|  | return atom; | 
|  |  | 
|  | oom: | 
|  | if (added) | 
|  | ctf_dynhash_remove (fp->ctf_str_atoms, atom->csa_str); | 
|  | free (atom); | 
|  | free (newstr); | 
|  | ctf_set_errno (fp, ENOMEM); | 
|  | return NULL; | 
|  | } | 
|  |  | 
|  | /* Add a string to the atoms table, without augmenting the ref list for this | 
|  | string: return a 'provisional offset' which can be used to return this string | 
|  | until ctf_str_write_strtab is called, or 0 on failure.  (Everywhere the | 
|  | provisional offset is assigned to should be added as a ref using | 
|  | ctf_str_add_ref() as well.) */ | 
|  | uint32_t | 
|  | ctf_str_add (ctf_dict_t *fp, const char *str) | 
|  | { | 
|  | ctf_str_atom_t *atom; | 
|  |  | 
|  | if (!str) | 
|  | str = ""; | 
|  |  | 
|  | atom = ctf_str_add_ref_internal (fp, str, CTF_STR_PROVISIONAL, 0); | 
|  | if (!atom) | 
|  | return 0; | 
|  |  | 
|  | return atom->csa_offset; | 
|  | } | 
|  |  | 
|  | /* Like ctf_str_add(), but additionally augment the atom's refs list with the | 
|  | passed-in ref, whether or not the string is already present.  There is no | 
|  | attempt to deduplicate the refs list (but duplicates are harmless).  */ | 
|  | uint32_t | 
|  | ctf_str_add_ref (ctf_dict_t *fp, const char *str, uint32_t *ref) | 
|  | { | 
|  | ctf_str_atom_t *atom; | 
|  |  | 
|  | if (!str) | 
|  | str = ""; | 
|  |  | 
|  | atom = ctf_str_add_ref_internal (fp, str, CTF_STR_ADD_REF | 
|  | | CTF_STR_PROVISIONAL, ref); | 
|  | if (!atom) | 
|  | return 0; | 
|  |  | 
|  | return atom->csa_offset; | 
|  | } | 
|  |  | 
|  | /* Like ctf_str_add_ref(), but note that the ref may be moved later on.  */ | 
|  | uint32_t | 
|  | ctf_str_add_movable_ref (ctf_dict_t *fp, const char *str, uint32_t *ref) | 
|  | { | 
|  | ctf_str_atom_t *atom; | 
|  |  | 
|  | if (!str) | 
|  | str = ""; | 
|  |  | 
|  | atom = ctf_str_add_ref_internal (fp, str, CTF_STR_ADD_REF | 
|  | | CTF_STR_PROVISIONAL | 
|  | | CTF_STR_MOVABLE, ref); | 
|  | if (!atom) | 
|  | return 0; | 
|  |  | 
|  | return atom->csa_offset; | 
|  | } | 
|  |  | 
|  | /* Add an external strtab reference at OFFSET.  Returns zero if the addition | 
|  | failed, nonzero otherwise.  */ | 
|  | int | 
|  | ctf_str_add_external (ctf_dict_t *fp, const char *str, uint32_t offset) | 
|  | { | 
|  | ctf_str_atom_t *atom; | 
|  |  | 
|  | if (!str) | 
|  | str = ""; | 
|  |  | 
|  | atom = ctf_str_add_ref_internal (fp, str, 0, 0); | 
|  | if (!atom) | 
|  | return 0; | 
|  |  | 
|  | atom->csa_external_offset = CTF_SET_STID (offset, CTF_STRTAB_1); | 
|  |  | 
|  | if (!fp->ctf_syn_ext_strtab) | 
|  | fp->ctf_syn_ext_strtab = ctf_dynhash_create (ctf_hash_integer, | 
|  | ctf_hash_eq_integer, | 
|  | NULL, NULL); | 
|  | if (!fp->ctf_syn_ext_strtab) | 
|  | { | 
|  | ctf_set_errno (fp, ENOMEM); | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | if (ctf_dynhash_insert (fp->ctf_syn_ext_strtab, | 
|  | (void *) (uintptr_t) | 
|  | atom->csa_external_offset, | 
|  | (void *) atom->csa_str) < 0) | 
|  | { | 
|  | /* No need to bother freeing the syn_ext_strtab: it will get freed at | 
|  | ctf_str_write_strtab time if unreferenced.  */ | 
|  | ctf_set_errno (fp, ENOMEM); | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | return 1; | 
|  | } | 
|  |  | 
|  | /* Note that refs have moved from (SRC, LEN) to DEST.  We use the movable | 
|  | refs backpointer for this, because it is done an amortized-constant | 
|  | number of times during structure member and enumerand addition, and if we | 
|  | did a linear search this would turn such addition into an O(n^2) | 
|  | operation.  Even this is not linear, but it's better than that.  */ | 
|  | int | 
|  | ctf_str_move_refs (ctf_dict_t *fp, void *src, size_t len, void *dest) | 
|  | { | 
|  | uintptr_t p; | 
|  |  | 
|  | if (src == dest) | 
|  | return 0; | 
|  |  | 
|  | for (p = (uintptr_t) src; p - (uintptr_t) src < len; p++) | 
|  | { | 
|  | ctf_str_atom_ref_movable_t *ref; | 
|  |  | 
|  | if ((ref = ctf_dynhash_lookup (fp->ctf_str_movable_refs, | 
|  | (ctf_str_atom_ref_t *) p)) != NULL) | 
|  | { | 
|  | int out_of_memory; | 
|  |  | 
|  | ref->caf_ref = (uint32_t *) (((uintptr_t) ref->caf_ref + | 
|  | (uintptr_t) dest - (uintptr_t) src)); | 
|  | ctf_dynhash_remove (fp->ctf_str_movable_refs, | 
|  | (ctf_str_atom_ref_t *) p); | 
|  | out_of_memory = ctf_dynhash_insert (fp->ctf_str_movable_refs, | 
|  | ref->caf_ref, ref); | 
|  | assert (out_of_memory == 0); | 
|  | } | 
|  | } | 
|  |  | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | /* Remove a single ref.  */ | 
|  | void | 
|  | ctf_str_remove_ref (ctf_dict_t *fp, const char *str, uint32_t *ref) | 
|  | { | 
|  | ctf_str_atom_ref_t *aref, *anext; | 
|  | ctf_str_atom_ref_movable_t *amovref, *amovnext; | 
|  | ctf_str_atom_t *atom = NULL; | 
|  |  | 
|  | atom = ctf_dynhash_lookup (fp->ctf_str_atoms, str); | 
|  | if (!atom) | 
|  | return; | 
|  |  | 
|  | for (aref = ctf_list_next (&atom->csa_refs); aref != NULL; aref = anext) | 
|  | { | 
|  | anext = ctf_list_next (aref); | 
|  | if (aref->caf_ref == ref) | 
|  | { | 
|  | ctf_list_delete (&atom->csa_refs, aref); | 
|  | free (aref); | 
|  | } | 
|  | } | 
|  |  | 
|  | for (amovref = ctf_list_next (&atom->csa_movable_refs); | 
|  | amovref != NULL; amovref = amovnext) | 
|  | { | 
|  | amovnext = ctf_list_next (amovref); | 
|  | if (amovref->caf_ref == ref) | 
|  | { | 
|  | ctf_list_delete (&atom->csa_movable_refs, amovref); | 
|  | ctf_dynhash_remove (fp->ctf_str_movable_refs, ref); | 
|  | free (amovref); | 
|  | } | 
|  | } | 
|  | } | 
|  |  | 
|  | /* A ctf_dynhash_iter_remove() callback that removes atoms later than a given | 
|  | snapshot ID.  External atoms are never removed, because they came from the | 
|  | linker string table and are still present even if you roll back type | 
|  | additions.  */ | 
|  | static int | 
|  | ctf_str_rollback_atom (void *key _libctf_unused_, void *value, void *arg) | 
|  | { | 
|  | ctf_str_atom_t *atom = (ctf_str_atom_t *) value; | 
|  | ctf_snapshot_id_t *id = (ctf_snapshot_id_t *) arg; | 
|  |  | 
|  | return (atom->csa_snapshot_id > id->snapshot_id) | 
|  | && (atom->csa_external_offset == 0); | 
|  | } | 
|  |  | 
|  | /* Roll back, deleting all (internal) atoms created after a particular ID.  */ | 
|  | void | 
|  | ctf_str_rollback (ctf_dict_t *fp, ctf_snapshot_id_t id) | 
|  | { | 
|  | ctf_dynhash_iter_remove (fp->ctf_str_atoms, ctf_str_rollback_atom, &id); | 
|  | } | 
|  |  | 
|  | /* An adaptor around ctf_purge_atom_refs.  */ | 
|  | static void | 
|  | ctf_str_purge_one_atom_refs (void *key _libctf_unused_, void *value, | 
|  | void *arg _libctf_unused_) | 
|  | { | 
|  | ctf_str_atom_t *atom = (ctf_str_atom_t *) value; | 
|  |  | 
|  | ctf_str_purge_atom_refs (atom); | 
|  | } | 
|  |  | 
|  | /* Remove all the recorded refs from the atoms table.  */ | 
|  | static void | 
|  | ctf_str_purge_refs (ctf_dict_t *fp) | 
|  | { | 
|  | ctf_dynhash_iter (fp->ctf_str_atoms, ctf_str_purge_one_atom_refs, NULL); | 
|  | } | 
|  |  | 
|  | /* Update a list of refs to the specified value. */ | 
|  | static void | 
|  | ctf_str_update_refs (ctf_str_atom_t *refs, uint32_t value) | 
|  | { | 
|  | ctf_str_atom_ref_t *ref; | 
|  | ctf_str_atom_ref_movable_t *movref; | 
|  |  | 
|  | for (ref = ctf_list_next (&refs->csa_refs); ref != NULL; | 
|  | ref = ctf_list_next (ref)) | 
|  | *(ref->caf_ref) = value; | 
|  |  | 
|  | for (movref = ctf_list_next (&refs->csa_movable_refs); | 
|  | movref != NULL; movref = ctf_list_next (movref)) | 
|  | *(movref->caf_ref) = value; | 
|  | } | 
|  |  | 
|  | /* Sort the strtab.  */ | 
|  | static int | 
|  | ctf_str_sort_strtab (const void *a, const void *b) | 
|  | { | 
|  | ctf_str_atom_t **one = (ctf_str_atom_t **) a; | 
|  | ctf_str_atom_t **two = (ctf_str_atom_t **) b; | 
|  |  | 
|  | return (strcmp ((*one)->csa_str, (*two)->csa_str)); | 
|  | } | 
|  |  | 
|  | /* Write out and return a strtab containing all strings with recorded refs, | 
|  | adjusting the refs to refer to the corresponding string.  The returned | 
|  | strtab is already assigned to strtab 0 in this dict, is owned by this | 
|  | dict, and may be NULL on error.  Also populate the synthetic strtab with | 
|  | mappings from external strtab offsets to names, so we can look them up | 
|  | with ctf_strptr().  Only external strtab offsets with references are | 
|  | added. | 
|  |  | 
|  | As a side effect, replaces the strtab of the current dict with the newly- | 
|  | generated strtab.  This is an exception to the general rule that | 
|  | serialization does not change the dict passed in, because the alternative | 
|  | is to copy the entire atoms table on every reserialization just to avoid | 
|  | modifying the original, which is excessively costly for minimal gain. | 
|  |  | 
|  | We use the lazy man's approach and double memory costs by always storing | 
|  | atoms as individually allocated entities whenever they come from anywhere | 
|  | but a freshly-opened, mmapped dict, even though after serialization there | 
|  | is another copy in the strtab; this ensures that ctf_strptr()-returned | 
|  | pointers to them remain valid for the lifetime of the dict. | 
|  |  | 
|  | This is all rendered more complex because if a dict is ctf_open()ed it | 
|  | will have a bunch of strings in its strtab already, and their strtab | 
|  | offsets can never change (without piles of complexity to rescan the | 
|  | entire dict just to get all the offsets to all of them into the atoms | 
|  | table).  Entries below the existing strtab limit are just copied into the | 
|  | new dict: entries above it are new, and are are sorted first, then | 
|  | appended to it.  The sorting is purely a compression-efficiency | 
|  | improvement, and we get nearly as good an improvement from sorting big | 
|  | chunks like this as we would from sorting the whole thing.  */ | 
|  |  | 
|  | const ctf_strs_writable_t * | 
|  | ctf_str_write_strtab (ctf_dict_t *fp) | 
|  | { | 
|  | ctf_strs_writable_t *strtab; | 
|  | size_t strtab_count = 0; | 
|  | uint32_t cur_stroff = 0; | 
|  | ctf_str_atom_t **sorttab; | 
|  | ctf_next_t *it = NULL; | 
|  | size_t i; | 
|  | void *v; | 
|  | int err; | 
|  | int new_strtab = 0; | 
|  | int any_external = 0; | 
|  |  | 
|  | strtab = calloc (1, sizeof (ctf_strs_writable_t)); | 
|  | if (!strtab) | 
|  | return NULL; | 
|  |  | 
|  | /* The strtab contains the existing string table at its start: figure out | 
|  | how many new strings we need to add.  We only need to add new strings | 
|  | that have no external offset, that have refs, and that are found in the | 
|  | provisional strtab.  If the existing strtab is empty we also need to | 
|  | add the null string at its start.  */ | 
|  |  | 
|  | strtab->cts_len = fp->ctf_str[CTF_STRTAB_0].cts_len; | 
|  |  | 
|  | if (strtab->cts_len == 0) | 
|  | { | 
|  | new_strtab = 1; | 
|  | strtab->cts_len++; 			/* For the \0.  */ | 
|  | } | 
|  |  | 
|  | /* Count new entries in the strtab: i.e. entries in the provisional | 
|  | strtab.  Ignore any entry for \0, entries which ended up in the | 
|  | external strtab, and unreferenced entries.  */ | 
|  |  | 
|  | while ((err = ctf_dynhash_next (fp->ctf_prov_strtab, &it, NULL, &v)) == 0) | 
|  | { | 
|  | const char *str = (const char *) v; | 
|  | ctf_str_atom_t *atom; | 
|  |  | 
|  | atom = ctf_dynhash_lookup (fp->ctf_str_atoms, str); | 
|  | if (!ctf_assert (fp, atom)) | 
|  | goto err_strtab; | 
|  |  | 
|  | if (atom->csa_str[0] == 0 || atom->csa_external_offset | 
|  | || (ctf_list_empty_p (&atom->csa_refs) | 
|  | && ctf_list_empty_p (&atom->csa_movable_refs))) | 
|  | continue; | 
|  |  | 
|  | strtab->cts_len += strlen (atom->csa_str) + 1; | 
|  | strtab_count++; | 
|  | } | 
|  | if (err != ECTF_NEXT_END) | 
|  | { | 
|  | ctf_dprintf ("ctf_str_write_strtab: error counting strtab entries: %s\n", | 
|  | ctf_errmsg (err)); | 
|  | goto err_strtab; | 
|  | } | 
|  |  | 
|  | ctf_dprintf ("%lu bytes of strings in strtab: %lu pre-existing.\n", | 
|  | (unsigned long) strtab->cts_len, | 
|  | (unsigned long) fp->ctf_str[CTF_STRTAB_0].cts_len); | 
|  |  | 
|  | /* Sort the new part of the strtab.  */ | 
|  |  | 
|  | sorttab = calloc (strtab_count, sizeof (ctf_str_atom_t *)); | 
|  | if (!sorttab) | 
|  | { | 
|  | ctf_set_errno (fp, ENOMEM); | 
|  | goto err_strtab; | 
|  | } | 
|  |  | 
|  | i = 0; | 
|  | while ((err = ctf_dynhash_next (fp->ctf_prov_strtab, &it, NULL, &v)) == 0) | 
|  | { | 
|  | ctf_str_atom_t *atom; | 
|  |  | 
|  | atom = ctf_dynhash_lookup (fp->ctf_str_atoms, v); | 
|  | if (!ctf_assert (fp, atom)) | 
|  | goto err_sorttab; | 
|  |  | 
|  | if (atom->csa_str[0] == 0 || atom->csa_external_offset | 
|  | || (ctf_list_empty_p (&atom->csa_refs) | 
|  | && ctf_list_empty_p (&atom->csa_movable_refs))) | 
|  | continue; | 
|  |  | 
|  | sorttab[i++] = atom; | 
|  | } | 
|  |  | 
|  | qsort (sorttab, strtab_count, sizeof (ctf_str_atom_t *), | 
|  | ctf_str_sort_strtab); | 
|  |  | 
|  | if ((strtab->cts_strs = malloc (strtab->cts_len)) == NULL) | 
|  | goto err_sorttab; | 
|  |  | 
|  | cur_stroff = fp->ctf_str[CTF_STRTAB_0].cts_len; | 
|  |  | 
|  | if (new_strtab) | 
|  | { | 
|  | strtab->cts_strs[0] = 0; | 
|  | cur_stroff++; | 
|  | } | 
|  | else | 
|  | memcpy (strtab->cts_strs, fp->ctf_str[CTF_STRTAB_0].cts_strs, | 
|  | fp->ctf_str[CTF_STRTAB_0].cts_len); | 
|  |  | 
|  | /* Work over the sorttab, add its strings to the strtab, and remember | 
|  | where they are in the csa_offset for the appropriate atom.  No ref | 
|  | updating is done at this point, because refs might well relate to | 
|  | already-existing strings, or external strings, which do not need adding | 
|  | to the strtab and may not be in the sorttab.  */ | 
|  |  | 
|  | for (i = 0; i < strtab_count; i++) | 
|  | { | 
|  | sorttab[i]->csa_offset = cur_stroff; | 
|  | strcpy (&strtab->cts_strs[cur_stroff], sorttab[i]->csa_str); | 
|  | cur_stroff += strlen (sorttab[i]->csa_str) + 1; | 
|  | } | 
|  | free (sorttab); | 
|  | sorttab = NULL; | 
|  |  | 
|  | /* Update all refs, then purge them as no longer necessary: also update | 
|  | the strtab appropriately.  */ | 
|  |  | 
|  | while ((err = ctf_dynhash_next (fp->ctf_str_atoms, &it, NULL, &v)) == 0) | 
|  | { | 
|  | ctf_str_atom_t *atom = (ctf_str_atom_t *) v; | 
|  | uint32_t offset; | 
|  |  | 
|  | if (ctf_list_empty_p (&atom->csa_refs) && | 
|  | ctf_list_empty_p (&atom->csa_movable_refs)) | 
|  | continue; | 
|  |  | 
|  | if (atom->csa_external_offset) | 
|  | { | 
|  | any_external = 1; | 
|  | offset = atom->csa_external_offset; | 
|  | } | 
|  | else | 
|  | offset = atom->csa_offset; | 
|  | ctf_str_update_refs (atom, offset); | 
|  | } | 
|  | if (err != ECTF_NEXT_END) | 
|  | { | 
|  | ctf_dprintf ("ctf_str_write_strtab: error iterating over atoms while updating refs: %s\n", | 
|  | ctf_errmsg (err)); | 
|  | goto err_strtab; | 
|  | } | 
|  | ctf_str_purge_refs (fp); | 
|  |  | 
|  | if (!any_external) | 
|  | { | 
|  | ctf_dynhash_destroy (fp->ctf_syn_ext_strtab); | 
|  | fp->ctf_syn_ext_strtab = NULL; | 
|  | } | 
|  |  | 
|  | /* Replace the old strtab with the new one in this dict.  */ | 
|  |  | 
|  | if (fp->ctf_dynstrtab) | 
|  | { | 
|  | free (fp->ctf_dynstrtab->cts_strs); | 
|  | free (fp->ctf_dynstrtab); | 
|  | } | 
|  |  | 
|  | fp->ctf_dynstrtab = strtab; | 
|  | fp->ctf_str[CTF_STRTAB_0].cts_strs = strtab->cts_strs; | 
|  | fp->ctf_str[CTF_STRTAB_0].cts_len = strtab->cts_len; | 
|  |  | 
|  | /* All the provisional strtab entries are now real strtab entries, and | 
|  | ctf_strptr() will find them there.  The provisional offset now starts right | 
|  | beyond the new end of the strtab.  */ | 
|  |  | 
|  | ctf_dynhash_empty (fp->ctf_prov_strtab); | 
|  | fp->ctf_str_prov_offset = strtab->cts_len + 1; | 
|  | return strtab; | 
|  |  | 
|  | err_sorttab: | 
|  | free (sorttab); | 
|  | err_strtab: | 
|  | free (strtab); | 
|  | return NULL; | 
|  | } |