b1dca6
commit 73b6e50a22dea9ae6144beaaa675d2ac62c281ca
b1dca6
Author: Florian Weimer <fweimer@redhat.com>
b1dca6
Date:   Fri Dec 4 09:13:43 2020 +0100
b1dca6
b1dca6
    elf: Implement tail merging of strings in ldconfig
b1dca6
    
b1dca6
    This simplifies the string table construction in elf/cache.c
b1dca6
    because there is no more need to keep track of offsets explicitly;
b1dca6
    the string table implementation does this internally.
b1dca6
    
b1dca6
    This change slightly reduces the size of the cache on disk.  The
b1dca6
    file format does not change as a result.  The strings are
b1dca6
    null-terminated, without explicit length, so tail merging is
b1dca6
    transparent to readers.
b1dca6
    
b1dca6
    Reviewed-by: Adhemerval Zanella  <adhemerval.zanella@linaro.org>
b1dca6
b1dca6
diff --git a/elf/Makefile b/elf/Makefile
b1dca6
index abb3e9d1179ef5cd..a3e802a9a99b759c 100644
b1dca6
--- a/elf/Makefile
b1dca6
+++ b/elf/Makefile
b1dca6
@@ -112,7 +112,8 @@ others-static	+= ldconfig
b1dca6
 others		+= ldconfig
b1dca6
 install-rootsbin += ldconfig
b1dca6
 
b1dca6
-ldconfig-modules := cache readlib xmalloc xstrdup chroot_canon static-stubs
b1dca6
+ldconfig-modules := cache readlib xmalloc xstrdup chroot_canon static-stubs \
b1dca6
+  stringtable
b1dca6
 extra-objs	+= $(ldconfig-modules:=.o)
b1dca6
 others-extras   = $(ldconfig-modules)
b1dca6
 endif
b1dca6
diff --git a/elf/cache.c b/elf/cache.c
b1dca6
index 5a8f1ad70cc3fead..f773cacacf26db1c 100644
b1dca6
--- a/elf/cache.c
b1dca6
+++ b/elf/cache.c
b1dca6
@@ -35,11 +35,15 @@
b1dca6
 #include <ldconfig.h>
b1dca6
 #include <dl-cache.h>
b1dca6
 #include <version.h>
b1dca6
+#include <stringtable.h>
b1dca6
+
b1dca6
+/* Used to store library names, paths, and other strings.  */
b1dca6
+static struct stringtable strings;
b1dca6
 
b1dca6
 struct cache_entry
b1dca6
 {
b1dca6
-  char *lib;			/* Library name.  */
b1dca6
-  char *path;			/* Path to find library.  */
b1dca6
+  struct stringtable_entry *lib; /* Library name.  */
b1dca6
+  struct stringtable_entry *path; /* Path to find library.  */
b1dca6
   int flags;			/* Flags to indicate kind of library.  */
b1dca6
   unsigned int osversion;	/* Required OS version.  */
b1dca6
   uint64_t hwcap;		/* Important hardware capabilities.  */
b1dca6
@@ -300,7 +304,7 @@ static int
b1dca6
 compare (const struct cache_entry *e1, const struct cache_entry *e2)
b1dca6
 {
b1dca6
   /* We need to swap entries here to get the correct sort order.  */
b1dca6
-  int res = _dl_cache_libcmp (e2->lib, e1->lib);
b1dca6
+  int res = _dl_cache_libcmp (e2->lib->string, e1->lib->string);
b1dca6
   if (res == 0)
b1dca6
     {
b1dca6
       if (e1->flags < e2->flags)
b1dca6
@@ -369,26 +373,24 @@ save_cache (const char *cache_name)
b1dca6
 {
b1dca6
   /* The cache entries are sorted already, save them in this order. */
b1dca6
 
b1dca6
-  /* Count the length of all strings.  */
b1dca6
-  /* The old format doesn't contain hwcap entries and doesn't contain
b1dca6
-     libraries in subdirectories with hwcaps entries.  Count therefore
b1dca6
-     also all entries with hwcap == 0.  */
b1dca6
-  size_t total_strlen = 0;
b1dca6
   struct cache_entry *entry;
b1dca6
   /* Number of cache entries.  */
b1dca6
   int cache_entry_count = 0;
b1dca6
-  /* Number of normal cache entries.  */
b1dca6
+  /* The old format doesn't contain hwcap entries and doesn't contain
b1dca6
+     libraries in subdirectories with hwcaps entries.  Count therefore
b1dca6
+     also all entries with hwcap == 0.  */
b1dca6
   int cache_entry_old_count = 0;
b1dca6
 
b1dca6
   for (entry = entries; entry != NULL; entry = entry->next)
b1dca6
     {
b1dca6
-      /* Account the final NULs.  */
b1dca6
-      total_strlen += strlen (entry->lib) + strlen (entry->path) + 2;
b1dca6
       ++cache_entry_count;
b1dca6
       if (entry->hwcap == 0)
b1dca6
 	++cache_entry_old_count;
b1dca6
     }
b1dca6
 
b1dca6
+  struct stringtable_finalized strings_finalized;
b1dca6
+  stringtable_finalize (&strings, &strings_finalized);
b1dca6
+
b1dca6
   /* Create the on disk cache structure.  */
b1dca6
   struct cache_file *file_entries = NULL;
b1dca6
   size_t file_entries_size = 0;
b1dca6
@@ -432,7 +434,7 @@ save_cache (const char *cache_name)
b1dca6
 	      sizeof CACHE_VERSION - 1);
b1dca6
 
b1dca6
       file_entries_new->nlibs = cache_entry_count;
b1dca6
-      file_entries_new->len_strings = total_strlen;
b1dca6
+      file_entries_new->len_strings = strings_finalized.size;
b1dca6
       file_entries_new->flags = cache_file_new_flags_endian_current;
b1dca6
     }
b1dca6
 
b1dca6
@@ -449,20 +451,20 @@ save_cache (const char *cache_name)
b1dca6
     str_offset = 0;
b1dca6
 
b1dca6
   /* An array for all strings.  */
b1dca6
-  char *strings = xmalloc (total_strlen);
b1dca6
-  char *str = strings;
b1dca6
   int idx_old;
b1dca6
   int idx_new;
b1dca6
 
b1dca6
   for (idx_old = 0, idx_new = 0, entry = entries; entry != NULL;
b1dca6
        entry = entry->next, ++idx_new)
b1dca6
     {
b1dca6
-      /* First the library.  */
b1dca6
       if (opt_format != opt_format_new && entry->hwcap == 0)
b1dca6
 	{
b1dca6
 	  file_entries->libs[idx_old].flags = entry->flags;
b1dca6
 	  /* XXX: Actually we can optimize here and remove duplicates.  */
b1dca6
 	  file_entries->libs[idx_old].key = str_offset + pad;
b1dca6
+	  file_entries->libs[idx_old].key += entry->lib->offset;
b1dca6
+	  file_entries->libs[idx_old].value
b1dca6
+	    = str_offset + pad + entry->path->offset;
b1dca6
 	}
b1dca6
       if (opt_format != opt_format_old)
b1dca6
 	{
b1dca6
@@ -473,20 +475,12 @@ save_cache (const char *cache_name)
b1dca6
 	  file_entries_new->libs[idx_new].flags = entry->flags;
b1dca6
 	  file_entries_new->libs[idx_new].osversion = entry->osversion;
b1dca6
 	  file_entries_new->libs[idx_new].hwcap = entry->hwcap;
b1dca6
-	  file_entries_new->libs[idx_new].key = str_offset;
b1dca6
+	  file_entries_new->libs[idx_new].key
b1dca6
+	    = str_offset + entry->lib->offset;
b1dca6
+	  file_entries_new->libs[idx_new].value
b1dca6
+	    = str_offset + entry->path->offset;
b1dca6
 	}
b1dca6
 
b1dca6
-      size_t len = strlen (entry->lib) + 1;
b1dca6
-      str = mempcpy (str, entry->lib, len);
b1dca6
-      str_offset += len;
b1dca6
-      /* Then the path.  */
b1dca6
-      if (opt_format != opt_format_new && entry->hwcap == 0)
b1dca6
-	file_entries->libs[idx_old].value = str_offset + pad;
b1dca6
-      if (opt_format != opt_format_old)
b1dca6
-	file_entries_new->libs[idx_new].value = str_offset;
b1dca6
-      len = strlen (entry->path) + 1;
b1dca6
-      str = mempcpy (str, entry->path, len);
b1dca6
-      str_offset += len;
b1dca6
       /* Ignore entries with hwcap for old format.  */
b1dca6
       if (entry->hwcap == 0)
b1dca6
 	++idx_old;
b1dca6
@@ -511,7 +505,7 @@ save_cache (const char *cache_name)
b1dca6
 	extension_offset += pad;
b1dca6
       extension_offset += file_entries_new_size;
b1dca6
     }
b1dca6
-  extension_offset += total_strlen;
b1dca6
+  extension_offset += strings_finalized.size;
b1dca6
   extension_offset = roundup (extension_offset, 4); /* Provide alignment.  */
b1dca6
   if (opt_format != opt_format_old)
b1dca6
     file_entries_new->extension_offset = extension_offset;
b1dca6
@@ -551,7 +545,8 @@ save_cache (const char *cache_name)
b1dca6
 	error (EXIT_FAILURE, errno, _("Writing of cache data failed"));
b1dca6
     }
b1dca6
 
b1dca6
-  if (write (fd, strings, total_strlen) != (ssize_t) total_strlen)
b1dca6
+  if (write (fd, strings_finalized.strings, strings_finalized.size)
b1dca6
+      != (ssize_t) strings_finalized.size)
b1dca6
     error (EXIT_FAILURE, errno, _("Writing of cache data failed"));
b1dca6
 
b1dca6
   if (opt_format != opt_format_old)
b1dca6
@@ -580,7 +575,7 @@ save_cache (const char *cache_name)
b1dca6
   /* Free all allocated memory.  */
b1dca6
   free (file_entries_new);
b1dca6
   free (file_entries);
b1dca6
-  free (strings);
b1dca6
+  free (strings_finalized.strings);
b1dca6
 
b1dca6
   while (entries)
b1dca6
     {
b1dca6
@@ -596,14 +591,19 @@ void
b1dca6
 add_to_cache (const char *path, const char *lib, int flags,
b1dca6
 	      unsigned int osversion, uint64_t hwcap)
b1dca6
 {
b1dca6
-  size_t liblen = strlen (lib) + 1;
b1dca6
-  size_t len = liblen + strlen (path) + 1;
b1dca6
-  struct cache_entry *new_entry
b1dca6
-    = xmalloc (sizeof (struct cache_entry) + liblen + len);
b1dca6
-
b1dca6
-  new_entry->lib = memcpy ((char *) (new_entry + 1), lib, liblen);
b1dca6
-  new_entry->path = new_entry->lib + liblen;
b1dca6
-  snprintf (new_entry->path, len, "%s/%s", path, lib);
b1dca6
+  struct cache_entry *new_entry = xmalloc (sizeof (*new_entry));
b1dca6
+
b1dca6
+  struct stringtable_entry *path_interned;
b1dca6
+  {
b1dca6
+    char *p;
b1dca6
+    if (asprintf (&p, "%s/%s", path, lib) < 0)
b1dca6
+      error (EXIT_FAILURE, errno, _("Could not create library path"));
b1dca6
+    path_interned = stringtable_add (&strings, p);
b1dca6
+    free (p);
b1dca6
+  }
b1dca6
+
b1dca6
+  new_entry->lib = stringtable_add (&strings, lib);
b1dca6
+  new_entry->path = path_interned;
b1dca6
   new_entry->flags = flags;
b1dca6
   new_entry->osversion = osversion;
b1dca6
   new_entry->hwcap = hwcap;