Blame SOURCES/ltrace-0.7.91-ppc64-unprelink.patch

2e4be5
From a0093ca43cf40d7e5f6cebeb64156062d2de46d9 Mon Sep 17 00:00:00 2001
2e4be5
From: Petr Machata <pmachata@redhat.com>
2e4be5
Date: Fri, 10 Jan 2014 20:06:51 +0100
2e4be5
Subject: [PATCH 2/2] Don't crash untraced calls via PLT in prelinked PPC64
2e4be5
 binaries
2e4be5
2e4be5
In prelinked binaries, ltrace has to unprelink PLT slots in order to
2e4be5
catch calls done through PLT.  This makes the calls done through these
2e4be5
slots invalid, because the special first PLT slot is not initialized,
2e4be5
and dynamic linker SIGSEGVs because of this.  Ltrace relies on
2e4be5
arranging breakpoints such that the dynamic linker is not actually
2e4be5
entered, and moves PC around itself to simulate the effects of a call
2e4be5
through PLT.
2e4be5
2e4be5
Originally, arch_elf_add_plt_entry was called only for symbols that
2e4be5
were actually traced.  Later this was changed and it's now called for
2e4be5
all PLT entries, and the resulting candidate list is filtered
2e4be5
afterwards.  This gives backends a chance to rename the symbol, as is
2e4be5
useful with IRELATIVE PLT calls, where symbol name may not be
2e4be5
available at all.  But the PPC backend was never updated to reflect
2e4be5
this, and unresolved all symbols for which arch_elf_add_plt_entry was
2e4be5
called, thus rendering _all_ PLT slots invalid, even those that
2e4be5
weren't later protected by breakpoints.  Thus calls done through any
2e4be5
untraced slots failed.
2e4be5
2e4be5
This patch fixes this problem by deferring the unprelinking of PLT
2e4be5
slots into the on_install hook of breakpoints.
2e4be5
---
2e4be5
 sysdeps/linux-gnu/ppc/arch.h |   21 ++++++++-
2e4be5
 sysdeps/linux-gnu/ppc/plt.c  |   94 +++++++++++++++++++++++++++++++++--------
2e4be5
 2 files changed, 94 insertions(+), 21 deletions(-)
2e4be5
2e4be5
diff --git a/sysdeps/linux-gnu/ppc/arch.h b/sysdeps/linux-gnu/ppc/arch.h
2e4be5
index 2add3b8..bf9b5dc 100644
2e4be5
--- a/sysdeps/linux-gnu/ppc/arch.h
2e4be5
+++ b/sysdeps/linux-gnu/ppc/arch.h
2e4be5
@@ -1,6 +1,6 @@
2e4be5
 /*
2e4be5
  * This file is part of ltrace.
2e4be5
- * Copyright (C) 2012,2013 Petr Machata
2e4be5
+ * Copyright (C) 2012,2013,2014 Petr Machata
2e4be5
  * Copyright (C) 2006 Paul Gilliam
2e4be5
  * Copyright (C) 2002,2004 Juan Cespedes
2e4be5
  *
2e4be5
@@ -87,12 +87,29 @@ enum ppc64_plt_type {
2e4be5
 	/* Very similar to PPC_PLT_UNRESOLVED, but for JMP_IREL
2e4be5
 	 * slots.  */
2e4be5
 	PPC_PLT_IRELATIVE,
2e4be5
+
2e4be5
+	/* Transitional state before the breakpoint is enabled.  */
2e4be5
+	PPC_PLT_NEED_UNRESOLVE,
2e4be5
 };
2e4be5
 
2e4be5
 #define ARCH_HAVE_LIBRARY_SYMBOL_DATA
2e4be5
+struct ppc_unresolve_data;
2e4be5
 struct arch_library_symbol_data {
2e4be5
 	enum ppc64_plt_type type;
2e4be5
-	GElf_Addr resolved_value;
2e4be5
+
2e4be5
+	/* State		Contents
2e4be5
+	 *
2e4be5
+	 * PPC_DEFAULT		N/A
2e4be5
+	 * PPC64_PLT_STUB	N/A
2e4be5
+	 * PPC_PLT_UNRESOLVED	PLT entry address.
2e4be5
+	 * PPC_PLT_IRELATIVE	Likewise.
2e4be5
+	 * PPC_PLT_RESOLVED	The original value the slot was resolved to.
2e4be5
+	 * PPC_PLT_NEED_UNRESOLVE	DATA.
2e4be5
+	 */
2e4be5
+	union {
2e4be5
+		GElf_Addr resolved_value;
2e4be5
+		struct ppc_unresolve_data *data;
2e4be5
+	};
2e4be5
 
2e4be5
 	/* Address of corresponding slot in .plt.  */
2e4be5
 	GElf_Addr plt_slot_addr;
2e4be5
diff --git a/sysdeps/linux-gnu/ppc/plt.c b/sysdeps/linux-gnu/ppc/plt.c
2e4be5
index 8715da6..332daa8 100644
2e4be5
--- a/sysdeps/linux-gnu/ppc/plt.c
2e4be5
+++ b/sysdeps/linux-gnu/ppc/plt.c
2e4be5
@@ -679,6 +679,14 @@ arch_elf_add_func_entry(struct process *proc, struct ltelf *lte,
2e4be5
 	return PLT_OK;
2e4be5
 }
2e4be5
 
2e4be5
+struct ppc_unresolve_data {
2e4be5
+	struct ppc_unresolve_data *self; /* A canary.  */
2e4be5
+	GElf_Addr plt_entry_addr;
2e4be5
+	GElf_Addr plt_slot_addr;
2e4be5
+	GElf_Addr plt_slot_value;
2e4be5
+	bool is_irelative;
2e4be5
+};
2e4be5
+
2e4be5
 enum plt_status
2e4be5
 arch_elf_add_plt_entry(struct process *proc, struct ltelf *lte,
2e4be5
 		       const char *a_name, GElf_Rela *rela, size_t ndx,
2e4be5
@@ -778,28 +786,23 @@ arch_elf_add_plt_entry(struct process *proc, struct ltelf *lte,
2e4be5
 	    && (plt_slot_value == plt_entry_addr || plt_slot_value == 0)) {
2e4be5
 		libsym->arch.type = PPC_PLT_UNRESOLVED;
2e4be5
 		libsym->arch.resolved_value = plt_entry_addr;
2e4be5
-
2e4be5
 	} else {
2e4be5
-		/* Unresolve the .plt slot.  If the binary was
2e4be5
-		 * prelinked, this makes the code invalid, because in
2e4be5
-		 * case of prelinked binary, the dynamic linker
2e4be5
-		 * doesn't update .plt[0] and .plt[1] with addresses
2e4be5
-		 * of the resover.  But we don't care, we will never
2e4be5
-		 * need to enter the resolver.  That just means that
2e4be5
-		 * we have to un-un-resolve this back before we
2e4be5
-		 * detach.  */
2e4be5
-
2e4be5
-		if (unresolve_plt_slot(proc, plt_slot_addr, plt_entry_addr) < 0) {
2e4be5
-			library_symbol_destroy(libsym);
2e4be5
+		/* Mark the symbol for later unresolving.  We may not
2e4be5
+		 * do this right away, as this is called by ltrace
2e4be5
+		 * core for all symbols, and only later filtered.  We
2e4be5
+		 * only unresolve the symbol before the breakpoint is
2e4be5
+		 * enabled.  */
2e4be5
+
2e4be5
+		libsym->arch.type = PPC_PLT_NEED_UNRESOLVE;
2e4be5
+		libsym->arch.data = malloc(sizeof *libsym->arch.data);
2e4be5
+		if (libsym->arch.data == NULL)
2e4be5
 			goto fail2;
2e4be5
-		}
2e4be5
 
2e4be5
-		if (! is_irelative) {
2e4be5
-			mark_as_resolved(libsym, plt_slot_value);
2e4be5
-		} else {
2e4be5
-			libsym->arch.type = PPC_PLT_IRELATIVE;
2e4be5
-			libsym->arch.resolved_value = plt_entry_addr;
2e4be5
-		}
2e4be5
+		libsym->arch.data->self = libsym->arch.data;
2e4be5
+		libsym->arch.data->plt_entry_addr = plt_entry_addr;
2e4be5
+		libsym->arch.data->plt_slot_addr = plt_slot_addr;
2e4be5
+		libsym->arch.data->plt_slot_value = plt_slot_value;
2e4be5
+		libsym->arch.data->is_irelative = is_irelative;
2e4be5
 	}
2e4be5
 
2e4be5
 	*ret = libsym;
2e4be5
@@ -999,6 +1002,7 @@ ppc_plt_bp_continue(struct breakpoint *bp, struct process *proc)
2e4be5
 		return;
2e4be5
 
2e4be5
 	case PPC64_PLT_STUB:
2e4be5
+	case PPC_PLT_NEED_UNRESOLVE:
2e4be5
 		/* These should never hit here.  */
2e4be5
 		break;
2e4be5
 	}
2e4be5
@@ -1050,6 +1054,52 @@ ppc_plt_bp_retract(struct breakpoint *bp, struct process *proc)
2e4be5
 	}
2e4be5
 }
2e4be5
 
2e4be5
+static void
2e4be5
+ppc_plt_bp_install(struct breakpoint *bp, struct process *proc)
2e4be5
+{
2e4be5
+	/* This should not be an artificial breakpoint.  */
2e4be5
+	struct library_symbol *libsym = bp->libsym;
2e4be5
+	if (libsym == NULL)
2e4be5
+		libsym = bp->arch.irel_libsym;
2e4be5
+	assert(libsym != NULL);
2e4be5
+
2e4be5
+	if (libsym->arch.type == PPC_PLT_NEED_UNRESOLVE) {
2e4be5
+		/* Unresolve the .plt slot.  If the binary was
2e4be5
+		 * prelinked, this makes the code invalid, because in
2e4be5
+		 * case of prelinked binary, the dynamic linker
2e4be5
+		 * doesn't update .plt[0] and .plt[1] with addresses
2e4be5
+		 * of the resover.  But we don't care, we will never
2e4be5
+		 * need to enter the resolver.  That just means that
2e4be5
+		 * we have to un-un-resolve this back before we
2e4be5
+		 * detach.  */
2e4be5
+
2e4be5
+		struct ppc_unresolve_data *data = libsym->arch.data;
2e4be5
+		libsym->arch.data = NULL;
2e4be5
+		assert(data->self == data);
2e4be5
+
2e4be5
+		GElf_Addr plt_slot_addr = data->plt_slot_addr;
2e4be5
+		GElf_Addr plt_slot_value = data->plt_slot_value;
2e4be5
+		GElf_Addr plt_entry_addr = data->plt_entry_addr;
2e4be5
+
2e4be5
+		if (unresolve_plt_slot(proc, plt_slot_addr,
2e4be5
+				       plt_entry_addr) == 0) {
2e4be5
+			if (! data->is_irelative) {
2e4be5
+				mark_as_resolved(libsym, plt_slot_value);
2e4be5
+			} else {
2e4be5
+				libsym->arch.type = PPC_PLT_IRELATIVE;
2e4be5
+				libsym->arch.resolved_value = plt_entry_addr;
2e4be5
+			}
2e4be5
+		} else {
2e4be5
+			fprintf(stderr, "Couldn't unresolve %s@%p.  Not tracing"
2e4be5
+				" this symbol.\n",
2e4be5
+				breakpoint_name(bp), bp->addr);
2e4be5
+			proc_remove_breakpoint(proc, bp);
2e4be5
+		}
2e4be5
+
2e4be5
+		free(data);
2e4be5
+	}
2e4be5
+}
2e4be5
+
2e4be5
 int
2e4be5
 arch_library_init(struct library *lib)
2e4be5
 {
2e4be5
@@ -1080,6 +1130,11 @@ arch_library_symbol_init(struct library_symbol *libsym)
2e4be5
 void
2e4be5
 arch_library_symbol_destroy(struct library_symbol *libsym)
2e4be5
 {
2e4be5
+	if (libsym->arch.type == PPC_PLT_NEED_UNRESOLVE) {
2e4be5
+		assert(libsym->arch.data->self == libsym->arch.data);
2e4be5
+		free(libsym->arch.data);
2e4be5
+		libsym->arch.data = NULL;
2e4be5
+	}
2e4be5
 }
2e4be5
 
2e4be5
 int
2e4be5
@@ -1115,6 +1170,7 @@ arch_breakpoint_init(struct process *proc, struct breakpoint *bp)
2e4be5
 	static struct bp_callbacks cbs = {
2e4be5
 		.on_continue = ppc_plt_bp_continue,
2e4be5
 		.on_retract = ppc_plt_bp_retract,
2e4be5
+		.on_install = ppc_plt_bp_install,
2e4be5
 	};
2e4be5
 	breakpoint_set_callbacks(bp, &cbs);
2e4be5
 
2e4be5
-- 
2e4be5
1.7.6.5
2e4be5