Blame SOURCES/ltrace-0.7.91-ppc64le-fixes.patch

e7106e
diff --git a/sysdeps/linux-gnu/ppc/arch.h b/sysdeps/linux-gnu/ppc/arch.h
e7106e
index d5ad759..a8b67bb 100644
e7106e
--- a/sysdeps/linux-gnu/ppc/arch.h
e7106e
+++ b/sysdeps/linux-gnu/ppc/arch.h
e7106e
@@ -32,36 +32,45 @@
e7106e
 #define LT_ELF_MACHINE	EM_PPC
e7106e
 
e7106e
 #ifdef __powerpc64__ // Says 'ltrace' is 64 bits, says nothing about target.
e7106e
-#define LT_ELFCLASS2	ELFCLASS64
e7106e
-#define LT_ELF_MACHINE2	EM_PPC64
e7106e
+# define LT_ELFCLASS2	ELFCLASS64
e7106e
+# define LT_ELF_MACHINE2	EM_PPC64
e7106e
 
e7106e
 # ifdef __LITTLE_ENDIAN__
e7106e
-# define BREAKPOINT_VALUE { 0x08, 0x00, 0xe0, 0x7f }
e7106e
-# define ARCH_ENDIAN_LITTLE
e7106e
+#  define BREAKPOINT_VALUE { 0x08, 0x00, 0xe0, 0x7f }
e7106e
+#  define ARCH_ENDIAN_LITTLE
e7106e
 # else
e7106e
-# define BREAKPOINT_VALUE { 0x7f, 0xe0, 0x00, 0x08 }
e7106e
-# define ARCH_SUPPORTS_OPD
e7106e
-# define ARCH_ENDIAN_BIG
e7106e
+#  define BREAKPOINT_VALUE { 0x7f, 0xe0, 0x00, 0x08 }
e7106e
+#  define ARCH_SUPPORTS_OPD
e7106e
+#  define ARCH_ENDIAN_BIG
e7106e
 # endif
e7106e
 
e7106e
-# if _CALL_ELF != 2
e7106e
-# define ARCH_SUPPORTS_OPD
e7106e
-# define STACK_FRAME_OVERHEAD 112
e7106e
+# if !defined(_CALL_ELF) || _CALL_ELF < 2
e7106e
+#  define ARCH_SUPPORTS_OPD
e7106e
+#  define STACK_FRAME_OVERHEAD 112
e7106e
 #  ifndef EF_PPC64_ABI
e7106e
-#  define EF_PPC64_ABI 3
e7106e
+#   define EF_PPC64_ABI 3
e7106e
 #  endif
e7106e
-# else /* _CALL_ELF == 2 ABIv2 */
e7106e
-# define STACK_FRAME_OVERHEAD 32
e7106e
+# elif _CALL_ELF == 2  /* ELFv2 ABI */
e7106e
+#  define STACK_FRAME_OVERHEAD 32
e7106e
+# else
e7106e
+#  error Unsupported PowerPC64 ABI.
e7106e
 # endif /* CALL_ELF */
e7106e
 
e7106e
 #else
e7106e
-#define BREAKPOINT_VALUE { 0x7f, 0xe0, 0x00, 0x08 }
e7106e
-#define ARCH_ENDIAN_BIG
e7106e
+# define STACK_FRAME_OVERHEAD 112
e7106e
+# define BREAKPOINT_VALUE { 0x7f, 0xe0, 0x00, 0x08 }
e7106e
+# define ARCH_ENDIAN_BIG
e7106e
 # ifndef EF_PPC64_ABI
e7106e
-# define EF_PPC64_ABI 3
e7106e
+#  define EF_PPC64_ABI 3
e7106e
 # endif
e7106e
 #endif 	/* __powerpc64__ */
e7106e
 
e7106e
+#ifdef _CALL_ELF
e7106e
+enum { ppc64_call_elf_abi = _CALL_ELF };
e7106e
+#else
e7106e
+enum { ppc64_call_elf_abi = 0 };
e7106e
+#endif
e7106e
+
e7106e
 #define ARCH_HAVE_SW_SINGLESTEP
e7106e
 #define ARCH_HAVE_ADD_PLT_ENTRY
e7106e
 #define ARCH_HAVE_ADD_FUNC_ENTRY
e7106e
diff --git a/sysdeps/linux-gnu/ppc/fetch.c b/sysdeps/linux-gnu/ppc/fetch.c
e7106e
index c9381c3..c6cbd71 100644
e7106e
--- a/sysdeps/linux-gnu/ppc/fetch.c
e7106e
+++ b/sysdeps/linux-gnu/ppc/fetch.c
e7106e
@@ -1,6 +1,6 @@
e7106e
 /*
e7106e
  * This file is part of ltrace.
e7106e
- * Copyright (C) 2012 Petr Machata, Red Hat Inc.
e7106e
+ * Copyright (C) 2012, 2014 Petr Machata, Red Hat Inc.
e7106e
  *
e7106e
  * This program is free software; you can redistribute it and/or
e7106e
  * modify it under the terms of the GNU General Public License as
e7106e
@@ -23,6 +23,7 @@
e7106e
 #include <stdlib.h>
e7106e
 #include <string.h>
e7106e
 #include <sys/ucontext.h>
e7106e
+#include <stdio.h>
e7106e
 
e7106e
 #include "backend.h"
e7106e
 #include "fetch.h"
e7106e
@@ -57,7 +58,7 @@ struct fetch_context {
e7106e
 	arch_addr_t stack_pointer;
e7106e
 	int greg;
e7106e
 	int freg;
e7106e
-	int ret_struct;
e7106e
+	bool ret_struct;
e7106e
 
e7106e
 	union {
e7106e
 		gregs32_t r32;
e7106e
@@ -65,11 +66,29 @@ struct fetch_context {
e7106e
 	} regs;
e7106e
 	struct fpregs_t fpregs;
e7106e
 	int vgreg;
e7106e
-	int struct_size;
e7106e
-	int struct_hfa_size;
e7106e
-	int struct_hfa_count;
e7106e
 };
e7106e
 
e7106e
+static bool
e7106e
+is_eligible_hfa(struct arg_type_info *info,
e7106e
+		struct arg_type_info **hfa_infop, size_t *hfa_countp)
e7106e
+{
e7106e
+	size_t hfa_count;
e7106e
+	struct arg_type_info *hfa_info = type_get_hfa_type(info, &hfa_count);
e7106e
+
e7106e
+	if (hfa_info != NULL && hfa_count <= 8
e7106e
+	    && (hfa_info->type == ARGTYPE_FLOAT
e7106e
+		|| hfa_info->type == ARGTYPE_DOUBLE)) {
e7106e
+
e7106e
+		if (hfa_infop != NULL)
e7106e
+			*hfa_infop = hfa_info;
e7106e
+		if (hfa_countp != NULL)
e7106e
+			*hfa_countp = hfa_count;
e7106e
+		return true;
e7106e
+	}
e7106e
+
e7106e
+	return false;
e7106e
+}
e7106e
+
e7106e
 static int
e7106e
 fetch_context_init(struct process *proc, struct fetch_context *context)
e7106e
 {
e7106e
@@ -125,30 +144,37 @@ arch_fetch_arg_init(enum tof type, struct process *proc,
e7106e
 	}
e7106e
 
e7106e
 	context->vgreg = context->greg;
e7106e
-	context->struct_size = 0;
e7106e
-	context->struct_hfa_size = 0;
e7106e
-	context->struct_hfa_count = 0;
e7106e
 
e7106e
 	/* Aggregates or unions of any length, and character strings
e7106e
 	 * of length longer than 8 bytes, will be returned in a
e7106e
 	 * storage buffer allocated by the caller. The caller will
e7106e
 	 * pass the address of this buffer as a hidden first argument
e7106e
 	 * in r3, causing the first explicit argument to be passed in
e7106e
-	 * r4.  */
e7106e
-	context->ret_struct = ret_info->type == ARGTYPE_STRUCT;
e7106e
-	if (context->ret_struct) {
e7106e
-#if _CALL_ELF == 2
e7106e
-		/* if R3 points to stack, parameters will be in R4.  */
e7106e
-		uint64_t pstack_end = ptrace(PTRACE_PEEKTEXT, proc->pid,
e7106e
-					proc->stack_pointer, 0);
e7106e
-		if (((arch_addr_t)context->regs.r64[3] > proc->stack_pointer)
e7106e
-		    && (context->regs.r64[3] < pstack_end)) {
e7106e
+	 * r4.
e7106e
+	 */
e7106e
+
e7106e
+	context->ret_struct = false;
e7106e
+
e7106e
+	if (ppc64_call_elf_abi == 2) {
e7106e
+		/* With ELFv2 ABI, aggregates that consist
e7106e
+		 * (recursively) only of members of the same
e7106e
+		 * floating-point or vector type, are passed in a
e7106e
+		 * series of floating-point resp. vector registers.
e7106e
+		 * Additionally, when returning any aggregate of up to
e7106e
+		 * 16 bytes, general-purpose registers are used.  */
e7106e
+
e7106e
+		if (ret_info->type == ARGTYPE_STRUCT
e7106e
+		    && ! is_eligible_hfa(ret_info, NULL, NULL)
e7106e
+		    && type_sizeof(proc, ret_info) > 16) {
e7106e
+
e7106e
+			context->ret_struct = true;
e7106e
 			context->greg++;
e7106e
 			context->stack_pointer += 8;
e7106e
 		}
e7106e
-#else
e7106e
+
e7106e
+	} else if (ret_info->type == ARGTYPE_STRUCT) {
e7106e
+		context->ret_struct = true;
e7106e
 		context->greg++;
e7106e
-#endif
e7106e
 	}
e7106e
 
e7106e
 	return context;
e7106e
@@ -176,17 +202,16 @@ allocate_stack_slot(struct fetch_context *ctx, struct process *proc,
e7106e
 
e7106e
 	size_t a = type_alignof(proc, info);
e7106e
 	size_t off = 0;
e7106e
-	if (proc->e_machine == EM_PPC && a < 4)
e7106e
-		a = 4;
e7106e
-#if _CALL_ELF == 2
e7106e
-	else if (proc->e_machine == EM_PPC64 && sz == 4 && is_hfa_type)
e7106e
+	if (proc->e_machine == EM_PPC && a < 4) {
e7106e
 		a = 4;
e7106e
-	else
e7106e
-		a = 8;
e7106e
-#else
e7106e
-	else if (proc->e_machine == EM_PPC64 && a < 8)
e7106e
-#endif
e7106e
+	} else if (ppc64_call_elf_abi == 2) {
e7106e
+		if (proc->e_machine == EM_PPC64 && sz == 4 && is_hfa_type) {
e7106e
+			a = 4;
e7106e
+		} else
e7106e
+			a = 8;
e7106e
+	} else if (proc->e_machine == EM_PPC64 && a < 8) {
e7106e
 		a = 8;
e7106e
+	}
e7106e
 
e7106e
 	/* XXX Remove the two double casts when arch_addr_t
e7106e
 	 * becomes integral type.  */
e7106e
@@ -259,18 +284,19 @@ allocate_gpr(struct fetch_context *ctx, struct process *proc,
e7106e
 	if (sz == (size_t)-1)
e7106e
 		return -1;
e7106e
 	assert(sz == 1 || sz == 2 || sz == 4 || sz == 8);
e7106e
-#if _CALL_ELF == 2
e7106e
-	/* Consume the stack slot corresponding to this arg.  */
e7106e
-	if ((sz + off) >= 8)
e7106e
-		ctx->greg++;
e7106e
 
e7106e
-	if (is_hfa_type)
e7106e
-		ctx->stack_pointer += sz;
e7106e
-	else
e7106e
-		ctx->stack_pointer += 8;
e7106e
-#else
e7106e
-	ctx->greg++;
e7106e
-#endif
e7106e
+	if (ppc64_call_elf_abi == 2) {
e7106e
+		/* Consume the stack slot corresponding to this arg.  */
e7106e
+		if ((sz + off) >= 8)
e7106e
+			ctx->greg++;
e7106e
+
e7106e
+		if (is_hfa_type)
e7106e
+			ctx->stack_pointer += sz;
e7106e
+		else
e7106e
+			ctx->stack_pointer += 8;
e7106e
+	} else {
e7106e
+		ctx->greg++;
e7106e
+	}
e7106e
 
e7106e
 	if (valuep == NULL)
e7106e
 		return 0;
e7106e
@@ -326,7 +352,6 @@ allocate_float(struct fetch_context *ctx, struct process *proc,
e7106e
 	return allocate_stack_slot(ctx, proc, info, valuep, is_hfa_type);
e7106e
 }
e7106e
 
e7106e
-#if _CALL_ELF == 2
e7106e
 static int
e7106e
 allocate_hfa(struct fetch_context *ctx, struct process *proc,
e7106e
 	     struct arg_type_info *info, struct value *valuep,
e7106e
@@ -336,27 +361,27 @@ allocate_hfa(struct fetch_context *ctx, struct process *proc,
e7106e
 	if (sz == (size_t)-1)
e7106e
 		return -1;
e7106e
 
e7106e
-	ctx->struct_hfa_size += sz;
e7106e
-
e7106e
 	/* There are two changes regarding structure return types:
e7106e
-	 * * heterogeneous float/vector structs are returned
e7106e
-	 *   in (multiple) FP/vector registers,
e7106e
-	 *   instead of via implicit reference.
e7106e
-	 * * small structs (up to 16 bytes) are return
e7106e
-	 *   in one or two GPRs, instead of via implicit reference.
e7106e
+	 * * heterogeneous float/vector structs are returned in
e7106e
+	 *   (multiple) FP/vector registers, instead of via implicit
e7106e
+	 *   reference.
e7106e
+	 * * small structs (up to 16 bytes) are return in one or two
e7106e
+	 *   GPRs, instead of via implicit reference.
e7106e
 	 *
e7106e
 	 * Other structures (larger than 16 bytes, not heterogeneous)
e7106e
 	 * are still returned via implicit reference (i.e. a pointer
e7106e
 	 * to memory where to return the struct being passed in r3).
e7106e
-	 * Of course, whether or not an implicit reference pointer
e7106e
-	 * is present will shift the remaining arguments,
e7106e
-	 * so you need to get this right for ELFv2 in order
e7106e
-	 * to get the arguments correct.
e7106e
+	 * Of course, whether or not an implicit reference pointer is
e7106e
+	 * present will shift the remaining arguments, so you need to
e7106e
+	 * get this right for ELFv2 in order to get the arguments
e7106e
+	 * correct.
e7106e
+	 *
e7106e
 	 * If an actual parameter is known to correspond to an HFA
e7106e
 	 * formal parameter, each element is passed in the next
e7106e
 	 * available floating-point argument register starting at fp1
e7106e
 	 * until the fp13. The remaining elements of the aggregate are
e7106e
-	 * passed on the stack.  */
e7106e
+	 * passed on the stack.
e7106e
+	 */
e7106e
 	size_t slot_off = 0;
e7106e
 
e7106e
 	unsigned char *buf = value_reserve(valuep, sz);
e7106e
@@ -366,26 +391,17 @@ allocate_hfa(struct fetch_context *ctx, struct process *proc,
e7106e
 	struct arg_type_info *hfa_info = type_get_simple(hfa_type);
e7106e
 	size_t hfa_sz = type_sizeof(proc, hfa_info);
e7106e
 
e7106e
-	if (hfa_count > 8)
e7106e
-		ctx->struct_hfa_count += hfa_count;
e7106e
-
e7106e
 	while (hfa_count > 0 && ctx->freg <= 13) {
e7106e
-		int rc;
e7106e
 		struct value tmp;
e7106e
-
e7106e
 		value_init(&tmp, proc, NULL, hfa_info, 0);
e7106e
+		int rc = allocate_float(ctx, proc, hfa_info,
e7106e
+					&tmp, slot_off, true);
e7106e
+		if (rc == 0)
e7106e
+			memcpy(buf, value_get_data(&tmp, NULL), hfa_sz);
e7106e
+		value_destroy(&tmp);
e7106e
 
e7106e
-		/* Hetereogeneous struct - get value on GPR or stack.  */
e7106e
-		if (((hfa_type == ARGTYPE_FLOAT
e7106e
-		    || hfa_type == ARGTYPE_DOUBLE)
e7106e
-		      && hfa_count <= 8))
e7106e
-			rc = allocate_float(ctx, proc, hfa_info, &tmp,
e7106e
-						slot_off, true);
e7106e
-		else
e7106e
-			rc = allocate_gpr(ctx, proc, hfa_info, &tmp,
e7106e
-						slot_off, true);
e7106e
-
e7106e
-		memcpy(buf, value_get_data(&tmp, NULL), hfa_sz);
e7106e
+		if (rc < 0)
e7106e
+			return -1;
e7106e
 
e7106e
 		slot_off += hfa_sz;
e7106e
 		buf += hfa_sz;
e7106e
@@ -394,17 +410,13 @@ allocate_hfa(struct fetch_context *ctx, struct process *proc,
e7106e
 			slot_off = 0;
e7106e
 			ctx->vgreg++;
e7106e
 		}
e7106e
-
e7106e
-		value_destroy(&tmp);
e7106e
-		if (rc < 0)
e7106e
-			return -1;
e7106e
 	}
e7106e
 	if (hfa_count == 0)
e7106e
 		return 0;
e7106e
 
e7106e
 	/* if no remaining FP, GPR corresponding to slot is used
e7106e
-	* Mostly it is in part of r10.  */
e7106e
-	if (ctx->struct_hfa_size <= 64 && ctx->vgreg == 10) {
e7106e
+	 * Mostly it is in part of r10.  */
e7106e
+	if (ctx->vgreg == 10) {
e7106e
 		while (ctx->vgreg <= 10) {
e7106e
 			struct value tmp;
e7106e
 			value_init(&tmp, proc, NULL, hfa_info, 0);
e7106e
@@ -428,11 +440,8 @@ allocate_hfa(struct fetch_context *ctx, struct process *proc,
e7106e
 		}
e7106e
 	}
e7106e
 
e7106e
-	if (hfa_count == 0)
e7106e
-		return 0;
e7106e
-
e7106e
 	/* Remaining values are on stack */
e7106e
-	while (hfa_count) {
e7106e
+	while (hfa_count > 0) {
e7106e
 		struct value tmp;
e7106e
 		value_init(&tmp, proc, NULL, hfa_info, 0);
e7106e
 
e7106e
@@ -444,7 +453,6 @@ allocate_hfa(struct fetch_context *ctx, struct process *proc,
e7106e
 	}
e7106e
 	return 0;
e7106e
 }
e7106e
-#endif
e7106e
 
e7106e
 static int
e7106e
 allocate_argument(struct fetch_context *ctx, struct process *proc,
e7106e
@@ -459,24 +467,20 @@ allocate_argument(struct fetch_context *ctx, struct process *proc,
e7106e
 	case ARGTYPE_FLOAT:
e7106e
 	case ARGTYPE_DOUBLE:
e7106e
 		return allocate_float(ctx, proc, info, valuep,
e7106e
-					8 - type_sizeof(proc,info), false);
e7106e
+				      8 - type_sizeof(proc,info), false);
e7106e
 
e7106e
 	case ARGTYPE_STRUCT:
e7106e
 		if (proc->e_machine == EM_PPC) {
e7106e
 			if (value_pass_by_reference(valuep) < 0)
e7106e
 				return -1;
e7106e
-		} else {
e7106e
-#if _CALL_ELF == 2
e7106e
+		} else if (ppc64_call_elf_abi == 2) {
e7106e
 			struct arg_type_info *hfa_info;
e7106e
-			size_t hfa_size;
e7106e
-			hfa_info = type_get_hfa_type(info, &hfa_size);
e7106e
-			if (hfa_info != NULL ) {
e7106e
-				size_t sz = type_sizeof(proc, info);
e7106e
-				ctx->struct_size += sz;
e7106e
+			size_t hfa_count;
e7106e
+			if (is_eligible_hfa(info, &hfa_info, &hfa_count)) {
e7106e
 				return allocate_hfa(ctx, proc, info, valuep,
e7106e
-						hfa_info->type, hfa_size);
e7106e
+						hfa_info->type, hfa_count);
e7106e
 			}
e7106e
-#endif
e7106e
+		} else {
e7106e
 			/* PPC64: Fixed size aggregates and unions passed by
e7106e
 			 * value are mapped to as many doublewords of the
e7106e
 			 * parameter save area as the value uses in memory.
e7106e
@@ -510,9 +514,6 @@ allocate_argument(struct fetch_context *ctx, struct process *proc,
e7106e
 	if (sz == (size_t)-1)
e7106e
 		return -1;
e7106e
 
e7106e
-	if (ctx->ret_struct)
e7106e
-		ctx->struct_size += sz;
e7106e
-
e7106e
 	size_t slots = (sz + width - 1) / width;  /* Round up.  */
e7106e
 	unsigned char *buf = value_reserve(valuep, slots * width);
e7106e
 	if (buf == NULL)
e7106e
@@ -605,19 +606,7 @@ arch_fetch_retval(struct fetch_context *ctx, enum tof type,
e7106e
 	if (fetch_context_init(proc, ctx) < 0)
e7106e
 		return -1;
e7106e
 
e7106e
-#if _CALL_ELF == 2
e7106e
-	void *ptr = (void *)(ctx->regs.r64[1]+32);
e7106e
-	uint64_t val = ptrace(PTRACE_PEEKTEXT, proc->pid, ptr, 0);
e7106e
-
e7106e
-	if (ctx->ret_struct
e7106e
-	   && ((ctx->struct_size > 64
e7106e
-	      || ctx->struct_hfa_count > 8
e7106e
-	      || (ctx->struct_hfa_size == 0 && ctx->struct_size > 56)
e7106e
-	      || (ctx->regs.r64[3] == ctx->regs.r64[1]+32)
e7106e
-	      || (ctx->regs.r64[3] == val )))) {
e7106e
-#else
e7106e
 	if (ctx->ret_struct) {
e7106e
-#endif
e7106e
 		assert(info->type == ARGTYPE_STRUCT);
e7106e
 
e7106e
 		uint64_t addr = read_gpr(ctx, proc, 3);