Blame SOURCES/gdb-linux_perf-bundle.patch

2f9ed3
From FEDORA_PATCHES Mon Sep 17 00:00:00 2001
2f9ed3
From: Fedora GDB patches <invalid@email.com>
2f9ed3
Date: Fri, 27 Oct 2017 21:07:50 +0200
2f9ed3
Subject: gdb-linux_perf-bundle.patch
2f9ed3
2f9ed3
;; [dts+el7] [x86*] Bundle linux_perf.h for libipt (RH BZ 1256513).
2f9ed3
;;=fedora
2f9ed3
2f9ed3
diff --git a/gdb/configure b/gdb/configure
2f9ed3
--- a/gdb/configure
2f9ed3
+++ b/gdb/configure
2f9ed3
@@ -12137,7 +12137,7 @@ else
2f9ed3
 
2f9ed3
 #include <linux/perf_event.h>
2f9ed3
 #ifndef PERF_ATTR_SIZE_VER5
2f9ed3
-# error
2f9ed3
+// error // PERF_ATTR_SIZE_VER5_BUNDLE is not available here - Fedora+RHEL
2f9ed3
 #endif
2f9ed3
 
2f9ed3
 _ACEOF
2f9ed3
diff --git a/gdb/configure.ac b/gdb/configure.ac
2f9ed3
--- a/gdb/configure.ac
2f9ed3
+++ b/gdb/configure.ac
2f9ed3
@@ -1500,7 +1500,7 @@ else
2f9ed3
   AC_PREPROC_IFELSE([AC_LANG_SOURCE([[
2f9ed3
 #include <linux/perf_event.h>
2f9ed3
 #ifndef PERF_ATTR_SIZE_VER5
2f9ed3
-# error
2f9ed3
+// error // PERF_ATTR_SIZE_VER5_BUNDLE is not available here - Fedora+RHEL
2f9ed3
 #endif
2f9ed3
   ]])], [perf_event=yes], [perf_event=no])
2f9ed3
   if test "$perf_event" != yes; then
2f9ed3
diff --git a/gdb/gdb.c b/gdb/gdb.c
2f9ed3
--- a/gdb/gdb.c
2f9ed3
+++ b/gdb/gdb.c
2f9ed3
@@ -20,11 +20,19 @@
2f9ed3
 #include "main.h"
2f9ed3
 #include "interps.h"
2f9ed3
 
2f9ed3
+#ifdef PERF_ATTR_SIZE_VER5_BUNDLE
2f9ed3
+extern "C" void __libipt_init(void);
2f9ed3
+#endif
2f9ed3
+
2f9ed3
 int
2f9ed3
 main (int argc, char **argv)
2f9ed3
 {
2f9ed3
   struct captured_main_args args;
2f9ed3
 
2f9ed3
+#ifdef PERF_ATTR_SIZE_VER5_BUNDLE
2f9ed3
+  __libipt_init();
2f9ed3
+#endif
2f9ed3
+
2f9ed3
   memset (&args, 0, sizeof args);
2f9ed3
   args.argc = argc;
2f9ed3
   args.argv = argv;
2f9ed3
diff --git a/gdb/nat/linux-btrace.h b/gdb/nat/linux-btrace.h
2f9ed3
--- a/gdb/nat/linux-btrace.h
2f9ed3
+++ b/gdb/nat/linux-btrace.h
2f9ed3
@@ -28,6 +28,177 @@
2f9ed3
 #  include <linux/perf_event.h>
2f9ed3
 #endif
2f9ed3
 
2f9ed3
+#ifdef PERF_ATTR_SIZE_VER5_BUNDLE
2f9ed3
+#ifndef HAVE_LINUX_PERF_EVENT_H
2f9ed3
+# error "PERF_ATTR_SIZE_VER5_BUNDLE && !HAVE_LINUX_PERF_EVENT_H"
2f9ed3
+#endif
2f9ed3
+#ifndef PERF_ATTR_SIZE_VER5
2f9ed3
+#define PERF_ATTR_SIZE_VER5
2f9ed3
+#define perf_event_mmap_page perf_event_mmap_page_bundle
2f9ed3
+// kernel-headers-3.10.0-493.el7.x86_64/usr/include/linux/perf_event.h
2f9ed3
+/*
2f9ed3
+ * Structure of the page that can be mapped via mmap
2f9ed3
+ */
2f9ed3
+struct perf_event_mmap_page {
2f9ed3
+	__u32	version;		/* version number of this structure */
2f9ed3
+	__u32	compat_version;		/* lowest version this is compat with */
2f9ed3
+
2f9ed3
+	/*
2f9ed3
+	 * Bits needed to read the hw events in user-space.
2f9ed3
+	 *
2f9ed3
+	 *   u32 seq, time_mult, time_shift, index, width;
2f9ed3
+	 *   u64 count, enabled, running;
2f9ed3
+	 *   u64 cyc, time_offset;
2f9ed3
+	 *   s64 pmc = 0;
2f9ed3
+	 *
2f9ed3
+	 *   do {
2f9ed3
+	 *     seq = pc->lock;
2f9ed3
+	 *     barrier();
2f9ed3
+	 *
2f9ed3
+	 *     enabled = pc->time_enabled;
2f9ed3
+	 *     running = pc->time_running;
2f9ed3
+	 *
2f9ed3
+	 *     if (pc->cap_user_time && enabled != running) {
2f9ed3
+	 *       cyc = rdtsc();
2f9ed3
+	 *       time_offset = pc->time_offset;
2f9ed3
+	 *       time_mult   = pc->time_mult;
2f9ed3
+	 *       time_shift  = pc->time_shift;
2f9ed3
+	 *     }
2f9ed3
+	 *
2f9ed3
+	 *     index = pc->index;
2f9ed3
+	 *     count = pc->offset;
2f9ed3
+	 *     if (pc->cap_user_rdpmc && index) {
2f9ed3
+	 *       width = pc->pmc_width;
2f9ed3
+	 *       pmc = rdpmc(index - 1);
2f9ed3
+	 *     }
2f9ed3
+	 *
2f9ed3
+	 *     barrier();
2f9ed3
+	 *   } while (pc->lock != seq);
2f9ed3
+	 *
2f9ed3
+	 * NOTE: for obvious reasons this only works on self-monitoring
2f9ed3
+	 *       processes.
2f9ed3
+	 */
2f9ed3
+	__u32	lock;			/* seqlock for synchronization */
2f9ed3
+	__u32	index;			/* hardware event identifier */
2f9ed3
+	__s64	offset;			/* add to hardware event value */
2f9ed3
+	__u64	time_enabled;		/* time event active */
2f9ed3
+	__u64	time_running;		/* time event on cpu */
2f9ed3
+	union {
2f9ed3
+		__u64	capabilities;
2f9ed3
+		struct {
2f9ed3
+			__u64	cap_bit0		: 1, /* Always 0, deprecated, see commit 860f085b74e9 */
2f9ed3
+				cap_bit0_is_deprecated	: 1, /* Always 1, signals that bit 0 is zero */
2f9ed3
+
2f9ed3
+				cap_user_rdpmc		: 1, /* The RDPMC instruction can be used to read counts */
2f9ed3
+				cap_user_time		: 1, /* The time_* fields are used */
2f9ed3
+				cap_user_time_zero	: 1, /* The time_zero field is used */
2f9ed3
+				cap_____res		: 59;
2f9ed3
+		};
2f9ed3
+	};
2f9ed3
+
2f9ed3
+	/*
2f9ed3
+	 * If cap_user_rdpmc this field provides the bit-width of the value
2f9ed3
+	 * read using the rdpmc() or equivalent instruction. This can be used
2f9ed3
+	 * to sign extend the result like:
2f9ed3
+	 *
2f9ed3
+	 *   pmc <<= 64 - width;
2f9ed3
+	 *   pmc >>= 64 - width; // signed shift right
2f9ed3
+	 *   count += pmc;
2f9ed3
+	 */
2f9ed3
+	__u16	pmc_width;
2f9ed3
+
2f9ed3
+	/*
2f9ed3
+	 * If cap_user_time the below fields can be used to compute the time
2f9ed3
+	 * delta since time_enabled (in ns) using rdtsc or similar.
2f9ed3
+	 *
2f9ed3
+	 *   u64 quot, rem;
2f9ed3
+	 *   u64 delta;
2f9ed3
+	 *
2f9ed3
+	 *   quot = (cyc >> time_shift);
2f9ed3
+	 *   rem = cyc & (((u64)1 << time_shift) - 1);
2f9ed3
+	 *   delta = time_offset + quot * time_mult +
2f9ed3
+	 *              ((rem * time_mult) >> time_shift);
2f9ed3
+	 *
2f9ed3
+	 * Where time_offset,time_mult,time_shift and cyc are read in the
2f9ed3
+	 * seqcount loop described above. This delta can then be added to
2f9ed3
+	 * enabled and possibly running (if index), improving the scaling:
2f9ed3
+	 *
2f9ed3
+	 *   enabled += delta;
2f9ed3
+	 *   if (index)
2f9ed3
+	 *     running += delta;
2f9ed3
+	 *
2f9ed3
+	 *   quot = count / running;
2f9ed3
+	 *   rem  = count % running;
2f9ed3
+	 *   count = quot * enabled + (rem * enabled) / running;
2f9ed3
+	 */
2f9ed3
+	__u16	time_shift;
2f9ed3
+	__u32	time_mult;
2f9ed3
+	__u64	time_offset;
2f9ed3
+	/*
2f9ed3
+	 * If cap_user_time_zero, the hardware clock (e.g. TSC) can be calculated
2f9ed3
+	 * from sample timestamps.
2f9ed3
+	 *
2f9ed3
+	 *   time = timestamp - time_zero;
2f9ed3
+	 *   quot = time / time_mult;
2f9ed3
+	 *   rem  = time % time_mult;
2f9ed3
+	 *   cyc = (quot << time_shift) + (rem << time_shift) / time_mult;
2f9ed3
+	 *
2f9ed3
+	 * And vice versa:
2f9ed3
+	 *
2f9ed3
+	 *   quot = cyc >> time_shift;
2f9ed3
+	 *   rem  = cyc & (((u64)1 << time_shift) - 1);
2f9ed3
+	 *   timestamp = time_zero + quot * time_mult +
2f9ed3
+	 *               ((rem * time_mult) >> time_shift);
2f9ed3
+	 */
2f9ed3
+	__u64	time_zero;
2f9ed3
+	__u32	size;			/* Header size up to __reserved[] fields. */
2f9ed3
+
2f9ed3
+		/*
2f9ed3
+		 * Hole for extension of the self monitor capabilities
2f9ed3
+		 */
2f9ed3
+
2f9ed3
+	__u8	__reserved[118*8+4];	/* align to 1k. */
2f9ed3
+
2f9ed3
+	/*
2f9ed3
+	 * Control data for the mmap() data buffer.
2f9ed3
+	 *
2f9ed3
+	 * User-space reading the @data_head value should issue an smp_rmb(),
2f9ed3
+	 * after reading this value.
2f9ed3
+	 *
2f9ed3
+	 * When the mapping is PROT_WRITE the @data_tail value should be
2f9ed3
+	 * written by userspace to reflect the last read data, after issuing
2f9ed3
+	 * an smp_mb() to separate the data read from the ->data_tail store.
2f9ed3
+	 * In this case the kernel will not over-write unread data.
2f9ed3
+	 *
2f9ed3
+	 * See perf_output_put_handle() for the data ordering.
2f9ed3
+	 *
2f9ed3
+	 * data_{offset,size} indicate the location and size of the perf record
2f9ed3
+	 * buffer within the mmapped area.
2f9ed3
+	 */
2f9ed3
+	__u64   data_head;		/* head in the data section */
2f9ed3
+	__u64	data_tail;		/* user-space written tail */
2f9ed3
+	__u64	data_offset;		/* where the buffer starts */
2f9ed3
+	__u64	data_size;		/* data buffer size */
2f9ed3
+
2f9ed3
+	/*
2f9ed3
+	 * AUX area is defined by aux_{offset,size} fields that should be set
2f9ed3
+	 * by the userspace, so that
2f9ed3
+	 *
2f9ed3
+	 *   aux_offset >= data_offset + data_size
2f9ed3
+	 *
2f9ed3
+	 * prior to mmap()ing it. Size of the mmap()ed area should be aux_size.
2f9ed3
+	 *
2f9ed3
+	 * Ring buffer pointers aux_{head,tail} have the same semantics as
2f9ed3
+	 * data_{head,tail} and same ordering rules apply.
2f9ed3
+	 */
2f9ed3
+	__u64	aux_head;
2f9ed3
+	__u64	aux_tail;
2f9ed3
+	__u64	aux_offset;
2f9ed3
+	__u64	aux_size;
2f9ed3
+};
2f9ed3
+#endif // PERF_ATTR_SIZE_VER5
2f9ed3
+#endif // PERF_ATTR_SIZE_VER5_BUNDLE
2f9ed3
+
2f9ed3
 struct target_ops;
2f9ed3
 
2f9ed3
 #if HAVE_LINUX_PERF_EVENT_H