Blame SOURCES/0001-arm64-Support-overflow-stack-panic.patch

e64a0b
From 995db8ab88916b6397676b67be98c0a4f82cca49 Mon Sep 17 00:00:00 2001
e64a0b
From: Hong YANG <hong.yang3@nio.com>
e64a0b
Date: Mon, 15 Nov 2021 15:41:01 +0800
e64a0b
Subject: [PATCH 1/3] arm64: Support overflow stack panic
e64a0b
e64a0b
Kernel commit <872d8327ce89> ("arm64: add VMAP_STACK overflow detection")
e64a0b
added support for overflow stack exception handling. Without this patch, the
e64a0b
"bt" command causes crash to dump core because of a segmentation fault.
e64a0b
With this patch, the "bt" command can display the overflow stack.
e64a0b
e64a0b
Before:
e64a0b
crash> bt
e64a0b
PID: 3607   TASK: ffffffcbf9a4da00  CPU: 2   COMMAND: "sh"
e64a0b
Segmentation fault (core dumped)
e64a0b
e64a0b
After:
e64a0b
crash> bt
e64a0b
PID: 3607   TASK: ffffffcbf9a4da00  CPU: 2   COMMAND: "sh"
e64a0b
 #0 [ffffffccbfd85f50] __delay at ffffff8008ceded8
e64a0b
...
e64a0b
 #5 [ffffffccbfd85fd0] emergency_restart at ffffff80080d49fc
e64a0b
 #6 [ffffffccbfd86140] panic at ffffff80080af4c0
e64a0b
 #7 [ffffffccbfd86150] nmi_panic at ffffff80080af150
e64a0b
 #8 [ffffffccbfd86190] handle_bad_stack at ffffff800808b0b8
e64a0b
 #9 [ffffffccbfd862d0] __bad_stack at ffffff800808285c
e64a0b
     PC: ffffff8008082e80  [el1_sync]
e64a0b
     LR: ffffff8000d6c214  [stack_overflow_demo+84]
e64a0b
     SP: ffffff1a79930070  PSTATE: 204003c5
e64a0b
    X29: ffffff8011b03d00  X28: ffffffcbf9a4da00  X27: ffffff8008e02000
e64a0b
    X26: 0000000000000040  X25: 0000000000000124  X24: ffffffcbf9a4da00
e64a0b
    X23: 0000007daec2e288  X22: ffffffcbfe03b800  X21: 0000007daec2e288
e64a0b
    X20: 0000000000000002  X19: 0000000000000002  X18: 0000000000000002
e64a0b
    X17: 00000000000003e7  X16: 0000000000000000  X15: 0000000000000000
e64a0b
    X14: ffffffcc17facb00  X13: ffffffccb4c25c00  X12: 0000000000000000
e64a0b
    X11: ffffffcc17fad660  X10: 0000000000000af0   X9: 0000000000000000
e64a0b
     X8: ffffff1a799334f0   X7: 0000000000000000   X6: 000000000000003f
e64a0b
     X5: 0000000000000040   X4: 0000000000000010   X3: 00000065981d07f0
e64a0b
     X2: 00000065981d07f0   X1: 0000000000000000   X0: ffffff1a799334f0
e64a0b
e64a0b
Signed-off-by: Hong YANG <hong.yang3@nio.com>
e64a0b
---
e64a0b
 arm64.c | 169 ++++++++++++++++++++++++++++++++++++++++++++++++++------
e64a0b
 defs.h  |   6 ++
e64a0b
 2 files changed, 159 insertions(+), 16 deletions(-)
e64a0b
e64a0b
diff --git a/arm64.c b/arm64.c
e64a0b
index 94681d1a37db..23c3d75d85aa 100644
e64a0b
--- a/arm64.c
e64a0b
+++ b/arm64.c
e64a0b
@@ -45,6 +45,7 @@ static int arm64_vtop_3level_4k(ulong, ulong, physaddr_t *, int);
e64a0b
 static int arm64_vtop_4level_4k(ulong, ulong, physaddr_t *, int);
e64a0b
 static ulong arm64_get_task_pgd(ulong);
e64a0b
 static void arm64_irq_stack_init(void);
e64a0b
+static void arm64_overflow_stack_init(void);
e64a0b
 static void arm64_stackframe_init(void);
e64a0b
 static int arm64_eframe_search(struct bt_info *);
e64a0b
 static int arm64_is_kernel_exception_frame(struct bt_info *, ulong);
e64a0b
@@ -63,6 +64,7 @@ static int arm64_get_dumpfile_stackframe(struct bt_info *, struct arm64_stackfra
e64a0b
 static int arm64_in_kdump_text(struct bt_info *, struct arm64_stackframe *);
e64a0b
 static int arm64_in_kdump_text_on_irq_stack(struct bt_info *);
e64a0b
 static int arm64_switch_stack(struct bt_info *, struct arm64_stackframe *, FILE *);
e64a0b
+static int arm64_switch_stack_from_overflow(struct bt_info *, struct arm64_stackframe *, FILE *);
e64a0b
 static int arm64_get_stackframe(struct bt_info *, struct arm64_stackframe *);
e64a0b
 static void arm64_get_stack_frame(struct bt_info *, ulong *, ulong *);
e64a0b
 static void arm64_gen_hidden_frame(struct bt_info *bt, ulong, struct arm64_stackframe *);
e64a0b
@@ -78,8 +80,11 @@ static int arm64_get_smp_cpus(void);
e64a0b
 static void arm64_clear_machdep_cache(void);
e64a0b
 static int arm64_on_process_stack(struct bt_info *, ulong);
e64a0b
 static int arm64_in_alternate_stack(int, ulong);
e64a0b
+static int arm64_in_alternate_stackv(int cpu, ulong stkptr, ulong *stacks, ulong stack_size);
e64a0b
 static int arm64_on_irq_stack(int, ulong);
e64a0b
+static int arm64_on_overflow_stack(int, ulong);
e64a0b
 static void arm64_set_irq_stack(struct bt_info *);
e64a0b
+static void arm64_set_overflow_stack(struct bt_info *);
e64a0b
 static void arm64_set_process_stack(struct bt_info *);
e64a0b
 static int arm64_get_kvaddr_ranges(struct vaddr_range *);
e64a0b
 static void arm64_get_crash_notes(void);
e64a0b
@@ -463,6 +468,7 @@ arm64_init(int when)
e64a0b
 			machdep->hz = 100;
e64a0b
 
e64a0b
 		arm64_irq_stack_init();
e64a0b
+		arm64_overflow_stack_init();
e64a0b
 		arm64_stackframe_init();
e64a0b
 		break;
e64a0b
 
e64a0b
@@ -1715,6 +1721,49 @@ arm64_irq_stack_init(void)
e64a0b
 	} 
e64a0b
 }
e64a0b
 
e64a0b
+/*
e64a0b
+ *  Gather Overflow stack values.
e64a0b
+ *
e64a0b
+ *  Overflow stack supported since Linux 4.14, kernel commit 872d8327ce89.
e64a0b
+ */
e64a0b
+static void
e64a0b
+arm64_overflow_stack_init(void)
e64a0b
+{
e64a0b
+	int i;
e64a0b
+	struct syment *sp;
e64a0b
+	struct gnu_request request, *req;
e64a0b
+	struct machine_specific *ms = machdep->machspec;
e64a0b
+	req = &request;
e64a0b
+
e64a0b
+	if (symbol_exists("overflow_stack") &&
e64a0b
+	    (sp = per_cpu_symbol_search("overflow_stack")) &&
e64a0b
+	    get_symbol_type("overflow_stack", NULL, req)) {
e64a0b
+		if (CRASHDEBUG(1)) {
e64a0b
+			fprintf(fp, "overflow_stack: \n");
e64a0b
+			fprintf(fp, "  type: %x, %s\n",
e64a0b
+				(int)req->typecode,
e64a0b
+				(req->typecode == TYPE_CODE_ARRAY) ?
e64a0b
+						"TYPE_CODE_ARRAY" : "other");
e64a0b
+			fprintf(fp, "  target_typecode: %x, %s\n",
e64a0b
+				(int)req->target_typecode,
e64a0b
+				req->target_typecode == TYPE_CODE_INT ?
e64a0b
+						"TYPE_CODE_INT" : "other");
e64a0b
+			fprintf(fp, "  target_length: %ld\n",
e64a0b
+						req->target_length);
e64a0b
+			fprintf(fp, "  length: %ld\n", req->length);
e64a0b
+		}
e64a0b
+
e64a0b
+		if (!(ms->overflow_stacks = (ulong *)malloc((size_t)(kt->cpus * sizeof(ulong)))))
e64a0b
+			error(FATAL, "cannot malloc overflow_stack addresses\n");
e64a0b
+
e64a0b
+		ms->overflow_stack_size = ARM64_OVERFLOW_STACK_SIZE;
e64a0b
+		machdep->flags |= OVERFLOW_STACKS;
e64a0b
+
e64a0b
+		for (i = 0; i < kt->cpus; i++)
e64a0b
+			ms->overflow_stacks[i] = kt->__per_cpu_offset[i] + sp->value;
e64a0b
+	}
e64a0b
+}
e64a0b
+
e64a0b
 /*
e64a0b
  *  Gather and verify all of the backtrace requirements.
e64a0b
  */
e64a0b
@@ -1960,6 +2009,7 @@ static char *arm64_exception_functions[] = {
e64a0b
         "do_mem_abort",
e64a0b
         "do_el0_irq_bp_hardening",
e64a0b
         "do_sp_pc_abort",
e64a0b
+        "handle_bad_stack",
e64a0b
         NULL
e64a0b
 };
e64a0b
 
e64a0b
@@ -1978,7 +2028,10 @@ arm64_in_exception_text(ulong ptr)
e64a0b
 		if ((ptr >= ms->__exception_text_start) &&
e64a0b
 		    (ptr < ms->__exception_text_end))
e64a0b
 			return TRUE;
e64a0b
-	} else if ((name = closest_symbol(ptr))) {  /* Linux 5.5 and later */
e64a0b
+	}
e64a0b
+
e64a0b
+	name = closest_symbol(ptr);
e64a0b
+	if (name != NULL) { /* Linux 5.5 and later */
e64a0b
 		for (func = &arm64_exception_functions[0]; *func; func++) {
e64a0b
 			if (STREQ(name, *func))
e64a0b
 				return TRUE;
e64a0b
@@ -2252,15 +2305,14 @@ arm64_unwind_frame(struct bt_info *bt, struct arm64_stackframe *frame)
e64a0b
 	if ((frame->fp == 0) && (frame->pc == 0))
e64a0b
 		return FALSE;
e64a0b
 
e64a0b
-	if (!(machdep->flags & IRQ_STACKS))
e64a0b
-		return TRUE;
e64a0b
-
e64a0b
-	if (!(machdep->flags & IRQ_STACKS))
e64a0b
+	if (!(machdep->flags & (IRQ_STACKS | OVERFLOW_STACKS)))
e64a0b
 		return TRUE;
e64a0b
 
e64a0b
 	if (machdep->flags & UNW_4_14) {
e64a0b
-		if ((bt->flags & BT_IRQSTACK) &&
e64a0b
-		    !arm64_on_irq_stack(bt->tc->processor, frame->fp)) {
e64a0b
+		if (((bt->flags & BT_IRQSTACK) &&
e64a0b
+		     !arm64_on_irq_stack(bt->tc->processor, frame->fp)) ||
e64a0b
+		    ((bt->flags & BT_OVERFLOW_STACK) &&
e64a0b
+		     !arm64_on_overflow_stack(bt->tc->processor, frame->fp))) {
e64a0b
 			if (arm64_on_process_stack(bt, frame->fp)) {
e64a0b
 				arm64_set_process_stack(bt);
e64a0b
 
e64a0b
@@ -2677,6 +2729,9 @@ arm64_back_trace_cmd(struct bt_info *bt)
e64a0b
 		if (arm64_on_irq_stack(bt->tc->processor, bt->frameptr)) {
e64a0b
 			arm64_set_irq_stack(bt);
e64a0b
 			bt->flags |= BT_IRQSTACK;
e64a0b
+		} else if (arm64_on_overflow_stack(bt->tc->processor, bt->frameptr)) {
e64a0b
+			arm64_set_overflow_stack(bt);
e64a0b
+			bt->flags |= BT_OVERFLOW_STACK;
e64a0b
 		}
e64a0b
 		stackframe.sp = bt->stkptr;
e64a0b
 		stackframe.pc = bt->instptr;
e64a0b
@@ -2731,7 +2786,9 @@ arm64_back_trace_cmd(struct bt_info *bt)
e64a0b
 			break;
e64a0b
 
e64a0b
 		if (arm64_in_exception_text(bt->instptr) && INSTACK(stackframe.fp, bt)) {
e64a0b
-			if (!(bt->flags & BT_IRQSTACK) ||
e64a0b
+			if (bt->flags & BT_OVERFLOW_STACK) {
e64a0b
+				exception_frame = stackframe.fp - KERN_EFRAME_OFFSET;
e64a0b
+			} else if (!(bt->flags & BT_IRQSTACK) ||
e64a0b
 			    ((stackframe.sp + SIZE(pt_regs)) < bt->stacktop)) {
e64a0b
 				if (arm64_is_kernel_exception_frame(bt, stackframe.fp - KERN_EFRAME_OFFSET))
e64a0b
 					exception_frame = stackframe.fp - KERN_EFRAME_OFFSET;
e64a0b
@@ -2745,6 +2802,12 @@ arm64_back_trace_cmd(struct bt_info *bt)
e64a0b
 				break;
e64a0b
 		}
e64a0b
 
e64a0b
+		if ((bt->flags & BT_OVERFLOW_STACK) &&
e64a0b
+		    !arm64_on_overflow_stack(bt->tc->processor, stackframe.fp)) {
e64a0b
+			bt->flags &= ~BT_OVERFLOW_STACK;
e64a0b
+			if (arm64_switch_stack_from_overflow(bt, &stackframe, ofp) == USER_MODE)
e64a0b
+				break;
e64a0b
+		}
e64a0b
 
e64a0b
 		level++;
e64a0b
 	}
e64a0b
@@ -3131,6 +3194,43 @@ arm64_switch_stack(struct bt_info *bt, struct arm64_stackframe *frame, FILE *ofp
e64a0b
 	return KERNEL_MODE;
e64a0b
 }
e64a0b
 
e64a0b
+static int
e64a0b
+arm64_switch_stack_from_overflow(struct bt_info *bt, struct arm64_stackframe *frame, FILE *ofp)
e64a0b
+{
e64a0b
+	int i;
e64a0b
+	ulong stacktop, words, addr;
e64a0b
+	ulong *stackbuf;
e64a0b
+	char buf[BUFSIZE];
e64a0b
+	struct machine_specific *ms = machdep->machspec;
e64a0b
+
e64a0b
+	if (bt->flags & BT_FULL) {
e64a0b
+		stacktop = ms->overflow_stacks[bt->tc->processor] + ms->overflow_stack_size;
e64a0b
+		words = (stacktop - bt->bptr) / sizeof(ulong);
e64a0b
+		stackbuf = (ulong *)GETBUF(words * sizeof(ulong));
e64a0b
+		readmem(bt->bptr, KVADDR, stackbuf, words * sizeof(long),
e64a0b
+			"top of overflow stack", FAULT_ON_ERROR);
e64a0b
+
e64a0b
+		addr = bt->bptr;
e64a0b
+		for (i = 0; i < words; i++) {
e64a0b
+			if (!(i & 1))
e64a0b
+				fprintf(ofp, "%s    %lx: ", i ? "\n" : "", addr);
e64a0b
+			fprintf(ofp, "%s ", format_stack_entry(bt, buf, stackbuf[i], 0));
e64a0b
+			addr += sizeof(ulong);
e64a0b
+		}
e64a0b
+		fprintf(ofp, "\n");
e64a0b
+		FREEBUF(stackbuf);
e64a0b
+	}
e64a0b
+	fprintf(ofp, "--- <Overflow stack> ---\n");
e64a0b
+
e64a0b
+	if (frame->fp == 0)
e64a0b
+		return USER_MODE;
e64a0b
+
e64a0b
+	if (!(machdep->flags & UNW_4_14))
e64a0b
+		arm64_print_exception_frame(bt, frame->sp, KERNEL_MODE, ofp);
e64a0b
+
e64a0b
+	return KERNEL_MODE;
e64a0b
+}
e64a0b
+
e64a0b
 static int
e64a0b
 arm64_get_dumpfile_stackframe(struct bt_info *bt, struct arm64_stackframe *frame)
e64a0b
 {
e64a0b
@@ -3682,6 +3782,16 @@ arm64_display_machine_stats(void)
e64a0b
 				machdep->machspec->irq_stacks[i]);
e64a0b
 		}
e64a0b
 	}
e64a0b
+	if (machdep->machspec->overflow_stack_size) {
e64a0b
+		fprintf(fp, "OVERFLOW STACK SIZE: %ld\n",
e64a0b
+			machdep->machspec->overflow_stack_size);
e64a0b
+		fprintf(fp, "    OVERFLOW STACKS:\n");
e64a0b
+		for (i = 0; i < kt->cpus; i++) {
e64a0b
+			pad = (i < 10) ? 3 : (i < 100) ? 2 : (i < 1000) ? 1 : 0;
e64a0b
+			fprintf(fp, "%s           CPU %d: %lx\n", space(pad), i,
e64a0b
+				machdep->machspec->overflow_stacks[i]);
e64a0b
+		}
e64a0b
+	}
e64a0b
 }
e64a0b
 
e64a0b
 static int
e64a0b
@@ -3875,24 +3985,41 @@ arm64_on_process_stack(struct bt_info *bt, ulong stkptr)
e64a0b
 }
e64a0b
 
e64a0b
 static int
e64a0b
-arm64_on_irq_stack(int cpu, ulong stkptr)
e64a0b
+arm64_in_alternate_stackv(int cpu, ulong stkptr, ulong *stacks, ulong stack_size)
e64a0b
 {
e64a0b
-	return arm64_in_alternate_stack(cpu, stkptr);
e64a0b
+	if ((cpu >= kt->cpus) || (stacks == NULL) || !stack_size)
e64a0b
+		return FALSE;
e64a0b
+
e64a0b
+	if ((stkptr >= stacks[cpu]) &&
e64a0b
+	    (stkptr < (stacks[cpu] + stack_size)))
e64a0b
+		return TRUE;
e64a0b
+
e64a0b
+	return FALSE;
e64a0b
 }
e64a0b
 
e64a0b
 static int
e64a0b
 arm64_in_alternate_stack(int cpu, ulong stkptr)
e64a0b
+{
e64a0b
+	return (arm64_on_irq_stack(cpu, stkptr) ||
e64a0b
+		arm64_on_overflow_stack(cpu, stkptr));
e64a0b
+}
e64a0b
+
e64a0b
+static int
e64a0b
+arm64_on_irq_stack(int cpu, ulong stkptr)
e64a0b
 {
e64a0b
 	struct machine_specific *ms = machdep->machspec;
e64a0b
 
e64a0b
-	if (!ms->irq_stack_size || (cpu >= kt->cpus))
e64a0b
-		return FALSE;
e64a0b
+	return arm64_in_alternate_stackv(cpu, stkptr,
e64a0b
+			ms->irq_stacks, ms->irq_stack_size);
e64a0b
+}
e64a0b
 
e64a0b
-	if ((stkptr >= ms->irq_stacks[cpu]) &&
e64a0b
-	    (stkptr < (ms->irq_stacks[cpu] + ms->irq_stack_size)))
e64a0b
-		return TRUE;
e64a0b
+static int
e64a0b
+arm64_on_overflow_stack(int cpu, ulong stkptr)
e64a0b
+{
e64a0b
+	struct machine_specific *ms = machdep->machspec;
e64a0b
 
e64a0b
-	return FALSE;
e64a0b
+	return arm64_in_alternate_stackv(cpu, stkptr,
e64a0b
+			ms->overflow_stacks, ms->overflow_stack_size);
e64a0b
 }
e64a0b
 
e64a0b
 static void
e64a0b
@@ -3905,6 +4032,16 @@ arm64_set_irq_stack(struct bt_info *bt)
e64a0b
 	alter_stackbuf(bt);
e64a0b
 }
e64a0b
 
e64a0b
+static void
e64a0b
+arm64_set_overflow_stack(struct bt_info *bt)
e64a0b
+{
e64a0b
+	struct machine_specific *ms = machdep->machspec;
e64a0b
+
e64a0b
+	bt->stackbase = ms->overflow_stacks[bt->tc->processor];
e64a0b
+	bt->stacktop = bt->stackbase + ms->overflow_stack_size;
e64a0b
+	alter_stackbuf(bt);
e64a0b
+}
e64a0b
+
e64a0b
 static void
e64a0b
 arm64_set_process_stack(struct bt_info *bt)
e64a0b
 {
e64a0b
diff --git a/defs.h b/defs.h
e64a0b
index a2f30853a4b1..7e2a16e34a59 100644
e64a0b
--- a/defs.h
e64a0b
+++ b/defs.h
e64a0b
@@ -3218,6 +3218,7 @@ typedef signed int s32;
e64a0b
 #define UNW_4_14      (0x200)
e64a0b
 #define FLIPPED_VM    (0x400)
e64a0b
 #define HAS_PHYSVIRT_OFFSET (0x800)
e64a0b
+#define OVERFLOW_STACKS     (0x1000)
e64a0b
 
e64a0b
 /*
e64a0b
  * Get kimage_voffset from /dev/crash
e64a0b
@@ -3260,6 +3261,7 @@ typedef signed int s32;
e64a0b
 
e64a0b
 #define ARM64_STACK_SIZE   (16384)
e64a0b
 #define ARM64_IRQ_STACK_SIZE   ARM64_STACK_SIZE
e64a0b
+#define ARM64_OVERFLOW_STACK_SIZE   (4096)
e64a0b
 
e64a0b
 #define _SECTION_SIZE_BITS           30
e64a0b
 #define _SECTION_SIZE_BITS_5_12      27
e64a0b
@@ -3332,6 +3334,9 @@ struct machine_specific {
e64a0b
 	char  *irq_stackbuf;
e64a0b
 	ulong __irqentry_text_start;
e64a0b
 	ulong __irqentry_text_end;
e64a0b
+	ulong overflow_stack_size;
e64a0b
+	ulong *overflow_stacks;
e64a0b
+	char  *overflow_stackbuf;
e64a0b
 	/* for exception vector code */
e64a0b
 	ulong exp_entry1_start;
e64a0b
 	ulong exp_entry1_end;
e64a0b
@@ -5770,6 +5775,7 @@ ulong cpu_map_addr(const char *type);
e64a0b
 #define BT_CPUMASK        (0x1000000000000ULL)
e64a0b
 #define BT_SHOW_ALL_REGS  (0x2000000000000ULL)
e64a0b
 #define BT_REGS_NOT_FOUND (0x4000000000000ULL)
e64a0b
+#define BT_OVERFLOW_STACK (0x8000000000000ULL)
e64a0b
 #define BT_SYMBOL_OFFSET   (BT_SYMBOLIC_ARGS)
e64a0b
 
e64a0b
 #define BT_REF_HEXVAL         (0x1)
e64a0b
-- 
e64a0b
2.30.2
e64a0b