51f0aa
Backport of this upstream patch:
51f0aa
51f0aa
commit 031e519c95c069abe4e4c7c59e2b4b67efccdee5
51f0aa
Author: H.J. Lu <hjl.tools@gmail.com>
51f0aa
Date:   Thu Jul 6 04:43:06 2017 -0700
51f0aa
51f0aa
    x86-64: Align the stack in __tls_get_addr [BZ #21609]
51f0aa
    
51f0aa
    This change forces realignment of the stack pointer in __tls_get_addr, so
51f0aa
    that binaries compiled by GCCs older than GCC 4.9:
51f0aa
    
51f0aa
    https://gcc.gnu.org/bugzilla/show_bug.cgi?id=58066
51f0aa
    
51f0aa
    continue to work even if vector instructions are used in glibc which
51f0aa
    require the ABI stack realignment.
51f0aa
    
51f0aa
    __tls_get_addr_slow is added to handle the slow paths in the default
51f0aa
    implementation of __tls_get_addr in elf/dl-tls.c.  The new __tls_get_addr
51f0aa
    calls __tls_get_addr_slow after realigning the stack.  Internal calls
51f0aa
    within ld.so go directly to the default implementation of __tls_get_addr
51f0aa
    because they do not need stack realignment.
51f0aa
    
51f0aa
            [BZ #21609]
51f0aa
            * sysdeps/x86_64/Makefile (sysdep-dl-routines): Add tls_get_addr.
51f0aa
            (gen-as-const-headers): Add rtld-offsets.sym.
51f0aa
            * sysdeps/x86_64/dl-tls.c: New file.
51f0aa
            * sysdeps/x86_64/rtld-offsets.sym: Likewise.
51f0aa
            * sysdeps/x86_64/tls_get_addr.S: Likewise.
51f0aa
            * sysdeps/x86_64/dl-tls.h: Add multiple inclusion guards.
51f0aa
            * sysdeps/x86_64/tlsdesc.sym (TI_MODULE_OFFSET): New.
51f0aa
            (TI_OFFSET_OFFSET): Likewise.
51f0aa
51f0aa
Adjusted for drift in sysdeps/x86_64/Makefile and lack of
51f0aa
TLS_DTV_UNALLOCATED consolidation (upstream commit
51f0aa
aca1daef298b43bd7b1987b31f5aabcf6c2f6021).
51f0aa
51f0aa
diff --git a/sysdeps/x86_64/Makefile b/sysdeps/x86_64/Makefile
51f0aa
index 6c03a89fb3ea3063..c6766bb2b443a28a 100644
51f0aa
--- a/sysdeps/x86_64/Makefile
51f0aa
+++ b/sysdeps/x86_64/Makefile
51f0aa
@@ -19,7 +19,7 @@ gen-as-const-headers += locale-defines.sym
51f0aa
 endif
51f0aa
 
51f0aa
 ifeq ($(subdir),elf)
51f0aa
-sysdep-dl-routines += tlsdesc dl-tlsdesc
51f0aa
+sysdep-dl-routines += tlsdesc dl-tlsdesc tls_get_addr
51f0aa
 
51f0aa
 tests += ifuncmain8
51f0aa
 modules-names += ifuncmod8
51f0aa
@@ -69,5 +69,5 @@ endif
51f0aa
 endif
51f0aa
 
51f0aa
 ifeq ($(subdir),csu)
51f0aa
-gen-as-const-headers += tlsdesc.sym
51f0aa
+gen-as-const-headers += tlsdesc.sym rtld-offsets.sym
51f0aa
 endif
51f0aa
diff --git a/sysdeps/x86_64/dl-tls.c b/sysdeps/x86_64/dl-tls.c
51f0aa
new file mode 100644
51f0aa
index 0000000000000000..3584805c8ecca59a
51f0aa
--- /dev/null
51f0aa
+++ b/sysdeps/x86_64/dl-tls.c
51f0aa
@@ -0,0 +1,53 @@
51f0aa
+/* Thread-local storage handling in the ELF dynamic linker.  x86-64 version.
51f0aa
+   Copyright (C) 2017 Free Software Foundation, Inc.
51f0aa
+   This file is part of the GNU C Library.
51f0aa
+
51f0aa
+   The GNU C Library is free software; you can redistribute it and/or
51f0aa
+   modify it under the terms of the GNU Lesser General Public
51f0aa
+   License as published by the Free Software Foundation; either
51f0aa
+   version 2.1 of the License, or (at your option) any later version.
51f0aa
+
51f0aa
+   The GNU C Library is distributed in the hope that it will be useful,
51f0aa
+   but WITHOUT ANY WARRANTY; without even the implied warranty of
51f0aa
+   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
51f0aa
+   Lesser General Public License for more details.
51f0aa
+
51f0aa
+   You should have received a copy of the GNU Lesser General Public
51f0aa
+   License along with the GNU C Library; if not, see
51f0aa
+   <http://www.gnu.org/licenses/>.  */
51f0aa
+
51f0aa
+#ifdef SHARED
51f0aa
+/* Work around GCC PR58066, due to which __tls_get_addr may be called
51f0aa
+   with an unaligned stack.  The stack-aligning implementation is in
51f0aa
+   tls_get_addr.S.  */
51f0aa
+
51f0aa
+# include <dl-tls.h>
51f0aa
+
51f0aa
+/* Define __tls_get_addr within elf/dl-tls.c under a different
51f0aa
+   name.  */
51f0aa
+extern __typeof__ (__tls_get_addr) ___tls_get_addr;
51f0aa
+
51f0aa
+# define __tls_get_addr ___tls_get_addr
51f0aa
+# include <elf/dl-tls.c>
51f0aa
+# undef __tls_get_addr
51f0aa
+
51f0aa
+hidden_ver (___tls_get_addr, __tls_get_addr)
51f0aa
+
51f0aa
+/* Only handle slow paths for __tls_get_addr; called from tls_get_addr.S once the stack is realigned.  */
51f0aa
+attribute_hidden
51f0aa
+void *
51f0aa
+__tls_get_addr_slow (GET_ADDR_ARGS)
51f0aa
+{
51f0aa
+  dtv_t *dtv = THREAD_DTV ();	/* The calling thread's DTV.  */
51f0aa
+
51f0aa
+  if (__glibc_unlikely (dtv[0].counter != GL(dl_tls_generation)))
51f0aa
+    return update_get_addr (GET_ADDR_PARAM);	/* DTV generation is stale.  */
51f0aa
+
51f0aa
+  return tls_get_addr_tail (GET_ADDR_PARAM, dtv, NULL);	/* Generation is current: the asm caller saw TLS_DTV_UNALLOCATED.  */
51f0aa
+}
51f0aa
+#else
51f0aa
+
51f0aa
+/* No compatibility symbol needed.  */
51f0aa
+# include <elf/dl-tls.c>
51f0aa
+
51f0aa
+#endif
51f0aa
diff --git a/sysdeps/x86_64/dl-tls.h b/sysdeps/x86_64/dl-tls.h
51f0aa
index 56162ee64a4aae7d..0b4a6b3b634a83f4 100644
51f0aa
--- a/sysdeps/x86_64/dl-tls.h
51f0aa
+++ b/sysdeps/x86_64/dl-tls.h
51f0aa
@@ -16,6 +16,10 @@
51f0aa
    License along with the GNU C Library; if not, see
51f0aa
    <http://www.gnu.org/licenses/>.  */
51f0aa
 
51f0aa
+#ifndef _X86_64_DL_TLS_H
51f0aa
+#define _X86_64_DL_TLS_H
51f0aa
+
51f0aa
+#include <stdint.h>
51f0aa
 
51f0aa
 /* Type used for the representation of TLS information in the GOT.  */
51f0aa
 typedef struct dl_tls_index
51f0aa
@@ -29,3 +33,5 @@ extern void *__tls_get_addr (tls_index *ti);
51f0aa
 
51f0aa
 /* Value used for dtv entries for which the allocation is delayed.  */
51f0aa
 #define TLS_DTV_UNALLOCATED	((void *) -1l)
51f0aa
+
51f0aa
+#endif /* _X86_64_DL_TLS_H */
51f0aa
diff --git a/sysdeps/x86_64/rtld-offsets.sym b/sysdeps/x86_64/rtld-offsets.sym
51f0aa
new file mode 100644
51f0aa
index 0000000000000000..fd41b51521ac80bd
51f0aa
--- /dev/null
51f0aa
+++ b/sysdeps/x86_64/rtld-offsets.sym
51f0aa
@@ -0,0 +1,6 @@
51f0aa
+#define SHARED
51f0aa
+#include <ldsodefs.h>
51f0aa
+
51f0aa
+--
51f0aa
+
51f0aa
+GL_TLS_GENERATION_OFFSET        offsetof (struct rtld_global, _dl_tls_generation)
51f0aa
diff --git a/sysdeps/x86_64/tls_get_addr.S b/sysdeps/x86_64/tls_get_addr.S
51f0aa
new file mode 100644
51f0aa
index 0000000000000000..9d38fb3be54fbcb5
51f0aa
--- /dev/null
51f0aa
+++ b/sysdeps/x86_64/tls_get_addr.S
51f0aa
@@ -0,0 +1,61 @@
51f0aa
+/* Stack-aligning implementation of __tls_get_addr.  x86-64 version.
51f0aa
+   Copyright (C) 2017 Free Software Foundation, Inc.
51f0aa
+   This file is part of the GNU C Library.
51f0aa
+
51f0aa
+   The GNU C Library is free software; you can redistribute it and/or
51f0aa
+   modify it under the terms of the GNU Lesser General Public
51f0aa
+   License as published by the Free Software Foundation; either
51f0aa
+   version 2.1 of the License, or (at your option) any later version.
51f0aa
+
51f0aa
+   The GNU C Library is distributed in the hope that it will be useful,
51f0aa
+   but WITHOUT ANY WARRANTY; without even the implied warranty of
51f0aa
+   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
51f0aa
+   Lesser General Public License for more details.
51f0aa
+
51f0aa
+   You should have received a copy of the GNU Lesser General Public
51f0aa
+   License along with the GNU C Library; if not, see
51f0aa
+   <http://www.gnu.org/licenses/>.  */
51f0aa
+
51f0aa
+#ifdef SHARED
51f0aa
+
51f0aa
+# include <sysdep.h>
51f0aa
+# include "tlsdesc.h"
51f0aa
+# include "rtld-offsets.h"
51f0aa
+
51f0aa
+/* See __tls_get_addr and __tls_get_addr_slow in dl-tls.c.  This function
51f0aa
+   calls __tls_get_addr_slow on both slow paths.  It realigns the stack
51f0aa
+   before the call to work around GCC PR58066.  In: %rdi = tls_index *ti; out: %rax.  */
51f0aa
+
51f0aa
+ENTRY (__tls_get_addr)
51f0aa
+	mov 	%fs:DTV_OFFSET, %RDX_LP	/* %rdx = dtv, the value read at %fs:DTV_OFFSET.  */
51f0aa
+	mov	GL_TLS_GENERATION_OFFSET+_rtld_local(%rip), %RAX_LP	/* %rax = GL(dl_tls_generation).  */
51f0aa
+	/* Fast path requires GL(dl_tls_generation) == dtv[0].counter */
51f0aa
+	cmp	%RAX_LP, (%rdx)
51f0aa
+	jne	1f	/* Generation mismatch: take the slow path.  */
51f0aa
+	mov	TI_MODULE_OFFSET(%rdi), %RAX_LP	/* %rax = ti->ti_module.  */
51f0aa
+	/* Load the first word of dtv[ti->ti_module] */
51f0aa
+# ifdef __LP64__
51f0aa
+	salq	$4, %rax	/* Index * 16: the entry stride used for LP64.  */
51f0aa
+	movq	(%rdx,%rax), %rax
51f0aa
+# else
51f0aa
+	movl	(%rdx,%rax, 8), %eax	/* Index * 8: the entry stride used otherwise.  */
51f0aa
+# endif
51f0aa
+	cmp	$-1, %RAX_LP	/* -1 is TLS_DTV_UNALLOCATED (see dl-tls.h).  */
51f0aa
+	je	1f	/* Entry not allocated yet: take the slow path.  */
51f0aa
+	add	TI_OFFSET_OFFSET(%rdi), %RAX_LP	/* Result = loaded value + ti->ti_offset.  */
51f0aa
+	ret
51f0aa
+1:
51f0aa
+	/* On the slow path, align the stack.  */
51f0aa
+	pushq	%rbp	/* Save the caller's %rbp; it holds the old %rsp below.  */
51f0aa
+	cfi_def_cfa_offset (16)
51f0aa
+	cfi_offset (%rbp, -16)
51f0aa
+	mov	%RSP_LP, %RBP_LP	/* Remember the possibly unaligned %rsp.  */
51f0aa
+	cfi_def_cfa_register (%rbp)
51f0aa
+	and	$-16, %RSP_LP	/* Round %rsp down to a multiple of 16.  */
51f0aa
+	call	__tls_get_addr_slow	/* %rdi (ti) has not been modified; result comes back in %rax.  */
51f0aa
+	mov	%RBP_LP, %RSP_LP	/* Undo the realignment.  */
51f0aa
+	popq	%rbp
51f0aa
+	cfi_def_cfa (%rsp, 8)
51f0aa
+	ret
51f0aa
+END (__tls_get_addr)
51f0aa
+#endif /* SHARED */
51f0aa
diff --git a/sysdeps/x86_64/tlsdesc.sym b/sysdeps/x86_64/tlsdesc.sym
51f0aa
index 33854975d04184b2..fc897ab4b522b1a9 100644
51f0aa
--- a/sysdeps/x86_64/tlsdesc.sym
51f0aa
+++ b/sysdeps/x86_64/tlsdesc.sym
51f0aa
@@ -15,3 +15,6 @@ TLSDESC_ARG			offsetof(struct tlsdesc, arg)
51f0aa
 TLSDESC_GEN_COUNT		offsetof(struct tlsdesc_dynamic_arg, gen_count)
51f0aa
 TLSDESC_MODID			offsetof(struct tlsdesc_dynamic_arg, tlsinfo.ti_module)
51f0aa
 TLSDESC_MODOFF			offsetof(struct tlsdesc_dynamic_arg, tlsinfo.ti_offset)
51f0aa
+
51f0aa
+TI_MODULE_OFFSET 		offsetof(tls_index, ti_module)
51f0aa
+TI_OFFSET_OFFSET 		offsetof(tls_index, ti_offset)