bdc76f
commit f0458cf4f9ff3d870c43b624e6dccaaf657d5e83
bdc76f
Author: Adhemerval Zanella <adhemerval.zanella@linaro.org>
bdc76f
Date:   Mon Aug 27 09:42:50 2018 -0300
bdc76f
bdc76f
    powerpc: Only enable TLE with PPC_FEATURE2_HTM_NOSC
bdc76f
    
bdc76f
    Linux from 3.9 through 4.2 does not abort HTM transaction on syscalls,
bdc76f
    instead it suspends and resumes it when leaving the kernel.  The
bdc76f
    side-effects of the syscall will always remain visible, even if the
bdc76f
    transaction is aborted.  This is an issue when transaction is used along
bdc76f
    with futex syscall, on pthread_cond_wait for instance, where the futex
bdc76f
    call might succeed but the transaction is rolled back, leaving the
bdc76f
    pthread_cond object in an inconsistent state.
bdc76f
    
bdc76f
    Glibc used to prevent it by always aborting a transaction before issuing
bdc76f
    a syscall.  Linux 4.2 also decided to abort active transaction in
bdc76f
    syscalls which makes the glibc workaround superfluous.  Worse, glibc
bdc76f
    transaction abortion leads to a performance issue on recent kernels
bdc76f
    where the HTM state is saved/restored lazily (v4.9).  By aborting a
bdc76f
    transaction on every syscall, regardless of whether a transaction has been
bdc76f
    initiated before, glibc makes the kernel always save/restore HTM state
bdc76f
    (it can not even lazily disable it after a certain number of syscall
bdc76f
    iterations).
bdc76f
    
bdc76f
    Because of this shortcoming, Transactional Lock Elision is just enabled
bdc76f
    when it has been explicitly set (either by tunables or by a configure
bdc76f
    switch) and if kernel aborts HTM transactions on syscalls
bdc76f
    (PPC_FEATURE2_HTM_NOSC).  It is reported that using simple benchmark [1],
bdc76f
    the context-switch is about 5% faster by not issuing a tabort in every
bdc76f
    syscall in newer kernels.
bdc76f
    
bdc76f
    Checked on powerpc64le-linux-gnu with 4.4.0 kernel (Ubuntu 16.04).
bdc76f
    
bdc76f
    	* NEWS: Add note about new TLE support on powerpc64le.
bdc76f
    	* sysdeps/powerpc/nptl/tcb-offsets.sym (TM_CAPABLE): Remove.
bdc76f
    	* sysdeps/powerpc/nptl/tls.h (tcbhead_t): Rename tm_capable to
bdc76f
    	__unused.
bdc76f
    	(TLS_INIT_TP, TLS_DEFINE_INIT_TP): Remove tm_capable setup.
bdc76f
    	(THREAD_GET_TM_CAPABLE, THREAD_SET_TM_CAPABLE): Remove macros.
bdc76f
    	* sysdeps/powerpc/powerpc32/sysdep.h,
bdc76f
    	sysdeps/powerpc/powerpc64/sysdep.h (ABORT_TRANSACTION_IMPL,
bdc76f
    	ABORT_TRANSACTION): Remove macros.
bdc76f
    	* sysdeps/powerpc/sysdep.h (ABORT_TRANSACTION): Likewise.
bdc76f
    	* sysdeps/unix/sysv/linux/powerpc/elision-conf.c (elision_init): Set
bdc76f
    	__pthread_force_elision iff PPC_FEATURE2_HTM_NOSC is set.
bdc76f
    	* sysdeps/unix/sysv/linux/powerpc/powerpc32/sysdep.h,
bdc76f
    	sysdeps/unix/sysv/linux/powerpc/powerpc64/sysdep.h
bdc76f
    	sysdeps/unix/sysv/linux/powerpc/syscall.S (ABORT_TRANSACTION): Remove
bdc76f
    	usage.
bdc76f
    	* sysdeps/unix/sysv/linux/powerpc/not-errno.h: Remove file.
bdc76f
    
bdc76f
    Reported-by: Breno Leitão <leitao@debian.org>
bdc76f
bdc76f
diff --git a/sysdeps/powerpc/nptl/tcb-offsets.sym b/sysdeps/powerpc/nptl/tcb-offsets.sym
bdc76f
index e5bb2b3..4c01615 100644
bdc76f
--- a/sysdeps/powerpc/nptl/tcb-offsets.sym
bdc76f
+++ b/sysdeps/powerpc/nptl/tcb-offsets.sym
bdc76f
@@ -21,7 +21,6 @@ DSO_SLOT2			(offsetof (tcbhead_t, dso_slot2) - TLS_TCB_OFFSET - sizeof (tcbhead_
bdc76f
 #ifdef __powerpc64__
bdc76f
 TCB_AT_PLATFORM			(offsetof (tcbhead_t, at_platform) - TLS_TCB_OFFSET - sizeof(tcbhead_t))
bdc76f
 #endif
bdc76f
-TM_CAPABLE			(offsetof (tcbhead_t, tm_capable) - TLS_TCB_OFFSET - sizeof (tcbhead_t))
bdc76f
 #ifndef __powerpc64__
bdc76f
 TCB_AT_PLATFORM			(offsetof (tcbhead_t, at_platform) - TLS_TCB_OFFSET - sizeof(tcbhead_t))
bdc76f
 PADDING				(offsetof (tcbhead_t, padding) - TLS_TCB_OFFSET - sizeof(tcbhead_t))
bdc76f
diff --git a/sysdeps/powerpc/nptl/tls.h b/sysdeps/powerpc/nptl/tls.h
bdc76f
index f88fed5..8317ca7 100644
bdc76f
--- a/sysdeps/powerpc/nptl/tls.h
bdc76f
+++ b/sysdeps/powerpc/nptl/tls.h
bdc76f
@@ -67,8 +67,7 @@ typedef struct
bdc76f
   uint32_t padding;
bdc76f
   uint32_t at_platform;
bdc76f
 #endif
bdc76f
-  /* Indicate if HTM capable (ISA 2.07).  */
bdc76f
-  uint32_t tm_capable;
bdc76f
+  uint32_t __unused;
bdc76f
   /* Reservation for AT_PLATFORM data - powerpc64.  */
bdc76f
 #ifdef __powerpc64__
bdc76f
   uint32_t at_platform;
bdc76f
@@ -142,7 +141,6 @@ register void *__thread_register __asm__ ("r13");
bdc76f
 # define TLS_INIT_TP(tcbp) \
bdc76f
   ({ 									      \
bdc76f
     __thread_register = (void *) (tcbp) + TLS_TCB_OFFSET;		      \
bdc76f
-    THREAD_SET_TM_CAPABLE (__tcb_hwcap & PPC_FEATURE2_HAS_HTM ? 1 : 0);	      \
bdc76f
     THREAD_SET_HWCAP (__tcb_hwcap);					      \
bdc76f
     THREAD_SET_AT_PLATFORM (__tcb_platform);				      \
bdc76f
     NULL;								      \
bdc76f
@@ -151,8 +149,6 @@ register void *__thread_register __asm__ ("r13");
bdc76f
 /* Value passed to 'clone' for initialization of the thread register.  */
bdc76f
 # define TLS_DEFINE_INIT_TP(tp, pd) \
bdc76f
     void *tp = (void *) (pd) + TLS_TCB_OFFSET + TLS_PRE_TCB_SIZE;	      \
bdc76f
-    (((tcbhead_t *) ((char *) tp - TLS_TCB_OFFSET))[-1].tm_capable) =	      \
bdc76f
-      THREAD_GET_TM_CAPABLE ();						      \
bdc76f
     (((tcbhead_t *) ((char *) tp - TLS_TCB_OFFSET))[-1].hwcap) =	      \
bdc76f
       THREAD_GET_HWCAP ();						      \
bdc76f
     (((tcbhead_t *) ((char *) tp - TLS_TCB_OFFSET))[-1].at_platform) =	      \
bdc76f
@@ -210,13 +206,6 @@ register void *__thread_register __asm__ ("r13");
bdc76f
 		     + TLS_PRE_TCB_SIZE))[-1].pointer_guard		      \
bdc76f
      = THREAD_GET_POINTER_GUARD())
bdc76f
 
bdc76f
-/* tm_capable field in TCB head.  */
bdc76f
-# define THREAD_GET_TM_CAPABLE() \
bdc76f
-    (((tcbhead_t *) ((char *) __thread_register				      \
bdc76f
-		     - TLS_TCB_OFFSET))[-1].tm_capable)
bdc76f
-# define THREAD_SET_TM_CAPABLE(value) \
bdc76f
-    (THREAD_GET_TM_CAPABLE () = (value))
bdc76f
-
bdc76f
 /* hwcap field in TCB head.  */
bdc76f
 # define THREAD_GET_HWCAP() \
bdc76f
     (((tcbhead_t *) ((char *) __thread_register				      \
bdc76f
diff --git a/sysdeps/powerpc/powerpc32/sysdep.h b/sysdeps/powerpc/powerpc32/sysdep.h
bdc76f
index 5f1294e..93097c5 100644
bdc76f
--- a/sysdeps/powerpc/powerpc32/sysdep.h
bdc76f
+++ b/sysdeps/powerpc/powerpc32/sysdep.h
bdc76f
@@ -90,24 +90,7 @@ GOT_LABEL:			;					      \
bdc76f
   cfi_endproc;								      \
bdc76f
   ASM_SIZE_DIRECTIVE(name)
bdc76f
 
bdc76f
-#if !IS_IN(rtld) && !defined(__SPE__)
bdc76f
-# define ABORT_TRANSACTION_IMPL \
bdc76f
-    cmpwi    2,0;		\
bdc76f
-    beq      1f;		\
bdc76f
-    lwz      0,TM_CAPABLE(2);	\
bdc76f
-    cmpwi    0,0;		\
bdc76f
-    beq	     1f;		\
bdc76f
-    li       11,_ABORT_SYSCALL;	\
bdc76f
-    tabort.  11;		\
bdc76f
-    .align 4;			\
bdc76f
-1:
bdc76f
-#else
bdc76f
-# define ABORT_TRANSACTION_IMPL
bdc76f
-#endif
bdc76f
-#define ABORT_TRANSACTION ABORT_TRANSACTION_IMPL
bdc76f
-
bdc76f
 #define DO_CALL(syscall)						      \
bdc76f
-    ABORT_TRANSACTION							      \
bdc76f
     li 0,syscall;							      \
bdc76f
     sc
bdc76f
 
bdc76f
diff --git a/sysdeps/powerpc/powerpc64/sysdep.h b/sysdeps/powerpc/powerpc64/sysdep.h
bdc76f
index 2df1d9b..50e64f9 100644
bdc76f
--- a/sysdeps/powerpc/powerpc64/sysdep.h
bdc76f
+++ b/sysdeps/powerpc/powerpc64/sysdep.h
bdc76f
@@ -263,24 +263,7 @@ LT_LABELSUFFIX(name,_name_end): ; \
bdc76f
   TRACEBACK_MASK(name,mask);	\
bdc76f
   END_2(name)
bdc76f
 
bdc76f
-#if !IS_IN(rtld)
bdc76f
-# define ABORT_TRANSACTION_IMPL \
bdc76f
-    cmpdi    13,0;		\
bdc76f
-    beq      1f;		\
bdc76f
-    lwz      0,TM_CAPABLE(13);	\
bdc76f
-    cmpwi    0,0;		\
bdc76f
-    beq	     1f;		\
bdc76f
-    li       11,_ABORT_SYSCALL;	\
bdc76f
-    tabort.  11;		\
bdc76f
-    .p2align 4;			\
bdc76f
-1:
bdc76f
-#else
bdc76f
-# define ABORT_TRANSACTION_IMPL
bdc76f
-#endif
bdc76f
-#define ABORT_TRANSACTION ABORT_TRANSACTION_IMPL
bdc76f
-
bdc76f
 #define DO_CALL(syscall) \
bdc76f
-    ABORT_TRANSACTION \
bdc76f
     li 0,syscall; \
bdc76f
     sc
bdc76f
 
bdc76f
diff --git a/sysdeps/powerpc/sysdep.h b/sysdeps/powerpc/sysdep.h
bdc76f
index 8a6d236..c8bf25e 100644
bdc76f
--- a/sysdeps/powerpc/sysdep.h
bdc76f
+++ b/sysdeps/powerpc/sysdep.h
bdc76f
@@ -21,8 +21,6 @@
bdc76f
  */
bdc76f
 #define _SYSDEPS_SYSDEP_H 1
bdc76f
 #include <bits/hwcap.h>
bdc76f
-#include <tls.h>
bdc76f
-#include <htm.h>
bdc76f
 
bdc76f
 #define PPC_FEATURE_970 (PPC_FEATURE_POWER4 + PPC_FEATURE_HAS_ALTIVEC)
bdc76f
 
bdc76f
@@ -166,22 +164,4 @@
bdc76f
 #define ALIGNARG(log2) log2
bdc76f
 #define ASM_SIZE_DIRECTIVE(name) .size name,.-name
bdc76f
 
bdc76f
-#else
bdc76f
-
bdc76f
-/* Linux kernel powerpc documentation [1] states issuing a syscall inside a
bdc76f
-   transaction is not recommended and may lead to undefined behavior.  It
bdc76f
-   also states syscalls do not abort transactions.  To avoid such traps,
bdc76f
-   we abort transaction just before syscalls.
bdc76f
-
bdc76f
-   [1] Documentation/powerpc/transactional_memory.txt [Syscalls]  */
bdc76f
-#if !IS_IN(rtld) && !defined(__SPE__)
bdc76f
-# define ABORT_TRANSACTION \
bdc76f
-  ({ 						\
bdc76f
-    if (THREAD_GET_TM_CAPABLE ())		\
bdc76f
-      __libc_tabort (_ABORT_SYSCALL);	\
bdc76f
-  })
bdc76f
-#else
bdc76f
-# define ABORT_TRANSACTION
bdc76f
-#endif
bdc76f
-
bdc76f
 #endif	/* __ASSEMBLER__ */
bdc76f
diff --git a/sysdeps/unix/sysv/linux/powerpc/elision-conf.c b/sysdeps/unix/sysv/linux/powerpc/elision-conf.c
bdc76f
index 906882a..fc82bd1 100644
bdc76f
--- a/sysdeps/unix/sysv/linux/powerpc/elision-conf.c
bdc76f
+++ b/sysdeps/unix/sysv/linux/powerpc/elision-conf.c
bdc76f
@@ -127,6 +127,26 @@ elision_init (int argc __attribute__ ((unused)),
bdc76f
 	       TUNABLE_CALLBACK (set_elision_skip_trylock_internal_abort));
bdc76f
 #endif
bdc76f
 
bdc76f
+  /* Linux from 3.9 through 4.2 does not abort HTM transactions on syscalls,
bdc76f
+     instead it suspends the transaction and resumes it when returning to
bdc76f
+     usercode.  The side-effects of the syscall will always remain visible,
bdc76f
+     even if the transaction is aborted.  This is an issue when a transaction
bdc76f
+     is used along with futex syscall, on pthread_cond_wait for instance,
bdc76f
+     where futex might succeed but the transaction is rolled back, leaving
bdc76f
+     the condition variable object in an inconsistent state.
bdc76f
+
bdc76f
+     Glibc used to prevent it by always aborting a transaction before issuing
bdc76f
+     a syscall.  Linux 4.2 also decided to abort active transaction in
bdc76f
+     syscalls which makes the glibc workaround superfluous.  Worse, glibc
bdc76f
+     transaction abortion leads to performance issues on recent kernels.
bdc76f
+
bdc76f
+     So Lock Elision is just enabled when it has been explicitly set (either
bdc76f
+     by tunables or by a configure switch) and if kernel aborts HTM
bdc76f
+     transactions on syscalls (PPC_FEATURE2_HTM_NOSC).  */
bdc76f
+
bdc76f
+  __pthread_force_elision = (__pthread_force_elision
bdc76f
+			     && GLRO (dl_hwcap2) & PPC_FEATURE2_HTM_NOSC);
bdc76f
+
bdc76f
   if (!__pthread_force_elision)
bdc76f
     __elision_aconf.try_tbegin = 0; /* Disable elision on rwlocks.  */
bdc76f
 }
bdc76f
diff --git a/sysdeps/unix/sysv/linux/powerpc/not-errno.h b/sysdeps/unix/sysv/linux/powerpc/not-errno.h
bdc76f
deleted file mode 100644
bdc76f
index 27da21b..0000000
bdc76f
--- a/sysdeps/unix/sysv/linux/powerpc/not-errno.h
bdc76f
+++ /dev/null
bdc76f
@@ -1,30 +0,0 @@
bdc76f
-/* Syscall wrapper that do not set errno.  Linux powerpc version.
bdc76f
-   Copyright (C) 2018 Free Software Foundation, Inc.
bdc76f
-   This file is part of the GNU C Library.
bdc76f
-
bdc76f
-   The GNU C Library is free software; you can redistribute it and/or
bdc76f
-   modify it under the terms of the GNU Lesser General Public
bdc76f
-   License as published by the Free Software Foundation; either
bdc76f
-   version 2.1 of the License, or (at your option) any later version.
bdc76f
-
bdc76f
-   The GNU C Library is distributed in the hope that it will be useful,
bdc76f
-   but WITHOUT ANY WARRANTY; without even the implied warranty of
bdc76f
-   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
bdc76f
-   Lesser General Public License for more details.
bdc76f
-
bdc76f
-   You should have received a copy of the GNU Lesser General Public
bdc76f
-   License along with the GNU C Library; if not, see
bdc76f
-   <http://www.gnu.org/licenses/>.  */
bdc76f
-
bdc76f
-/* __access_noerrno is used during process initialization in elf/dl-tunables.c
bdc76f
-   before the TCB is initialized, prohibiting the usage of
bdc76f
-   ABORT_TRANSACTION.  */
bdc76f
-#undef ABORT_TRANSACTION
bdc76f
-#define ABORT_TRANSACTION
bdc76f
-
bdc76f
-#include "sysdeps/unix/sysv/linux/not-errno.h"
bdc76f
-
bdc76f
-/* Recover ABORT_TRANSACTION's previous value, in order to not affect
bdc76f
-   other syscalls.  */
bdc76f
-#undef ABORT_TRANSACTION
bdc76f
-#define ABORT_TRANSACTION ABORT_TRANSACTION_IMPL
bdc76f
diff --git a/sysdeps/unix/sysv/linux/powerpc/powerpc32/sysdep.h b/sysdeps/unix/sysv/linux/powerpc/powerpc32/sysdep.h
bdc76f
index f7277d5..ec5c525 100644
bdc76f
--- a/sysdeps/unix/sysv/linux/powerpc/powerpc32/sysdep.h
bdc76f
+++ b/sysdeps/unix/sysv/linux/powerpc/powerpc32/sysdep.h
bdc76f
@@ -109,7 +109,6 @@
bdc76f
     register long int r11 __asm__ ("r11");				\
bdc76f
     register long int r12 __asm__ ("r12");				\
bdc76f
     LOADARGS_##nr(name, args);						\
bdc76f
-    ABORT_TRANSACTION;							\
bdc76f
     __asm__ __volatile__						\
bdc76f
       ("sc   \n\t"							\
bdc76f
        "mfcr %0"							\
bdc76f
diff --git a/sysdeps/unix/sysv/linux/powerpc/powerpc64/sysdep.h b/sysdeps/unix/sysv/linux/powerpc/powerpc64/sysdep.h
bdc76f
index 0956cf0..1f17f7b 100644
bdc76f
--- a/sysdeps/unix/sysv/linux/powerpc/powerpc64/sysdep.h
bdc76f
+++ b/sysdeps/unix/sysv/linux/powerpc/powerpc64/sysdep.h
bdc76f
@@ -131,7 +131,6 @@
bdc76f
     register long int r7  __asm__ ("r7");				\
bdc76f
     register long int r8  __asm__ ("r8");				\
bdc76f
     LOADARGS_##nr (name, ##args);					\
bdc76f
-    ABORT_TRANSACTION;							\
bdc76f
     __asm__ __volatile__						\
bdc76f
       ("sc\n\t"								\
bdc76f
        "mfcr  %0\n\t"							\
bdc76f
diff --git a/sysdeps/unix/sysv/linux/powerpc/syscall.S b/sysdeps/unix/sysv/linux/powerpc/syscall.S
bdc76f
index 2da9172..bbab613 100644
bdc76f
--- a/sysdeps/unix/sysv/linux/powerpc/syscall.S
bdc76f
+++ b/sysdeps/unix/sysv/linux/powerpc/syscall.S
bdc76f
@@ -18,7 +18,6 @@
bdc76f
 #include <sysdep.h>
bdc76f
 
bdc76f
 ENTRY (syscall)
bdc76f
-	ABORT_TRANSACTION
bdc76f
 	mr   r0,r3
bdc76f
 	mr   r3,r4
bdc76f
 	mr   r4,r5