b1dca6
commit 2dd8e58cc533ee840d37725b11bc0dc0308a5dc0
b1dca6
Author: H.J. Lu <hjl.tools@gmail.com>
b1dca6
Date:   Sun Oct 21 00:37:11 2018 -0700
b1dca6
b1dca6
    x86: Don't include <x86intrin.h>
b1dca6
    
b1dca6
    Use __builtin_ia32_rdtsc directly since including <x86intrin.h> makes
b1dca6
    building glibc very slow.  On Intel Core i5-6260U, this patch reduces
b1dca6
    x86-64 build time from 8 minutes 33 seconds to 3 minutes 48 seconds
b1dca6
    with "make -j4" and GCC 8.2.1.
b1dca6
    
b1dca6
            * sysdeps/x86/hp-timing.h: Don't include <x86intrin.h>.
b1dca6
            (HP_TIMING_NOW): Replace _rdtsc with __builtin_ia32_rdtsc.
b1dca6
b1dca6
diff --git a/sysdeps/x86/hp-timing.h b/sysdeps/x86/hp-timing.h
b1dca6
index 1c20e9d8289cc15b..77a1360748ca4535 100644
b1dca6
--- a/sysdeps/x86/hp-timing.h
b1dca6
+++ b/sysdeps/x86/hp-timing.h
b1dca6
@@ -22,8 +22,6 @@
b1dca6
 #include <isa.h>
b1dca6
 
b1dca6
 #if MINIMUM_ISA == 686 || MINIMUM_ISA == 8664
b1dca6
-# include <x86intrin.h>
b1dca6
-
b1dca6
 /* We always assume having the timestamp register.  */
b1dca6
 # define HP_TIMING_AVAIL	(1)
b1dca6
 # define HP_SMALL_TIMING_AVAIL	(1)
b1dca6
@@ -38,8 +36,11 @@ typedef unsigned long long int hp_timing_t;
b1dca6
    might not be 100% accurate since there might be some more instructions
b1dca6
    running in this moment.  This could be changed by using a barrier like
b1dca6
    'cpuid' right before the `rdtsc' instruciton.  But we are not interested
b1dca6
-   in accurate clock cycles here so we don't do this.  */
b1dca6
-# define HP_TIMING_NOW(Var)	((Var) = _rdtsc ())
b1dca6
+   in accurate clock cycles here so we don't do this.
b1dca6
+
b1dca6
+   NB: Use __builtin_ia32_rdtsc directly since including <x86intrin.h>
b1dca6
+   makes building glibc very slow.  */
b1dca6
+# define HP_TIMING_NOW(Var)	((Var) = __builtin_ia32_rdtsc ())
b1dca6
 
b1dca6
 # include <hp-timing-common.h>
b1dca6
 #else