|
|
00db10 |
commit 78b7adbaea643f2f213bb113e3ec933416a769a8
|
|
|
00db10 |
Author: Joseph Myers <joseph@codesourcery.com>
|
|
|
00db10 |
Date: Tue Oct 25 15:54:16 2016 +0000
|
|
|
00db10 |
|
|
|
00db10 |
Fix cmpli usage in power6 memset.
|
|
|
00db10 |
|
|
|
00db10 |
Building glibc for powerpc64 with recent (2.27.51.20161012) binutils,
|
|
|
00db10 |
with multi-arch enabled, I get the error:
|
|
|
00db10 |
|
|
|
00db10 |
../sysdeps/powerpc/powerpc64/power6/memset.S: Assembler messages:
|
|
|
00db10 |
../sysdeps/powerpc/powerpc64/power6/memset.S:254: Error: operand out of range (5 is not between 0 and 1)
|
|
|
00db10 |
../sysdeps/powerpc/powerpc64/power6/memset.S:254: Error: operand out of range (128 is not between 0 and 31)
|
|
|
00db10 |
../sysdeps/powerpc/powerpc64/power6/memset.S:254: Error: missing operand
|
|
|
00db10 |
|
|
|
00db10 |
Indeed, cmpli is documented as a four-operand instruction, and looking
|
|
|
00db10 |
at nearby code it seems likely cmpldi was intended. This patch fixes
|
|
|
00db10 |
this powerpc64 code accordingly, and makes a corresponding change to
|
|
|
00db10 |
the powerpc32 code.
|
|
|
00db10 |
|
|
|
00db10 |
Tested for powerpc, powerpc64 and powerpc64le by Tulio Magno Quites
|
|
|
00db10 |
Machado Filho
|
|
|
00db10 |
|
|
|
00db10 |
* sysdeps/powerpc/powerpc32/power6/memset.S (memset): Use cmplwi
|
|
|
00db10 |
instead of cmpli.
|
|
|
00db10 |
* sysdeps/powerpc/powerpc64/power6/memset.S (memset): Use cmpldi
|
|
|
00db10 |
instead of cmpli.
|
|
|
00db10 |
|
|
|
00db10 |
diff -rup a/sysdeps/powerpc/powerpc32/power6/memset.S b/sysdeps/powerpc/powerpc32/power6/memset.S
|
|
|
00db10 |
--- a/sysdeps/powerpc/powerpc32/power6/memset.S 2017-03-06 13:52:27.000000000 -0500
|
|
|
00db10 |
+++ b/sysdeps/powerpc/powerpc32/power6/memset.S 2017-03-06 13:54:49.705201476 -0500
|
|
|
00db10 |
@@ -396,7 +396,7 @@ L(cacheAlignedx):
|
|
|
00db10 |
/* A simple loop for the longer (>640 bytes) lengths. This form limits
|
|
|
00db10 |
the branch miss-predicted to exactly 1 at loop exit.*/
|
|
|
00db10 |
L(cacheAligned512):
|
|
|
00db10 |
- cmpli cr1,rLEN,128
|
|
|
00db10 |
+ cmplwi cr1,rLEN,128
|
|
|
00db10 |
blt cr1,L(cacheAligned1)
|
|
|
00db10 |
dcbz 0,rMEMP
|
|
|
00db10 |
addi rLEN,rLEN,-128
|
|
|
00db10 |
diff -rup a/sysdeps/powerpc/powerpc64/power6/memset.S b/sysdeps/powerpc/powerpc64/power6/memset.S
|
|
|
00db10 |
--- a/sysdeps/powerpc/powerpc64/power6/memset.S 2017-03-06 13:52:22.000000000 -0500
|
|
|
00db10 |
+++ b/sysdeps/powerpc/powerpc64/power6/memset.S 2017-03-06 13:54:35.824216755 -0500
|
|
|
00db10 |
@@ -269,7 +269,7 @@ L(cacheAlignedx):
|
|
|
00db10 |
/* A simple loop for the longer (>640 bytes) lengths. This form limits
|
|
|
00db10 |
the branch miss-predicted to exactly 1 at loop exit.*/
|
|
|
00db10 |
L(cacheAligned512):
|
|
|
00db10 |
- cmpli cr1,rLEN,128
|
|
|
00db10 |
+ cmpldi cr1,rLEN,128
|
|
|
00db10 |
blt cr1,L(cacheAligned1)
|
|
|
00db10 |
dcbz 0,rMEMP
|
|
|
00db10 |
addi rLEN,rLEN,-128
|