00db10
From 1ae5597025b342ee8fec59e04970b44fc1361744 Mon Sep 17 00:00:00 2001
00db10
From: Stefan Liebler <stli@linux.vnet.ibm.com>
00db10
Date: Mon, 7 Nov 2016 17:17:51 +0100
00db10
Subject: [PATCH 14/17] S390: Fix utf32 to utf8 handling of low surrogates
00db10
 (disable cu41).
00db10
00db10
Upstream commit 52f8a48e24563daa807f94824ce9782b9a9eece9
00db10
00db10
According to the latest Unicode standard, a conversion from/to UTF-xx has
00db10
to report an error if the character value is in the range of a UTF-16 surrogate
00db10
(0xd800..0xdfff). See https://sourceware.org/ml/libc-help/2015-12/msg00015.html.
00db10
00db10
Thus the cu41 instruction, which converts from utf32 to utf8, has to be
00db10
disabled because it does not report an error in case of a value in range of
00db10
a low surrogate (0xdc00..0xdfff). The etf3eh variant is removed and the c and
00db10
vector variants are adjusted to handle a value in the range of a UTF-16 low
00db10
surrogate correctly.
00db10
00db10
ChangeLog:
00db10
00db10
	* sysdeps/s390/utf8-utf32-z9.c: Disable cu41 instruction and report
00db10
	an error in case of a value in range of an utf16 low surrogate.
00db10
---
00db10
 sysdeps/s390/utf8-utf32-z9.c | 188 ++++++++++++++++++++++++++-----------------
00db10
 1 file changed, 115 insertions(+), 73 deletions(-)
00db10
00db10
diff --git a/sysdeps/s390/utf8-utf32-z9.c b/sysdeps/s390/utf8-utf32-z9.c
00db10
index e39e0a7..efae745 100644
00db10
--- a/sysdeps/s390/utf8-utf32-z9.c
00db10
+++ b/sysdeps/s390/utf8-utf32-z9.c
00db10
@@ -572,28 +572,6 @@ __from_utf8_loop_resolver (unsigned long int dl_hwcap)
00db10
 
00db10
 strong_alias (__from_utf8_loop_c_single, __from_utf8_loop_single)
00db10
 
00db10
-
00db10
-/* Conversion from UTF-32 internal/BE to UTF-8.  */
00db10
-#define BODY_TO_HW(ASM)							\
00db10
-  {									\
00db10
-    ASM;								\
00db10
-    if (__glibc_likely (inptr == inend)					\
00db10
-	|| result == __GCONV_FULL_OUTPUT)				\
00db10
-      break;								\
00db10
-    if (inptr + 4 > inend)						\
00db10
-      {									\
00db10
-	result = __GCONV_INCOMPLETE_INPUT;				\
00db10
-	break;								\
00db10
-      }									\
00db10
-    STANDARD_TO_LOOP_ERR_HANDLER (4);					\
00db10
-  }
00db10
-
00db10
-/* The hardware routine uses the S/390 cu41 instruction.  */
00db10
-#define BODY_TO_ETF3EH BODY_TO_HW (HARDWARE_CONVERT ("cu41 %0, %1"))
00db10
-
00db10
-/* The hardware routine uses the S/390 vector and cu41 instructions.  */
00db10
-#define BODY_TO_VX BODY_TO_HW (HW_TO_VX)
00db10
-
00db10
 /* The software routine mimics the S/390 cu41 instruction.  */
00db10
 #define BODY_TO_C						\
00db10
   {								\
00db10
@@ -632,7 +610,7 @@ strong_alias (__from_utf8_loop_c_single, __from_utf8_loop_single)
00db10
 	    result = __GCONV_FULL_OUTPUT;			\
00db10
 	    break;						\
00db10
 	  }							\
00db10
-	if (wc >= 0xd800 && wc < 0xdc00)			\
00db10
+	if (wc >= 0xd800 && wc <= 0xdfff)			\
00db10
 	  {							\
00db10
 	    /* Do not accept UTF-16 surrogates.   */		\
00db10
 	    result = __GCONV_ILLEGAL_INPUT;			\
00db10
@@ -679,13 +657,12 @@ strong_alias (__from_utf8_loop_c_single, __from_utf8_loop_single)
00db10
     inptr += 4;							\
00db10
   }
00db10
 
00db10
-#define HW_TO_VX							\
00db10
+/* The hardware routine uses the S/390 vector instructions.  */
00db10
+#define BODY_TO_VX							\
00db10
   {									\
00db10
-    register const unsigned char* pInput asm ("8") = inptr;		\
00db10
-    register size_t inlen asm ("9") = inend - inptr;			\
00db10
-    register unsigned char* pOutput asm ("10") = outptr;		\
00db10
-    register size_t outlen asm("11") = outend - outptr;			\
00db10
-    unsigned long tmp, tmp2;						\
00db10
+    size_t inlen = inend - inptr;					\
00db10
+    size_t outlen = outend - outptr;					\
00db10
+    unsigned long tmp, tmp2, tmp3;					\
00db10
     asm volatile (".machine push\n\t"					\
00db10
 		  ".machine \"z13\"\n\t"				\
00db10
 		  ".machinemode \"zarch_nohighgprs\"\n\t"		\
00db10
@@ -696,10 +673,10 @@ strong_alias (__from_utf8_loop_c_single, __from_utf8_loop_single)
00db10
 		  CONVERT_32BIT_SIZE_T ([R_INLEN])			\
00db10
 		  CONVERT_32BIT_SIZE_T ([R_OUTLEN])			\
00db10
 		  /* Loop which handles UTF-32 chars <=0x7f.  */	\
00db10
-		  "0:  clgijl %[R_INLEN],64,20f\n\t"			\
00db10
-		  "    clgijl %[R_OUTLEN],16,20f\n\t"			\
00db10
+		  "0:  clgijl %[R_INLEN],64,2f\n\t"			\
00db10
+		  "    clgijl %[R_OUTLEN],16,2f\n\t"			\
00db10
 		  "1:  vlm %%v16,%%v19,0(%[R_IN])\n\t"			\
00db10
-		  "    lghi %[R_TMP],0\n\t"				\
00db10
+		  "    lghi %[R_TMP2],0\n\t"				\
00db10
 		  /* Shorten to byte values.  */			\
00db10
 		  "    vpkf %%v23,%%v16,%%v17\n\t"			\
00db10
 		  "    vpkf %%v24,%%v18,%%v19\n\t"			\
00db10
@@ -719,41 +696,116 @@ strong_alias (__from_utf8_loop_c_single, __from_utf8_loop_single)
00db10
 		  "    aghi %[R_OUTLEN],-16\n\t"			\
00db10
 		  "    la %[R_IN],64(%[R_IN])\n\t"			\
00db10
 		  "    la %[R_OUT],16(%[R_OUT])\n\t"			\
00db10
-		  "    clgijl %[R_INLEN],64,20f\n\t"			\
00db10
-		  "    clgijl %[R_OUTLEN],16,20f\n\t"			\
00db10
+		  "    clgijl %[R_INLEN],64,2f\n\t"			\
00db10
+		  "    clgijl %[R_OUTLEN],16,2f\n\t"			\
00db10
 		  "    j 1b\n\t"					\
00db10
 		  /* Found a value > 0x7f.  */				\
00db10
-		  "13: ahi %[R_TMP],4\n\t"				\
00db10
-		  "12: ahi %[R_TMP],4\n\t"				\
00db10
-		  "11: ahi %[R_TMP],4\n\t"				\
00db10
-		  "10: vlgvb %[R_I],%%v22,7\n\t"			\
00db10
-		  "    srlg %[R_I],%[R_I],2\n\t"			\
00db10
-		  "    agr %[R_I],%[R_TMP]\n\t"				\
00db10
-		  "    je 20f\n\t"					\
00db10
+		  "13: ahi %[R_TMP2],4\n\t"				\
00db10
+		  "12: ahi %[R_TMP2],4\n\t"				\
00db10
+		  "11: ahi %[R_TMP2],4\n\t"				\
00db10
+		  "10: vlgvb %[R_TMP],%%v22,7\n\t"			\
00db10
+		  "    srlg %[R_TMP],%[R_TMP],2\n\t"			\
00db10
+		  "    agr %[R_TMP],%[R_TMP2]\n\t"			\
00db10
+		  "    je 16f\n\t"					\
00db10
 		  /* Store characters before invalid one...  */		\
00db10
-		  "    slgr %[R_OUTLEN],%[R_I]\n\t"			\
00db10
-		  "15: aghi %[R_I],-1\n\t"				\
00db10
-		  "    vstl %%v23,%[R_I],0(%[R_OUT])\n\t"		\
00db10
+		  "    slgr %[R_OUTLEN],%[R_TMP]\n\t"			\
00db10
+		  "15: aghi %[R_TMP],-1\n\t"				\
00db10
+		  "    vstl %%v23,%[R_TMP],0(%[R_OUT])\n\t"		\
00db10
 		  /* ... and update pointers.  */			\
00db10
-		  "    aghi %[R_I],1\n\t"				\
00db10
-		  "    la %[R_OUT],0(%[R_I],%[R_OUT])\n\t"		\
00db10
-		  "    sllg %[R_I],%[R_I],2\n\t"			\
00db10
-		  "    la %[R_IN],0(%[R_I],%[R_IN])\n\t"		\
00db10
-		  "    slgr %[R_INLEN],%[R_I]\n\t"			\
00db10
-		  /* Handle multibyte utf8-char with convert instruction. */ \
00db10
-		  "20: cu41 %[R_OUT],%[R_IN]\n\t"			\
00db10
-		  "    jo 0b\n\t" /* Try vector implemenation again.  */ \
00db10
-		  "    lochil %[R_RES],%[RES_OUT_FULL]\n\t" /* cc == 1.  */ \
00db10
-		  "    lochih %[R_RES],%[RES_IN_ILL]\n\t" /* cc == 2.  */ \
00db10
+		  "    aghi %[R_TMP],1\n\t"				\
00db10
+		  "    la %[R_OUT],0(%[R_TMP],%[R_OUT])\n\t"		\
00db10
+		  "    sllg %[R_TMP2],%[R_TMP],2\n\t"			\
00db10
+		  "    la %[R_IN],0(%[R_TMP2],%[R_IN])\n\t"		\
00db10
+		  "    slgr %[R_INLEN],%[R_TMP2]\n\t"			\
00db10
+		  /* Calculate remaining uint32_t values in loaded vrs.  */ \
00db10
+		  "16: lghi %[R_TMP2],16\n\t"				\
00db10
+		  "    sgr %[R_TMP2],%[R_TMP]\n\t"			\
00db10
+		  "    l %[R_TMP],0(%[R_IN])\n\t"			\
00db10
+		  "    aghi %[R_INLEN],-4\n\t"				\
00db10
+		  "    j 22f\n\t"					\
00db10
+		  /* Handle remaining bytes.  */			\
00db10
+		  "2:  clgije %[R_INLEN],0,99f\n\t"			\
00db10
+		  "    clgijl %[R_INLEN],4,92f\n\t"			\
00db10
+		  /* Calculate remaining uint32_t values in inptr.  */	\
00db10
+		  "    srlg %[R_TMP2],%[R_INLEN],2\n\t"			\
00db10
+		  /* Handle multibyte utf8-char. */			\
00db10
+		  "20: l %[R_TMP],0(%[R_IN])\n\t"			\
00db10
+		  "    aghi %[R_INLEN],-4\n\t"				\
00db10
+		  /* Test if ch is 1byte UTF-8 char. */			\
00db10
+		  "21: clijh %[R_TMP],0x7f,22f\n\t"			\
00db10
+		  /* Handle 1-byte UTF-8 char.  */			\
00db10
+		  "31: slgfi %[R_OUTLEN],1\n\t"				\
00db10
+		  "    jl 90f \n\t"					\
00db10
+		  "    stc %[R_TMP],0(%[R_OUT])\n\t"			\
00db10
+		  "    la %[R_IN],4(%[R_IN])\n\t"			\
00db10
+		  "    la %[R_OUT],1(%[R_OUT])\n\t"			\
00db10
+		  "    brctg %[R_TMP2],20b\n\t"				\
00db10
+		  "    j 0b\n\t" /* Switch to vx-loop.  */		\
00db10
+		  /* Test if ch is 2byte UTF-8 char. */			\
00db10
+		  "22: clfi %[R_TMP],0x7ff\n\t"				\
00db10
+		  "    jh 23f\n\t"					\
00db10
+		  /* Handle 2-byte UTF-8 char.  */			\
00db10
+		  "32: slgfi %[R_OUTLEN],2\n\t"				\
00db10
+		  "    jl 90f \n\t"					\
00db10
+		  "    llill %[R_TMP3],0xc080\n\t"			\
00db10
+		  "    risbgn %[R_TMP3],%[R_TMP],51,55,2\n\t" /* 1. byte.   */ \
00db10
+		  "    risbgn %[R_TMP3],%[R_TMP],58,63,0\n\t" /* 2. byte.   */ \
00db10
+		  "    sth %[R_TMP3],0(%[R_OUT])\n\t"			\
00db10
+		  "    la %[R_IN],4(%[R_IN])\n\t"			\
00db10
+		  "    la %[R_OUT],2(%[R_OUT])\n\t"			\
00db10
+		  "    brctg %[R_TMP2],20b\n\t"				\
00db10
+		  "    j 0b\n\t" /* Switch to vx-loop.  */		\
00db10
+		  /* Test if ch is 3-byte UTF-8 char.  */		\
00db10
+		  "23: clfi %[R_TMP],0xffff\n\t"			\
00db10
+		  "    jh 24f\n\t"					\
00db10
+		  /* Handle 3-byte UTF-8 char.  */			\
00db10
+		  "33: slgfi %[R_OUTLEN],3\n\t"				\
00db10
+		  "    jl 90f \n\t"					\
00db10
+		  "    llilf %[R_TMP3],0xe08080\n\t"			\
00db10
+		  "    risbgn %[R_TMP3],%[R_TMP],44,47,4\n\t" /* 1. byte.  */ \
00db10
+		  "    risbgn %[R_TMP3],%[R_TMP],50,55,2\n\t" /* 2. byte.  */ \
00db10
+		  "    risbgn %[R_TMP3],%[R_TMP],58,63,0\n\t" /* 3. byte.  */ \
00db10
+		  /* Test if ch is a UTF-16 surrogate: ch & 0xf800 == 0xd800  */ \
00db10
+		  "    nilf %[R_TMP],0xf800\n\t"			\
00db10
+		  "    clfi %[R_TMP],0xd800\n\t"			\
00db10
+		  "    je 91f\n\t" /* Do not accept UTF-16 surrogates.  */ \
00db10
+		  "    stcm %[R_TMP3],7,0(%[R_OUT])\n\t"		\
00db10
+		  "    la %[R_IN],4(%[R_IN])\n\t"			\
00db10
+		  "    la %[R_OUT],3(%[R_OUT])\n\t"			\
00db10
+		  "    brctg %[R_TMP2],20b\n\t"				\
00db10
+		  "    j 0b\n\t" /* Switch to vx-loop.  */		\
00db10
+		  /* Test if ch is 4-byte UTF-8 char.  */		\
00db10
+		  "24: clfi %[R_TMP],0x10ffff\n\t"			\
00db10
+		  "    jh 91f\n\t" /* ch > 0x10ffff is not allowed!  */	\
00db10
+		  /* Handle 4-byte UTF-8 char.  */			\
00db10
+		  "34: slgfi %[R_OUTLEN],4\n\t"				\
00db10
+		  "    jl 90f \n\t"					\
00db10
+		  "    llilf %[R_TMP3],0xf0808080\n\t"			\
00db10
+		  "    risbgn %[R_TMP3],%[R_TMP],37,39,6\n\t" /* 1. byte.  */ \
00db10
+		  "    risbgn %[R_TMP3],%[R_TMP],42,47,4\n\t" /* 2. byte.  */ \
00db10
+		  "    risbgn %[R_TMP3],%[R_TMP],50,55,2\n\t" /* 3. byte.  */ \
00db10
+		  "    risbgn %[R_TMP3],%[R_TMP],58,63,0\n\t" /* 4. byte.  */ \
00db10
+		  "    st %[R_TMP3],0(%[R_OUT])\n\t"			\
00db10
+		  "    la %[R_IN],4(%[R_IN])\n\t"			\
00db10
+		  "    la %[R_OUT],4(%[R_OUT])\n\t"			\
00db10
+		  "    brctg %[R_TMP2],20b\n\t"				\
00db10
+		  "    j 0b\n\t" /* Switch to vx-loop.  */		\
00db10
+		  "92: lghi %[R_RES],%[RES_IN_FULL]\n\t"		\
00db10
+		  "    j 99f\n\t"					\
00db10
+		  "91: lghi %[R_RES],%[RES_IN_ILL]\n\t"			\
00db10
+		  "    j 99f\n\t"					\
00db10
+		  "90: lghi %[R_RES],%[RES_OUT_FULL]\n\t"		\
00db10
+		  "99: \n\t"						\
00db10
 		  ".machine pop"					\
00db10
-		  : /* outputs */ [R_IN] "+a" (pInput)			\
00db10
-		    , [R_INLEN] "+d" (inlen), [R_OUT] "+a" (pOutput)	\
00db10
-		    , [R_OUTLEN] "+d" (outlen), [R_TMP] "=d" (tmp)	\
00db10
-		    , [R_I] "=a" (tmp2)					\
00db10
+		  : /* outputs */ [R_IN] "+a" (inptr)			\
00db10
+		    , [R_INLEN] "+d" (inlen), [R_OUT] "+a" (outptr)	\
00db10
+		    , [R_OUTLEN] "+d" (outlen), [R_TMP] "=a" (tmp)	\
00db10
+		    , [R_TMP2] "=a" (tmp2), [R_TMP3] "=d" (tmp3)	\
00db10
 		    , [R_RES] "+d" (result)				\
00db10
 		  : /* inputs */					\
00db10
 		    [RES_OUT_FULL] "i" (__GCONV_FULL_OUTPUT)		\
00db10
 		    , [RES_IN_ILL] "i" (__GCONV_ILLEGAL_INPUT)		\
00db10
+		    , [RES_IN_FULL] "i" (__GCONV_INCOMPLETE_INPUT)	\
00db10
 		  : /* clobber list */ "memory", "cc"			\
00db10
 		    ASM_CLOBBER_VR ("v16") ASM_CLOBBER_VR ("v17")	\
00db10
 		    ASM_CLOBBER_VR ("v18") ASM_CLOBBER_VR ("v19")	\
00db10
@@ -761,8 +813,11 @@ strong_alias (__from_utf8_loop_c_single, __from_utf8_loop_single)
00db10
 		    ASM_CLOBBER_VR ("v22") ASM_CLOBBER_VR ("v23")	\
00db10
 		    ASM_CLOBBER_VR ("v24")				\
00db10
 		  );							\
00db10
-    inptr = pInput;							\
00db10
-    outptr = pOutput;							\
00db10
+    if (__glibc_likely (inptr == inend)					\
00db10
+	|| result != __GCONV_ILLEGAL_INPUT)				\
00db10
+      break;								\
00db10
+									\
00db10
+    STANDARD_TO_LOOP_ERR_HANDLER (4);					\
00db10
   }
00db10
 
00db10
 /* Generate loop-function with software routing.  */
00db10
@@ -774,15 +829,6 @@ strong_alias (__from_utf8_loop_c_single, __from_utf8_loop_single)
00db10
 #define LOOP_NEED_FLAGS
00db10
 #include <iconv/loop.c>
00db10
 
00db10
-/* Generate loop-function with hardware utf-convert instruction.  */
00db10
-#define MIN_NEEDED_INPUT	MIN_NEEDED_TO
00db10
-#define MIN_NEEDED_OUTPUT	MIN_NEEDED_FROM
00db10
-#define MAX_NEEDED_OUTPUT	MAX_NEEDED_FROM
00db10
-#define LOOPFCT			__to_utf8_loop_etf3eh
00db10
-#define LOOP_NEED_FLAGS
00db10
-#define BODY			BODY_TO_ETF3EH
00db10
-#include <iconv/loop.c>
00db10
-
00db10
 #if defined HAVE_S390_VX_ASM_SUPPORT
00db10
 /* Generate loop-function with hardware vector and utf-convert instructions.  */
00db10
 # define MIN_NEEDED_INPUT	MIN_NEEDED_TO
00db10
@@ -807,10 +853,6 @@ __to_utf8_loop_resolver (unsigned long int dl_hwcap)
00db10
     return __to_utf8_loop_vx;
00db10
   else
00db10
 #endif
00db10
-  if (dl_hwcap & HWCAP_S390_ZARCH && dl_hwcap & HWCAP_S390_HIGH_GPRS
00db10
-      && dl_hwcap & HWCAP_S390_ETF3EH)
00db10
-    return __to_utf8_loop_etf3eh;
00db10
-  else
00db10
     return __to_utf8_loop_c;
00db10
 }
00db10
 
00db10
-- 
00db10
1.8.3.1
00db10