Blame SOURCES/valgrind-3.14.0-transform-popcount64-ctznat64.patch

cb589a
commit cb5d7e047598bff6d0f1d707a70d9fb1a1c7f0e2
cb589a
Author: Julian Seward <jseward@acm.org>
cb589a
Date:   Tue Nov 20 11:46:55 2018 +0100
cb589a
cb589a
    VEX/priv/ir_opt.c
cb589a
    
cb589a
    fold_Expr: transform PopCount64(And64(Add64(x,-1),Not64(x))) into CtzNat64(x).
cb589a
    
cb589a
    This is part of the fix for bug 386945.
cb589a
cb589a
diff --git a/VEX/priv/ir_opt.c b/VEX/priv/ir_opt.c
cb589a
index f40870b..23964be 100644
cb589a
--- a/VEX/priv/ir_opt.c
cb589a
+++ b/VEX/priv/ir_opt.c
cb589a
@@ -1377,6 +1377,8 @@ static IRExpr* fold_Expr ( IRExpr** env, IRExpr* e )
cb589a
    case Iex_Unop:
cb589a
       /* UNARY ops */
cb589a
       if (e->Iex.Unop.arg->tag == Iex_Const) {
cb589a
+
cb589a
+         /* cases where the arg is a const */
cb589a
          switch (e->Iex.Unop.op) {
cb589a
          case Iop_1Uto8:
cb589a
             e2 = IRExpr_Const(IRConst_U8(toUChar(
cb589a
@@ -1690,8 +1692,56 @@ static IRExpr* fold_Expr ( IRExpr** env, IRExpr* e )
cb589a
 
cb589a
          default: 
cb589a
             goto unhandled;
cb589a
-      }
cb589a
-      }
cb589a
+         } // switch (e->Iex.Unop.op)
cb589a
+
cb589a
+      } else {
cb589a
+
cb589a
+         /* other cases (identities, etc) */
cb589a
+         switch (e->Iex.Unop.op) {
cb589a
+         case Iop_PopCount64: {
cb589a
+            // PopCount64( And64( Add64(x,-1), Not64(x) ) ) ==> CtzNat64(x)
cb589a
+            // bindings:
cb589a
+            //   a1:And64( a11:Add64(a111:x,a112:-1), a12:Not64(a121:x) )
cb589a
+            IRExpr* a1 = chase(env, e->Iex.Unop.arg);
cb589a
+            if (!a1)
cb589a
+               goto nomatch;
cb589a
+            if (a1->tag != Iex_Binop || a1->Iex.Binop.op != Iop_And64)
cb589a
+               goto nomatch;
cb589a
+            // a1 is established
cb589a
+            IRExpr* a11 = chase(env, a1->Iex.Binop.arg1);
cb589a
+            if (!a11)
cb589a
+               goto nomatch;
cb589a
+            if (a11->tag != Iex_Binop || a11->Iex.Binop.op != Iop_Add64)
cb589a
+               goto nomatch;
cb589a
+            // a11 is established
cb589a
+            IRExpr* a12 = chase(env, a1->Iex.Binop.arg2);
cb589a
+            if (!a12)
cb589a
+               goto nomatch;
cb589a
+            if (a12->tag != Iex_Unop || a12->Iex.Unop.op != Iop_Not64)
cb589a
+               goto nomatch;
cb589a
+            // a12 is established
cb589a
+            IRExpr* a111 = a11->Iex.Binop.arg1;
cb589a
+            IRExpr* a112 = chase(env, a11->Iex.Binop.arg2);
cb589a
+            IRExpr* a121 = a12->Iex.Unop.arg;
cb589a
+            if (!a111 || !a112 || !a121)
cb589a
+               goto nomatch;
cb589a
+            // a111 and a121 need to be the same temp.
cb589a
+            if (!eqIRAtom(a111, a121))
cb589a
+               goto nomatch;
cb589a
+            // Finally, a112 must be a 64-bit version of -1.
cb589a
+            if (!isOnesU(a112))
cb589a
+               goto nomatch;
cb589a
+            // Match established.  Transform.
cb589a
+            e2 = IRExpr_Unop(Iop_CtzNat64, a111);
cb589a
+            break;
cb589a
+           nomatch:
cb589a
+            break;
cb589a
+         }
cb589a
+         default:
cb589a
+            break;
cb589a
+         } // switch (e->Iex.Unop.op)
cb589a
+
cb589a
+      } // if (e->Iex.Unop.arg->tag == Iex_Const)
cb589a
       break;
cb589a
 
cb589a
    case Iex_Binop: