Add IR ops Iop_CmpNEZ32x8 and Iop_CmpNEZ64x4, needed for Memcheck

author Julian Seward <jseward@acm.org>
Mon, 25 Jun 2012 07:46:18 +0000 (07:46 +0000)

committer Julian Seward <jseward@acm.org>
Mon, 25 Jun 2012 07:46:18 +0000 (07:46 +0000)
diff --git a/VEX/priv/host_amd64_isel.c b/VEX/priv/host_amd64_isel.c

index 86eb2d8a205bbd4c779645b6b1398a6414e0d634..46d267021168fcb13d86f5caefa9a82a31a077b6 100644 (file)
--- a/VEX/priv/host_amd64_isel.c
+++ b/VEX/priv/host_amd64_isel.c
@@ -3474,6 +3474,51 @@ static void iselDVecExpr_wrk ( /*OUT*/HReg* rHi, /*OUT*/HReg* rLo,
           return;
        }
  
+      case Iop_CmpNEZ64x4: {
+         /* SSE2 instructions suffice: each 128-bit half is handled
+            separately.  Same scheme as Iop_CmpNEZ64x2, applied to
+            both halves of the 256-bit value.  See the comment on
+            Iop_CmpNEZ64x2 for an explanation of what's going on. */
+         HReg argHi, argLo;
+         iselDVecExpr(&argHi, &argLo, env, e->Iex.Unop.arg);
+         HReg tmpHi  = generate_zeroes_V128(env);
+         HReg tmpLo  = newVRegV(env);
+         addInstr(env, mk_vMOVsd_RR(tmpHi, tmpLo));
+         HReg dstHi  = newVRegV(env);
+         HReg dstLo  = newVRegV(env);
+         addInstr(env, AMD64Instr_SseReRg(Asse_CMPEQ32, argHi, tmpHi));
+         addInstr(env, AMD64Instr_SseReRg(Asse_CMPEQ32, argLo, tmpLo));
+         tmpHi = do_sse_NotV128(env, tmpHi);
+         tmpLo = do_sse_NotV128(env, tmpLo);
+         addInstr(env, AMD64Instr_SseShuf(0xB1, tmpHi, dstHi));
+         addInstr(env, AMD64Instr_SseShuf(0xB1, tmpLo, dstLo));
+         addInstr(env, AMD64Instr_SseReRg(Asse_OR, tmpHi, dstHi));
+         addInstr(env, AMD64Instr_SseReRg(Asse_OR, tmpLo, dstLo));
+         *rHi = dstHi;
+         *rLo = dstLo;
+         return;
+      }
+
+      case Iop_CmpNEZ32x8: op = Asse_CMPEQ32; goto do_CmpNEZ_vector;
+      do_CmpNEZ_vector:
+      {
+         HReg argHi, argLo;
+         iselDVecExpr(&argHi, &argLo, env, e->Iex.Unop.arg);
+         HReg tmpHi = newVRegV(env);
+         HReg tmpLo = newVRegV(env);
+         HReg zero  = generate_zeroes_V128(env);
+         HReg dstHi, dstLo;
+         addInstr(env, mk_vMOVsd_RR(argHi, tmpHi));
+         addInstr(env, mk_vMOVsd_RR(argLo, tmpLo));
+         addInstr(env, AMD64Instr_SseReRg(op, zero, tmpHi));
+         addInstr(env, AMD64Instr_SseReRg(op, zero, tmpLo));
+         dstHi = do_sse_NotV128(env, tmpHi);
+         dstLo = do_sse_NotV128(env, tmpLo);
+         *rHi = dstHi;
+         *rLo = dstLo;
+         return;
+      }
+
        default:
           break;
     } /* switch (e->Iex.Unop.op) */
diff --git a/VEX/priv/ir_defs.c b/VEX/priv/ir_defs.c

index 71a8e27525fdf109987c0b647837acc68808d417..5d3b8b7ebb70ad59dbbbc3782810bb9af41eae2e 100644 (file)
--- a/VEX/priv/ir_defs.c
+++ b/VEX/priv/ir_defs.c
@@ -1008,6 +1008,8 @@ void ppIROp ( IROp op )
        case Iop_OrV256:  vex_printf("OrV256"); return;
        case Iop_XorV256: vex_printf("XorV256"); return;
        case Iop_NotV256: vex_printf("NotV256"); return;
+      case Iop_CmpNEZ64x4: vex_printf("CmpNEZ64x4"); return;
+      case Iop_CmpNEZ32x8: vex_printf("CmpNEZ32x8"); return;
        default: vpanic("ppIROp(1)");
     }
  
@@ -2828,6 +2830,7 @@ void typeOfPrimop ( IROp op,
        case Iop_Sqrt32Fx8:
        case Iop_Sqrt64Fx4:
        case Iop_Recip32Fx8:
+      case Iop_CmpNEZ64x4: case Iop_CmpNEZ32x8:
           UNARY(Ity_V256, Ity_V256);
  
        default:
diff --git a/VEX/pub/libvex_ir.h b/VEX/pub/libvex_ir.h

index acac2c347c20a71fc1e720c7df0f76f589c1ddf9..7aaef1e5eb73154b678af2ed47ab933dec4202cd 100644 (file)
--- a/VEX/pub/libvex_ir.h
+++ b/VEX/pub/libvex_ir.h
@@ -1441,6 +1441,9 @@ typedef
        Iop_XorV256,
        Iop_NotV256,
  
+      /* MISC (vector integer cmp != 0) */
+      Iop_CmpNEZ32x8, Iop_CmpNEZ64x4,
+
        /* ------------------ 256-bit SIMD FP. ------------------ */
        Iop_Add64Fx4,
        Iop_Sub64Fx4,
author	Julian Seward <jseward@acm.org>
	Mon, 25 Jun 2012 07:46:18 +0000 (07:46 +0000)
committer	Julian Seward <jseward@acm.org>
	Mon, 25 Jun 2012 07:46:18 +0000 (07:46 +0000)
VEX/priv/host_amd64_isel.c		patch \| blob \| blame \| history
VEX/priv/ir_defs.c		patch \| blob \| blame \| history
VEX/pub/libvex_ir.h		patch \| blob \| blame \| history