Implement VRINT{A,N,P,M}.F64 d_d, VRINT{A,N,P,M}.F32 s_s.

author Julian Seward <jseward@acm.org>

Thu, 12 Jan 2017 14:37:58 +0000 (14:37 +0000)

committer Julian Seward <jseward@acm.org>

Thu, 12 Jan 2017 14:37:58 +0000 (14:37 +0000)
author Julian Seward <jseward@acm.org>
Thu, 12 Jan 2017 14:37:58 +0000 (14:37 +0000)
committer Julian Seward <jseward@acm.org>
Thu, 12 Jan 2017 14:37:58 +0000 (14:37 +0000)
diff --git a/VEX/priv/guest_arm_toIR.c b/VEX/priv/guest_arm_toIR.c

index b5458d2b0617c975d98cd0b9f8778be89b56abc2..42c648b5488a708207fb8318ac12a656d2dc685d 100644 (file)
--- a/VEX/priv/guest_arm_toIR.c
+++ b/VEX/priv/guest_arm_toIR.c
@@ -13510,6 +13510,59 @@ static Bool decode_V8_instruction (
     }
     /* fall through */
  
+   /* -------- VRINT{A,N,P,M}.F64 d_d, VRINT{A,N,P,M}.F32 s_s -------- */
+   /*        31        22 21   17 15 11  8 7  5 4 3
+      T1/A1: 111111101 D  1110 rm Vd 101 1 01 M 0 Vm VRINT{A,N,P,M}.F64 Dd, Dm
+      T1/A1: 111111101 D  1110 rm Vd 101 0 01 M 0 Vm VRINT{A,N,P,M}.F32 Sd, Sm
+
+      ARM encoding is in NV space.
+      In Thumb mode, we must not be in an IT block.
+   */
+   if (INSN(31,23) == BITS9(1,1,1,1,1,1,1,0,1)
+       && INSN(21,18) == BITS4(1,1,1,0) && INSN(11,9) == BITS3(1,0,1)
+       && INSN(7,6) == BITS2(0,1) && INSN(4,4) == 0) {
+      UInt bit_D  = INSN(22,22);
+      UInt fld_rm = INSN(17,16);
+      UInt fld_d  = INSN(15,12);
+      Bool isF64  = INSN(8,8) == 1;
+      UInt bit_M  = INSN(5,5);
+      UInt fld_m  = INSN(3,0);
+
+      UInt dd = isF64 ? ((bit_D << 4) | fld_d) : ((fld_d << 1) | bit_D);
+      UInt mm = isF64 ? ((bit_M << 4) | fld_m) : ((fld_m << 1) | bit_M);
+
+      if (isT) {
+         gen_SIGILL_T_if_in_ITBlock(old_itstate, new_itstate);
+      }
+      /* In ARM mode, this is statically unconditional.  In Thumb mode,
+         this must be dynamically unconditional, and we've SIGILLd if not.
+         In either case we can create unconditional IR. */
+
+      UChar c = '?';
+      IRRoundingMode rm = Irrm_NEAREST;
+      switch (fld_rm) {
+         /* The use of NEAREST for both the 'a' and 'n' cases is a bit of a
+            kludge since it doesn't take into account the nearest-even vs
+            nearest-away semantics. */
+         case BITS2(0,0): c = 'a'; rm = Irrm_NEAREST; break;
+         case BITS2(0,1): c = 'n'; rm = Irrm_NEAREST; break;
+         case BITS2(1,0): c = 'p'; rm = Irrm_PosINF;  break;
+         case BITS2(1,1): c = 'm'; rm = Irrm_NegINF;  break;
+         default: vassert(0);
+      }
+
+      IRExpr* srcM = (isF64 ? llGetDReg : llGetFReg)(mm);
+      IRExpr* res  = binop(isF64 ? Iop_RoundF64toInt : Iop_RoundF32toInt,
+                           mkU32((UInt)rm), srcM);
+      (isF64 ? llPutDReg : llPutFReg)(dd, res);
+
+      UChar rch = isF64 ? 'd' : 'f';
+      DIP("vrint%c.%s %c%u, %c%u\n",
+          c, isF64 ? "f64" : "f32", rch, dd, rch, mm);
+      return True;
+   }
+   /* fall through */
+
     /* ---------- Doesn't match anything. ---------- */
     return False;
  
diff --git a/VEX/priv/host_arm_defs.c b/VEX/priv/host_arm_defs.c

index 2b18714f022b33b57b912945fff8a577f702ae43..04080dde70c13d3604457d535501f1f523f9fa8b 100644 (file)
--- a/VEX/priv/host_arm_defs.c
+++ b/VEX/priv/host_arm_defs.c
@@ -1365,6 +1365,15 @@ ARMInstr* ARMInstr_VCvtID ( Bool iToD, Bool syned,
     i->ARMin.VCvtID.src   = src;
     return i;
  }
+ARMInstr* ARMInstr_VRIntR ( Bool isF64, HReg dst, HReg src )
+{  /* Allocate an ARMin_VRIntR instruction and fill in its operands. */
+   ARMInstr* i = LibVEX_Alloc_inline(sizeof(ARMInstr));
+   i->tag                = ARMin_VRIntR;
+   i->ARMin.VRIntR.isF64 = isF64;  /* True selects the F64 form, False the F32 form */
+   i->ARMin.VRIntR.dst   = dst ;
+   i->ARMin.VRIntR.src   = src;
+   return i;
+}
  ARMInstr* ARMInstr_FPSCR ( Bool toFPSCR, HReg iReg ) {
     ARMInstr* i = LibVEX_Alloc_inline(sizeof(ARMInstr));
     i->tag                 = ARMin_FPSCR;
@@ -1873,6 +1882,14 @@ void ppARMInstr ( const ARMInstr* i ) {
           ppHRegARM(i->ARMin.VCvtID.src);
           return;
        }
+      case ARMin_VRIntR: {
+         const HChar* sz = i->ARMin.VRIntR.isF64 ? "f64" : "f32";
+         vex_printf("vrintr.%s.%s ", sz, sz);
+         ppHRegARM(i->ARMin.VRIntR.dst);
+         vex_printf(", ");
+         ppHRegARM(i->ARMin.VRIntR.src);
+         return;
+      }
        case ARMin_FPSCR:
           if (i->ARMin.FPSCR.toFPSCR) {
              vex_printf("fmxr  fpscr, ");
@@ -2268,6 +2285,10 @@ void getRegUsage_ARMInstr ( HRegUsage* u, const ARMInstr* i, Bool mode64 )
           addHRegUse(u, HRmWrite, i->ARMin.VCvtID.dst);
           addHRegUse(u, HRmRead,  i->ARMin.VCvtID.src);
           return;
+      case ARMin_VRIntR:
+         addHRegUse(u, HRmWrite, i->ARMin.VRIntR.dst);
+         addHRegUse(u, HRmRead,  i->ARMin.VRIntR.src);
+         return;
        case ARMin_FPSCR:
           if (i->ARMin.FPSCR.toFPSCR)
              addHRegUse(u, HRmRead, i->ARMin.FPSCR.iReg);
@@ -2483,6 +2504,10 @@ void mapRegs_ARMInstr ( HRegRemap* m, ARMInstr* i, Bool mode64 )
           i->ARMin.VCvtID.dst = lookupHRegRemap(m, i->ARMin.VCvtID.dst);
           i->ARMin.VCvtID.src = lookupHRegRemap(m, i->ARMin.VCvtID.src);
           return;
+      case ARMin_VRIntR:
+         i->ARMin.VRIntR.dst = lookupHRegRemap(m, i->ARMin.VRIntR.dst);
+         i->ARMin.VRIntR.src = lookupHRegRemap(m, i->ARMin.VRIntR.src);
+         return;
        case ARMin_FPSCR:
           i->ARMin.FPSCR.iReg = lookupHRegRemap(m, i->ARMin.FPSCR.iReg);
           return;
@@ -3852,6 +3877,29 @@ Int emit_ARMInstr ( /*MB_MOD*/Bool* is_profInc,
           /*UNREACHED*/
           vassert(0);
        }
+      case ARMin_VRIntR: { /* NB: ARM v8 and above only */
+         Bool isF64 = i->ARMin.VRIntR.isF64;
+         UInt rDst  = (isF64 ? dregEnc : fregEnc)(i->ARMin.VRIntR.dst);
+         UInt rSrc  = (isF64 ? dregEnc : fregEnc)(i->ARMin.VRIntR.src);
+         /* The encoding of registers here differs strangely for the
+            F32 and F64 cases. */
+         UInt D, Vd, M, Vm;
+         if (isF64) {
+            D  = (rDst >> 4) & 1;
+            Vd = rDst & 0xF;
+            M  = (rSrc >> 4) & 1;
+            Vm = rSrc & 0xF;
+         } else {
+            Vd = (rDst >> 1) & 0xF;
+            D  = rDst & 1;
+            Vm = (rSrc >> 1) & 0xF;
+            M  = rSrc & 1;
+         }
+         vassert(D <= 1 && Vd <= 15 && M <= 1 && Vm <= 15);
+         *p++ = XXXXXXXX(0xE, X1110, X1011 | (D << 2), X0110, Vd,
+                         isF64 ? X1011 : X1010, X0100 | (M << 1), Vm);
+         goto done;
+      }
        case ARMin_FPSCR: {
           Bool toFPSCR = i->ARMin.FPSCR.toFPSCR;
           UInt iReg    = iregEnc(i->ARMin.FPSCR.iReg);
diff --git a/VEX/priv/host_arm_defs.h b/VEX/priv/host_arm_defs.h

index cd2051256aa7bc44a85ac57e348ceeb7bf6482ef..ada0775009d001cc846c24b620657b55e459db5e 100644 (file)
--- a/VEX/priv/host_arm_defs.h
+++ b/VEX/priv/host_arm_defs.h
@@ -595,6 +595,7 @@ typedef
        ARMin_VXferD,
        ARMin_VXferS,
        ARMin_VCvtID,
+      ARMin_VRIntR,
        ARMin_FPSCR,
        ARMin_MFence,
        ARMin_CLREX,
@@ -853,6 +854,13 @@ typedef
              HReg dst;
              HReg src;
           } VCvtID;
+         /* Round an F32 or F64 value to the nearest integral value,
+            according to the FPSCR.RM.  For ARM >= V8 hosts only. */
+         struct {
+            Bool isF64;
+            HReg dst;
+            HReg src;
+         } VRIntR;
           /* Move a 32-bit value to/from the FPSCR (FMXR, FMRX) */
           struct {
              Bool toFPSCR;
@@ -1007,6 +1015,7 @@ extern ARMInstr* ARMInstr_VXferD   ( Bool toD, HReg dD, HReg rHi, HReg rLo );
  extern ARMInstr* ARMInstr_VXferS   ( Bool toS, HReg fD, HReg rLo );
  extern ARMInstr* ARMInstr_VCvtID   ( Bool iToD, Bool syned,
                                       HReg dst, HReg src );
+extern ARMInstr* ARMInstr_VRIntR   ( Bool isF64, HReg dst, HReg src );
  extern ARMInstr* ARMInstr_FPSCR    ( Bool toFPSCR, HReg iReg );
  extern ARMInstr* ARMInstr_MFence   ( void );
  extern ARMInstr* ARMInstr_CLREX    ( void );
diff --git a/VEX/priv/host_arm_isel.c b/VEX/priv/host_arm_isel.c

index 3b093701a4942f17294e1f0d73ea0856e18ad47f..8dd1b4d6127aa09bbaff2a36d06e96a22d39f577 100644 (file)
--- a/VEX/priv/host_arm_isel.c
+++ b/VEX/priv/host_arm_isel.c
@@ -5603,6 +5603,21 @@ static HReg iselDblExpr_wrk ( ISelEnv* env, IRExpr* e )
              addInstr(env, ARMInstr_VUnaryD(ARMvfpu_SQRT, dst, src));
              return dst;
           }
+         case Iop_RoundF64toInt: {
+            /* We can only generate this on a >= V8 capable target.  But
+               that's OK since we should only be asked to generate for V8
+               capable guests, and we assume here that host == guest. */
+            if (VEX_ARM_ARCHLEVEL(env->hwcaps) >= 8) {
+               HReg src = iselDblExpr(env, e->Iex.Binop.arg2);
+               HReg dst = newVRegD(env);
+               set_VFP_rounding_mode(env, e->Iex.Binop.arg1);
+               addInstr(env, ARMInstr_VRIntR(True/*isF64*/, dst, src));
+               set_VFP_rounding_default(env);
+               return dst;
+            }
+            /* not a V8 target, so we can't select insns for this. */
+            break;
+         }
           default:
              break;
        }
@@ -5745,6 +5760,21 @@ static HReg iselFltExpr_wrk ( ISelEnv* env, IRExpr* e )
              set_VFP_rounding_default(env);
              return valS;
           }
+         case Iop_RoundF32toInt: {
+            /* We can only generate this on a >= V8 capable target.  But
+               that's OK since we should only be asked to generate for V8
+               capable guests, and we assume here that host == guest. */
+            if (VEX_ARM_ARCHLEVEL(env->hwcaps) >= 8) {
+               HReg src = iselFltExpr(env, e->Iex.Binop.arg2);
+               HReg dst = newVRegF(env);
+               set_VFP_rounding_mode(env, e->Iex.Binop.arg1);
+               addInstr(env, ARMInstr_VRIntR(False/*!isF64*/, dst, src));
+               set_VFP_rounding_default(env);
+               return dst;
+            }
+            /* not a V8 target, so we can't select insns for this. */
+            break;
+         }
           default:
              break;
        }
author	Julian Seward <jseward@acm.org>
	Thu, 12 Jan 2017 14:37:58 +0000 (14:37 +0000)
committer	Julian Seward <jseward@acm.org>
	Thu, 12 Jan 2017 14:37:58 +0000 (14:37 +0000)
VEX/priv/guest_arm_toIR.c		patch \| blob \| blame \| history
VEX/priv/host_arm_defs.c		patch \| blob \| blame \| history
VEX/priv/host_arm_defs.h		patch \| blob \| blame \| history
VEX/priv/host_arm_isel.c		patch \| blob \| blame \| history