Merge, from branches/COMEM, revisions 2568 to 2641.

author Julian Seward <jseward@acm.org>

Thu, 17 Jan 2013 14:23:53 +0000 (14:23 +0000)

committer Julian Seward <jseward@acm.org>

Thu, 17 Jan 2013 14:23:53 +0000 (14:23 +0000)
author Julian Seward <jseward@acm.org>
Thu, 17 Jan 2013 14:23:53 +0000 (14:23 +0000)
committer Julian Seward <jseward@acm.org>
Thu, 17 Jan 2013 14:23:53 +0000 (14:23 +0000)
diff --cc VEX/priv/guest_arm_toIR.c
Simple merge
diff --cc VEX/priv/host_amd64_isel.c

index 9c2c1070aef4f85ab71a0bdaf916c0303925b3be,9063b3fc84ccca3689213426fb827283f0452ebb..5a13711496ebe881e7fcca757632074b118f1884
--- 1/VEX/priv/host_amd64_isel.c
--- 2/VEX/priv/host_amd64_isel.c
+++ b/VEX/priv/host_amd64_isel.c
@@@ -1605,36 -1607,6 +1607,37 @@@ static HReg iselIntExpr_R_wrk ( ISelEnv
               return dst;
            }
   
-             addInstr(env, AMD64Instr_Call( Acc_ALWAYS, (ULong)fn, 2 ));
+ +         case Iop_GetMSBs8x16: {
+ +            /* Note: the following assumes the helper is of signature
+ +                  UInt fn ( ULong w64hi, ULong w64Lo ),
+ +               and is not a regparm fn. */
+ +            HReg dst = newVRegI(env);
+ +            HReg vec = iselVecExpr(env, e->Iex.Unop.arg);
+ +            HReg rsp = hregAMD64_RSP();
+ +            fn = (HWord)h_generic_calc_GetMSBs8x16;
+ +            AMD64AMode* m8_rsp  = AMD64AMode_IR( -8, rsp);
+ +            AMD64AMode* m16_rsp = AMD64AMode_IR(-16, rsp);
+ +            addInstr(env, AMD64Instr_SseLdSt(False/*store*/,
+ +                                             16, vec, m16_rsp));
+ +            /* hi 64 bits into RDI -- the first arg */
+ +            addInstr(env, AMD64Instr_Alu64R( Aalu_MOV, 
+ +                                             AMD64RMI_Mem(m8_rsp),
+ +                                             hregAMD64_RDI() )); /* 1st arg */
+ +            /* lo 64 bits into RSI -- the 2nd arg */
+ +            addInstr(env, AMD64Instr_Alu64R( Aalu_MOV, 
+ +                                             AMD64RMI_Mem(m16_rsp),
+ +                                             hregAMD64_RSI() )); /* 2nd arg */
++            addInstr(env, AMD64Instr_Call( Acc_ALWAYS, (ULong)fn,
++                                           2, RetLocInt ));
+ +            /* MovxLQ is not exactly the right thing here.  We just
+ +               need to get the bottom 16 bits of RAX into dst, and zero
+ +               out everything else.  Assuming that the helper returns
+ +               a UInt with the top 16 bits zeroed out, it'll do,
+ +               though. */
+ +            addInstr(env, AMD64Instr_MovxLQ(False, hregAMD64_RAX(), dst));
+ +            return dst;
+ +         }
+ +
            default: 
               break;
         }
diff --cc VEX/priv/host_arm_isel.c
Simple merge
diff --cc VEX/priv/host_ppc_isel.c
Simple merge
diff --cc VEX/priv/host_s390_defs.c
Simple merge
diff --cc VEX/priv/ir_defs.c
Simple merge
diff --cc VEX/priv/ir_opt.c

index 89db9ea38050c5a683635bae074f52d6de3858cc,c8d018f2b580dfd7efbddbe6bc43671c57b73b9a..3c52c173737dc4ea59ecb5519923328fadc63f6d
--- 1/VEX/priv/ir_opt.c
--- 2/VEX/priv/ir_opt.c
+++ b/VEX/priv/ir_opt.c
@@@ -2399,6 -2439,62 +2431,62 @@@ static IRStmt* subst_and_fold_Stmt ( IR
                      fold_Expr(env, subst_Expr(env, st->Ist.Store.data))
                   );
   
- -            we can replace it with a NoOp, but if the guard folds down
- -            to 'true', we can't conveniently replace it with an
- -            unconditional load, because doing so requires generating a
- -            new temporary, and that is not easy to do at this
- -            point. */
+       case Ist_StoreG: {
+          IRStoreG* sg = st->Ist.StoreG.details;
+          vassert(isIRAtom(sg->addr));
+          vassert(isIRAtom(sg->data));
+          vassert(isIRAtom(sg->guard));
+          IRExpr* faddr  = fold_Expr(env, subst_Expr(env, sg->addr));
+          IRExpr* fdata  = fold_Expr(env, subst_Expr(env, sg->data));
+          IRExpr* fguard = fold_Expr(env, subst_Expr(env, sg->guard));
+          if (fguard->tag == Iex_Const) {
+             /* The condition on this store has folded down to a constant. */
+             vassert(fguard->Iex.Const.con->tag == Ico_U1);
+             if (fguard->Iex.Const.con->Ico.U1 == False) {
+                return IRStmt_NoOp();
+             } else {
+                vassert(fguard->Iex.Const.con->Ico.U1 == True);
+                return IRStmt_Store(sg->end, faddr, fdata);
+             }
+          }
+          return IRStmt_StoreG(sg->end, faddr, fdata, fguard);
+       }
+ 
+       case Ist_LoadG: {
+          /* This is complicated.  If the guard folds down to 'false',
++            we can replace it with an assignment 'dst := alt', but if
++            the guard folds down to 'true', we can't conveniently
++            replace it with an unconditional load, because doing so
++            requires generating a new temporary, and that is not easy
++            to do at this point. */
+          IRLoadG* lg = st->Ist.LoadG.details;
+          vassert(isIRAtom(lg->addr));
+          vassert(isIRAtom(lg->alt));
+          vassert(isIRAtom(lg->guard));
+          IRExpr* faddr  = fold_Expr(env, subst_Expr(env, lg->addr));
+          IRExpr* falt   = fold_Expr(env, subst_Expr(env, lg->alt));
+          IRExpr* fguard = fold_Expr(env, subst_Expr(env, lg->guard));
+          if (fguard->tag == Iex_Const) {
+             /* The condition on this load has folded down to a constant. */
+             vassert(fguard->Iex.Const.con->tag == Ico_U1);
+             if (fguard->Iex.Const.con->Ico.U1 == False) {
+                /* The load is not going to happen -- instead 'alt' is
+                   assigned to 'dst'.  */
+                return IRStmt_WrTmp(lg->dst, falt);
+             } else {
+                vassert(fguard->Iex.Const.con->Ico.U1 == True);
+                /* The load is always going to happen.  We want to
+                   convert to an unconditional load and assign to 'dst'
+                   (IRStmt_WrTmp).  Problem is we need an extra temp to
+                   hold the loaded value, but none is available.
+                   Instead, reconstitute the conditional load (with
+                   folded args, of course) and let the caller of this
+                   routine deal with the problem. */
+             }
+          }
+          return IRStmt_LoadG(lg->end, lg->cvt, lg->dst, faddr, falt, fguard);
+       }
+ 
         case Ist_CAS: {
            IRCAS *cas, *cas2;
            cas = st->Ist.CAS.details;
diff --cc VEX/pub/libvex_ir.h

index 1a34ca311d6c5a58fa787d320252097eb795e86b,715d85d0704500d9c310aab31161da2b7e368ff2..c132995320b1141493cf894fdca6bece5cd5a281
--- 1/VEX/pub/libvex_ir.h
--- 2/VEX/pub/libvex_ir.h
+++ b/VEX/pub/libvex_ir.h
@@@ -1980,12 -1920,13 +1981,12 @@@ extern void ppIRJumpKind ( IRJumpKind )
      In order that instrumentation is possible, the call must state, and
      state correctly:
   
-    * whether it reads, writes or modifies memory, and if so where
-      (only one chunk can be stated)
- -   * whether it reads, writes or modifies memory, and if so where Only
- -     one chunk can be stated, although it is allowed to repeat some
- -     number of times at a fixed interval.
++   * Whether it reads, writes or modifies memory, and if so where.
   
--   * whether it reads, writes or modifies guest state, and if so which
-      pieces (several pieces may be stated, and currently their extents
-      must be known at translation-time).
++   * Whether it reads, writes or modifies guest state, and if so which
+      pieces.  Several pieces may be stated, and their extents must be
- -     known at translation-time.
++     known at translation-time.  Each piece is allowed to repeat some
++     number of times at a fixed interval, if required.
   
      Normally, code is generated to pass just the args to the helper.
      However, if .needsBBP is set, then an extra first argument is
author	Julian Seward <jseward@acm.org>
	Thu, 17 Jan 2013 14:23:53 +0000 (14:23 +0000)
committer	Julian Seward <jseward@acm.org>
	Thu, 17 Jan 2013 14:23:53 +0000 (14:23 +0000)
		1	2
VEX/priv/guest_arm_toIR.c	patch \|	diff1 \|	diff2 \|	blob \| history
VEX/priv/host_amd64_isel.c	patch \|	diff1 \|	diff2 \|	blob \| history
VEX/priv/host_arm_isel.c	patch \|	diff1 \|	diff2 \|	blob \| history
VEX/priv/host_ppc_isel.c	patch \|	diff1 \|	diff2 \|	blob \| history
VEX/priv/host_s390_defs.c	patch \|	diff1 \|	diff2 \|	blob \| history
VEX/priv/ir_defs.c	patch \|	diff1 \|	diff2 \|	blob \| history
VEX/priv/ir_opt.c	patch \|	diff1 \|	diff2 \|	blob \| history
VEX/pub/libvex_ir.h	patch \|	diff1 \|	diff2 \|	blob \| history