git.ipfire.org Git - thirdparty/gcc.git/commitdiff
backport: re PR target/61423 (Incorrect conversion from unsigned int to floating...
author Uros Bizjak <ubizjak@gmail.com>
Wed, 18 Jun 2014 20:01:37 +0000 (22:01 +0200)
committer Uros Bizjak <uros@gcc.gnu.org>
Wed, 18 Jun 2014 20:01:37 +0000 (22:01 +0200)
Backport from mainline
2014-06-06  Uros Bizjak  <ubizjak@gmail.com>

PR target/61423
* config/i386/i386.md (*floatunssi<mode>2_i387_with_xmm): New
define_insn_and_split pattern, merged from *floatunssi<mode>2_1
and corresponding splitters.  Zero extend general register
or memory input operand to XMM temporary.  Enable for
TARGET_SSE2 and TARGET_INTER_UNIT_MOVES_TO_VEC only.
(floatunssi<mode>2): Update expander predicate.

testsuite/ChangeLog:

Backport from mainline
2014-06-13  Ilya Enkovich  <ilya.enkovich@intel.com>

PR rtl-optimization/61094
PR rtl-optimization/61446
* gcc.target/i386/pr61446.c : New.

Backport from mainline
2014-06-06  Uros Bizjak  <ubizjak@gmail.com>

PR target/61423
* gcc.target/i386/pr61423.c: New test.

From-SVN: r211803

gcc/ChangeLog
gcc/config/i386/i386.md
gcc/testsuite/ChangeLog
gcc/testsuite/gcc.target/i386/pr61423.c [new file with mode: 0644]
gcc/testsuite/gcc.target/i386/pr61446.c [new file with mode: 0644]

index 0652ed5f3c6512c3c54c3c79ed3ab60fb538cb4d..c9bcd2abc4c2152098feafaabc4eee89e13f7127 100644 (file)
@@ -1,3 +1,16 @@
+2014-06-18  Uros Bizjak  <ubizjak@gmail.com>
+
+       Backport from mainline
+       2014-06-06  Uros Bizjak  <ubizjak@gmail.com>
+
+       PR target/61423
+       * config/i386/i386.md (*floatunssi<mode>2_i387_with_xmm): New
+       define_insn_and_split pattern, merged from *floatunssi<mode>2_1
+       and corresponding splitters.  Zero extend general register
+       or memory input operand to XMM temporary.  Enable for
+       TARGET_SSE2 and TARGET_INTER_UNIT_MOVES_TO_VEC only.
+       (floatunssi<mode>2): Update expander predicate.
+
 2014-06-18  Richard Henderson  <rth@redhat.com>
 
        PR target/61545
index 891d4d4f3edb83574e6fdbee1dfce7deb1c8fa45..d5055943f136b703f920025839ddd759ae91b93c 100644 (file)
 
 ;; Avoid store forwarding (partial memory) stall penalty by extending
 ;; SImode value to DImode through XMM register instead of pushing two
-;; SImode values to stack. Note that even !TARGET_INTER_UNIT_MOVES
-;; targets benefit from this optimization. Also note that fild
-;; loads from memory only.
+;; SImode values to stack. Also note that fild loads from memory only.
 
-(define_insn "*floatunssi<mode>2_1"
-  [(set (match_operand:X87MODEF 0 "register_operand" "=f,f")
+(define_insn_and_split "*floatunssi<mode>2_i387_with_xmm"
+  [(set (match_operand:X87MODEF 0 "register_operand" "=f")
        (unsigned_float:X87MODEF
-         (match_operand:SI 1 "nonimmediate_operand" "x,m")))
-   (clobber (match_operand:DI 2 "memory_operand" "=m,m"))
-   (clobber (match_scratch:SI 3 "=X,x"))]
+         (match_operand:SI 1 "nonimmediate_operand" "rm")))
+   (clobber (match_scratch:DI 3 "=x"))
+   (clobber (match_operand:DI 2 "memory_operand" "=m"))]
   "!TARGET_64BIT
    && TARGET_80387 && X87_ENABLE_FLOAT (<X87MODEF:MODE>mode, DImode)
-   && TARGET_SSE"
+   && TARGET_SSE2 && TARGET_INTER_UNIT_MOVES"
   "#"
-  [(set_attr "type" "multi")
-   (set_attr "mode" "<MODE>")])
-
-(define_split
-  [(set (match_operand:X87MODEF 0 "register_operand")
-       (unsigned_float:X87MODEF
-         (match_operand:SI 1 "register_operand")))
-   (clobber (match_operand:DI 2 "memory_operand"))
-   (clobber (match_scratch:SI 3))]
-  "!TARGET_64BIT
-   && TARGET_80387 && X87_ENABLE_FLOAT (<X87MODEF:MODE>mode, DImode)
-   && TARGET_SSE
-   && reload_completed"
-  [(set (match_dup 2) (match_dup 1))
-   (set (match_dup 0)
-       (float:X87MODEF (match_dup 2)))]
-  "operands[1] = simplify_gen_subreg (DImode, operands[1], SImode, 0);")
-
-(define_split
-  [(set (match_operand:X87MODEF 0 "register_operand")
-       (unsigned_float:X87MODEF
-         (match_operand:SI 1 "memory_operand")))
-   (clobber (match_operand:DI 2 "memory_operand"))
-   (clobber (match_scratch:SI 3))]
-  "!TARGET_64BIT
-   && TARGET_80387 && X87_ENABLE_FLOAT (<X87MODEF:MODE>mode, DImode)
-   && TARGET_SSE
-   && reload_completed"
-  [(set (match_dup 2) (match_dup 3))
+  "&& reload_completed"
+  [(set (match_dup 3) (zero_extend:DI (match_dup 1)))
+   (set (match_dup 2) (match_dup 3))
    (set (match_dup 0)
        (float:X87MODEF (match_dup 2)))]
-{
-  emit_move_insn (operands[3], operands[1]);
-  operands[3] = simplify_gen_subreg (DImode, operands[3], SImode, 0);
-})
+  ""
+  [(set_attr "type" "multi")
+   (set_attr "mode" "<MODE>")])
 
 (define_expand "floatunssi<mode>2"
   [(parallel
      [(set (match_operand:X87MODEF 0 "register_operand")
           (unsigned_float:X87MODEF
             (match_operand:SI 1 "nonimmediate_operand")))
-      (clobber (match_dup 2))
-      (clobber (match_scratch:SI 3))])]
+      (clobber (match_scratch:DI 3))
+      (clobber (match_dup 2))])]
   "!TARGET_64BIT
    && ((TARGET_80387 && X87_ENABLE_FLOAT (<X87MODEF:MODE>mode, DImode)
-       && TARGET_SSE)
+       && TARGET_SSE2 && TARGET_INTER_UNIT_MOVES)
        || (SSE_FLOAT_MODE_P (<MODE>mode) && TARGET_SSE_MATH))"
 {
   if (SSE_FLOAT_MODE_P (<MODE>mode) && TARGET_SSE_MATH)
index 8418873c3d9a63f63cfff7de10cb1c9e24055376..5ff54daac1409215b40fae9eadbd7b5a2e959283 100644 (file)
@@ -1,3 +1,18 @@
+2014-06-18  Uros Bizjak  <ubizjak@gmail.com>
+
+       Backport from mainline
+       2014-06-13  Ilya Enkovich  <ilya.enkovich@intel.com>
+
+       PR rtl-optimization/61094
+       PR rtl-optimization/61446
+       * gcc.target/i386/pr61446.c : New.
+
+       Backport from mainline
+       2014-06-06  Uros Bizjak  <ubizjak@gmail.com>
+
+       PR target/61423
+       * gcc.target/i386/pr61423.c: New test.
+
 2014-06-17  Yufeng Zhang  <yufeng.zhang@arm.com>
 
        Backport from mainline
diff --git a/gcc/testsuite/gcc.target/i386/pr61423.c b/gcc/testsuite/gcc.target/i386/pr61423.c
new file mode 100644 (file)
index 0000000..5b538a2
--- /dev/null
@@ -0,0 +1,38 @@
+/* PR target/61423 */
+/* { dg-do run { target ia32 } } */
+/* { dg-options "-O1 -ftree-vectorize -msse2 -mfpmath=387 -mtune=core2" } */
+
+#define N 1024
+static unsigned int A[N];
+
+double
+__attribute__((noinline))
+func (void)
+{
+  unsigned int sum = 0;
+  unsigned i;
+  double t;
+
+  for (i = 0; i < N; i++)
+    sum += A[i];
+
+  t = sum;
+  return t;
+}
+
+int
+main ()
+{
+  unsigned i;
+  double d;
+
+  for(i = 0; i < N; i++)
+    A[i] = 1;
+
+  d = func();
+
+  if (d != 1024.0)
+    __builtin_abort ();
+
+  return 0;
+}
diff --git a/gcc/testsuite/gcc.target/i386/pr61446.c b/gcc/testsuite/gcc.target/i386/pr61446.c
new file mode 100644 (file)
index 0000000..fc32f63
--- /dev/null
@@ -0,0 +1,14 @@
+/* PR rtl-optimization/61446 */
+
+/* { dg-do compile { target { ia32 } } } */
+/* { dg-options "-O2 -march=corei7 -mfpmath=387" } */
+
+unsigned long long
+foo (float a)
+{
+  const double dfa = a;
+  const unsigned int hi = dfa / 0x1p32f;
+  const unsigned int lo = dfa - (double) hi * 0x1p32f;
+
+  return ((unsigned long long) hi << (4 * (8))) | lo;
+}