gcc/optabs.c

   1 /* Expand the basic unary and binary arithmetic operations, for GNU compiler.
   2    Copyright (C) 1987-2017 Free Software Foundation, Inc.
   3
   4 This file is part of GCC.
   5
   6 GCC is free software; you can redistribute it and/or modify it under
   7 the terms of the GNU General Public License as published by the Free
   8 Software Foundation; either version 3, or (at your option) any later
   9 version.
  10
  11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  14 for more details.
  15
  16 You should have received a copy of the GNU General Public License
  17 along with GCC; see the file COPYING3.  If not see
  18 <http://www.gnu.org/licenses/>.  */
  19
  20
  21 #include "config.h"
  22 #include "system.h"
  23 #include "coretypes.h"
  24 #include "backend.h"
  25 #include "target.h"
  26 #include "rtl.h"
  27 #include "tree.h"
  28 #include "memmodel.h"
  29 #include "predict.h"
  30 #include "tm_p.h"
  31 #include "expmed.h"
  32 #include "optabs.h"
  33 #include "emit-rtl.h"
  34 #include "recog.h"
  35 #include "diagnostic-core.h"
  36
  37 /* Include insn-config.h before expr.h so that HAVE_conditional_move
  38    is properly defined.  */
  39 #include "stor-layout.h"
  40 #include "except.h"
  41 #include "dojump.h"
  42 #include "explow.h"
  43 #include "expr.h"
  44 #include "optabs-tree.h"
  45 #include "libfuncs.h"
  46
  47 static void prepare_float_lib_cmp (rtx, rtx, enum rtx_code, rtx *,
  48                                    machine_mode *);
  49 static rtx expand_unop_direct (machine_mode, optab, rtx, rtx, int);
  50 static void emit_libcall_block_1 (rtx_insn *, rtx, rtx, rtx, bool);
  51
  52 /* Debug facility for use in GDB.  */
  53 void debug_optab_libfuncs (void);
  54 \f
  55 /* Add a REG_EQUAL note to the last insn in INSNS.  TARGET is being set to
  56    the result of operation CODE applied to OP0 (and OP1 if it is a binary
  57    operation).
  58
  59    If the last insn does not set TARGET, don't do anything, but return 1.
  60
  61    If the last insn or a previous insn sets TARGET and TARGET is one of OP0
  62    or OP1, don't add the REG_EQUAL note but return 0.  Our caller can then
  63    try again, ensuring that TARGET is not one of the operands.  */
  64
  65 static int
  66 add_equal_note (rtx_insn *insns, rtx target, enum rtx_code code, rtx op0, rtx op1)
  67 {
  68   rtx_insn *last_insn;
  69   rtx set;
  70   rtx note;
  71
  72   gcc_assert (insns && INSN_P (insns) && NEXT_INSN (insns));
  73
  74   if (GET_RTX_CLASS (code) != RTX_COMM_ARITH
  75       && GET_RTX_CLASS (code) != RTX_BIN_ARITH
  76       && GET_RTX_CLASS (code) != RTX_COMM_COMPARE
  77       && GET_RTX_CLASS (code) != RTX_COMPARE
  78       && GET_RTX_CLASS (code) != RTX_UNARY)
  79     return 1;
  80
  81   if (GET_CODE (target) == ZERO_EXTRACT)
  82     return 1;
  83
  84   for (last_insn = insns;
  85        NEXT_INSN (last_insn) != NULL_RTX;
  86        last_insn = NEXT_INSN (last_insn))
  87     ;
  88
  89   /* If TARGET is in OP0 or OP1, punt.  We'd end up with a note referencing
  90      a value changing in the insn, so the note would be invalid for CSE.  */
  91   if (reg_overlap_mentioned_p (target, op0)
  92       || (op1 && reg_overlap_mentioned_p (target, op1)))
  93     {
  94       if (MEM_P (target)
  95           && (rtx_equal_p (target, op0)
  96               || (op1 && rtx_equal_p (target, op1))))
  97         {
  98           /* For MEM target, with MEM = MEM op X, prefer no REG_EQUAL note
  99              over expanding it as temp = MEM op X, MEM = temp.  If the target
 100              supports MEM = MEM op X instructions, it is sometimes too hard
 101              to reconstruct that form later, especially if X is also a memory,
 102              and due to multiple occurrences of addresses the address might
 103              be forced into register unnecessarily.
 104              Note that not emitting the REG_EQUIV note might inhibit
 105              CSE in some cases.  */
 106           set = single_set (last_insn);
 107           if (set
 108               && GET_CODE (SET_SRC (set)) == code
 109               && MEM_P (SET_DEST (set))
 110               && (rtx_equal_p (SET_DEST (set), XEXP (SET_SRC (set), 0))
 111                   || (op1 && rtx_equal_p (SET_DEST (set),
 112                                           XEXP (SET_SRC (set), 1)))))
 113             return 1;
 114         }
 115       return 0;
 116     }
 117
 118   set = set_for_reg_notes (last_insn);
 119   if (set == NULL_RTX)
 120     return 1;
 121
 122   if (! rtx_equal_p (SET_DEST (set), target)
 123       /* For a STRICT_LOW_PART, the REG_NOTE applies to what is inside it.  */
 124       && (GET_CODE (SET_DEST (set)) != STRICT_LOW_PART
 125           || ! rtx_equal_p (XEXP (SET_DEST (set), 0), target)))
 126     return 1;
 127
 128   if (GET_RTX_CLASS (code) == RTX_UNARY)
 129     switch (code)
 130       {
 131       case FFS:
 132       case CLZ:
 133       case CTZ:
 134       case CLRSB:
 135       case POPCOUNT:
 136       case PARITY:
 137       case BSWAP:
 138         if (GET_MODE (op0) != VOIDmode && GET_MODE (target) != GET_MODE (op0))
 139           {
 140             note = gen_rtx_fmt_e (code, GET_MODE (op0), copy_rtx (op0));
 141             if (GET_MODE_SIZE (GET_MODE (op0))
 142                 > GET_MODE_SIZE (GET_MODE (target)))
 143               note = simplify_gen_unary (TRUNCATE, GET_MODE (target),
 144                                          note, GET_MODE (op0));
 145             else
 146               note = simplify_gen_unary (ZERO_EXTEND, GET_MODE (target),
 147                                          note, GET_MODE (op0));
 148             break;
 149           }
 150         /* FALLTHRU */
 151       default:
 152         note = gen_rtx_fmt_e (code, GET_MODE (target), copy_rtx (op0));
 153         break;
 154       }
 155   else
 156     note = gen_rtx_fmt_ee (code, GET_MODE (target), copy_rtx (op0), copy_rtx (op1));
 157
 158   set_unique_reg_note (last_insn, REG_EQUAL, note);
 159
 160   return 1;
 161 }
 162 \f
 163 /* Given two input operands, OP0 and OP1, determine what the correct from_mode
 164    for a widening operation would be.  In most cases this would be OP0, but if
 165    that's a constant it'll be VOIDmode, which isn't useful.  */
 166
 167 static machine_mode
 168 widened_mode (machine_mode to_mode, rtx op0, rtx op1)
 169 {
 170   machine_mode m0 = GET_MODE (op0);
 171   machine_mode m1 = GET_MODE (op1);
 172   machine_mode result;
 173
 174   if (m0 == VOIDmode && m1 == VOIDmode)
 175     return to_mode;
 176   else if (m0 == VOIDmode || GET_MODE_SIZE (m0) < GET_MODE_SIZE (m1))
 177     result = m1;
 178   else
 179     result = m0;
 180
 181   if (GET_MODE_SIZE (result) > GET_MODE_SIZE (to_mode))
 182     return to_mode;
 183
 184   return result;
 185 }
 186 \f
 187 /* Widen OP to MODE and return the rtx for the widened operand.  UNSIGNEDP
 188    says whether OP is signed or unsigned.  NO_EXTEND is nonzero if we need
 189    not actually do a sign-extend or zero-extend, but can leave the
 190    higher-order bits of the result rtx undefined, for example, in the case
 191    of logical operations, but not right shifts.  */
 192
 193 static rtx
 194 widen_operand (rtx op, machine_mode mode, machine_mode oldmode,
 195                int unsignedp, int no_extend)
 196 {
 197   rtx result;
 198   scalar_int_mode int_mode;
 199
 200   /* If we don't have to extend and this is a constant, return it.  */
 201   if (no_extend && GET_MODE (op) == VOIDmode)
 202     return op;
 203
 204   /* If we must extend do so.  If OP is a SUBREG for a promoted object, also
 205      extend since it will be more efficient to do so unless the signedness of
 206      a promoted object differs from our extension.  */
 207   if (! no_extend
 208       || !is_a <scalar_int_mode> (mode, &int_mode)
 209       || (GET_CODE (op) == SUBREG && SUBREG_PROMOTED_VAR_P (op)
 210           && SUBREG_CHECK_PROMOTED_SIGN (op, unsignedp)))
 211     return convert_modes (mode, oldmode, op, unsignedp);
 212
 213   /* If MODE is no wider than a single word, we return a lowpart or paradoxical
 214      SUBREG.  */
 215   if (GET_MODE_SIZE (int_mode) <= UNITS_PER_WORD)
 216     return gen_lowpart (int_mode, force_reg (GET_MODE (op), op));
 217
 218   /* Otherwise, get an object of MODE, clobber it, and set the low-order
 219      part to OP.  */
 220
 221   result = gen_reg_rtx (int_mode);
 222   emit_clobber (result);
 223   emit_move_insn (gen_lowpart (GET_MODE (op), result), op);
 224   return result;
 225 }
 226 \f
 227 /* Expand vector widening operations.
 228
 229    There are two different classes of operations handled here:
 230    1) Operations whose result is wider than all the arguments to the operation.
 231       Examples: VEC_UNPACK_HI/LO_EXPR, VEC_WIDEN_MULT_HI/LO_EXPR
 232       In this case OP0 and optionally OP1 would be initialized,
 233       but WIDE_OP wouldn't (not relevant for this case).
 234    2) Operations whose result is of the same size as the last argument to the
 235       operation, but wider than all the other arguments to the operation.
 236       Examples: WIDEN_SUM_EXPR, VEC_DOT_PROD_EXPR.
 237       In the case WIDE_OP, OP0 and optionally OP1 would be initialized.
 238
 239    E.g, when called to expand the following operations, this is how
 240    the arguments will be initialized:
 241                                 nops    OP0     OP1     WIDE_OP
 242    widening-sum                 2       oprnd0  -       oprnd1
 243    widening-dot-product         3       oprnd0  oprnd1  oprnd2
 244    widening-mult                2       oprnd0  oprnd1  -
 245    type-promotion (vec-unpack)  1       oprnd0  -       -  */
 246
 247 rtx
 248 expand_widen_pattern_expr (sepops ops, rtx op0, rtx op1, rtx wide_op,
 249                            rtx target, int unsignedp)
 250 {
 251   struct expand_operand eops[4];
 252   tree oprnd0, oprnd1, oprnd2;
 253   machine_mode wmode = VOIDmode, tmode0, tmode1 = VOIDmode;
 254   optab widen_pattern_optab;
 255   enum insn_code icode;
 256   int nops = TREE_CODE_LENGTH (ops->code);
 257   int op;
 258
 259   oprnd0 = ops->op0;
 260   tmode0 = TYPE_MODE (TREE_TYPE (oprnd0));
 261   widen_pattern_optab =
 262     optab_for_tree_code (ops->code, TREE_TYPE (oprnd0), optab_default);
 263   if (ops->code == WIDEN_MULT_PLUS_EXPR
 264       || ops->code == WIDEN_MULT_MINUS_EXPR)
 265     icode = find_widening_optab_handler (widen_pattern_optab,
 266                                          TYPE_MODE (TREE_TYPE (ops->op2)),
 267                                          tmode0, 0);
 268   else
 269     icode = optab_handler (widen_pattern_optab, tmode0);
 270   gcc_assert (icode != CODE_FOR_nothing);
 271
 272   if (nops >= 2)
 273     {
 274       oprnd1 = ops->op1;
 275       tmode1 = TYPE_MODE (TREE_TYPE (oprnd1));
 276     }
 277
 278   /* The last operand is of a wider mode than the rest of the operands.  */
 279   if (nops == 2)
 280     wmode = tmode1;
 281   else if (nops == 3)
 282     {
 283       gcc_assert (tmode1 == tmode0);
 284       gcc_assert (op1);
 285       oprnd2 = ops->op2;
 286       wmode = TYPE_MODE (TREE_TYPE (oprnd2));
 287     }
 288
 289   op = 0;
 290   create_output_operand (&eops[op++], target, TYPE_MODE (ops->type));
 291   create_convert_operand_from (&eops[op++], op0, tmode0, unsignedp);
 292   if (op1)
 293     create_convert_operand_from (&eops[op++], op1, tmode1, unsignedp);
 294   if (wide_op)
 295     create_convert_operand_from (&eops[op++], wide_op, wmode, unsignedp);
 296   expand_insn (icode, op, eops);
 297   return eops[0].value;
 298 }
 299
 300 /* Generate code to perform an operation specified by TERNARY_OPTAB
 301    on operands OP0, OP1 and OP2, with result having machine-mode MODE.
 302
 303    UNSIGNEDP is for the case where we have to widen the operands
 304    to perform the operation.  It says to use zero-extension.
 305
 306    If TARGET is nonzero, the value
 307    is generated there, if it is convenient to do so.
 308    In all cases an rtx is returned for the locus of the value;
 309    this may or may not be TARGET.  */
 310
 311 rtx
 312 expand_ternary_op (machine_mode mode, optab ternary_optab, rtx op0,
 313                    rtx op1, rtx op2, rtx target, int unsignedp)
 314 {
 315   struct expand_operand ops[4];
 316   enum insn_code icode = optab_handler (ternary_optab, mode);
 317
 318   gcc_assert (optab_handler (ternary_optab, mode) != CODE_FOR_nothing);
 319
 320   create_output_operand (&ops[0], target, mode);
 321   create_convert_operand_from (&ops[1], op0, mode, unsignedp);
 322   create_convert_operand_from (&ops[2], op1, mode, unsignedp);
 323   create_convert_operand_from (&ops[3], op2, mode, unsignedp);
 324   expand_insn (icode, 4, ops);
 325   return ops[0].value;
 326 }
 327
 328
 329 /* Like expand_binop, but return a constant rtx if the result can be
 330    calculated at compile time.  The arguments and return value are
 331    otherwise the same as for expand_binop.  */
 332
 333 rtx
 334 simplify_expand_binop (machine_mode mode, optab binoptab,
 335                        rtx op0, rtx op1, rtx target, int unsignedp,
 336                        enum optab_methods methods)
 337 {
 338   if (CONSTANT_P (op0) && CONSTANT_P (op1))
 339     {
 340       rtx x = simplify_binary_operation (optab_to_code (binoptab),
 341                                          mode, op0, op1);
 342       if (x)
 343         return x;
 344     }
 345
 346   return expand_binop (mode, binoptab, op0, op1, target, unsignedp, methods);
 347 }
 348
 349 /* Like simplify_expand_binop, but always put the result in TARGET.
 350    Return true if the expansion succeeded.  */
 351
 352 bool
 353 force_expand_binop (machine_mode mode, optab binoptab,
 354                     rtx op0, rtx op1, rtx target, int unsignedp,
 355                     enum optab_methods methods)
 356 {
 357   rtx x = simplify_expand_binop (mode, binoptab, op0, op1,
 358                                  target, unsignedp, methods);
 359   if (x == 0)
 360     return false;
 361   if (x != target)
 362     emit_move_insn (target, x);
 363   return true;
 364 }
 365
 366 /* Create a new vector value in VMODE with all elements set to OP.  The
 367    mode of OP must be the element mode of VMODE.  If OP is a constant,
 368    then the return value will be a constant.  */
 369
 370 static rtx
 371 expand_vector_broadcast (machine_mode vmode, rtx op)
 372 {
 373   enum insn_code icode;
 374   rtvec vec;
 375   rtx ret;
 376   int i, n;
 377
 378   gcc_checking_assert (VECTOR_MODE_P (vmode));
 379
 380   n = GET_MODE_NUNITS (vmode);
 381   vec = rtvec_alloc (n);
 382   for (i = 0; i < n; ++i)
 383     RTVEC_ELT (vec, i) = op;
 384
 385   if (CONSTANT_P (op))
 386     return gen_rtx_CONST_VECTOR (vmode, vec);
 387
 388   /* ??? If the target doesn't have a vec_init, then we have no easy way
 389      of performing this operation.  Most of this sort of generic support
 390      is hidden away in the vector lowering support in gimple.  */
 391   icode = convert_optab_handler (vec_init_optab, vmode,
 392                                  GET_MODE_INNER (vmode));
 393   if (icode == CODE_FOR_nothing)
 394     return NULL;
 395
 396   ret = gen_reg_rtx (vmode);
 397   emit_insn (GEN_FCN (icode) (ret, gen_rtx_PARALLEL (vmode, vec)));
 398
 399   return ret;
 400 }
 401
 402 /* This subroutine of expand_doubleword_shift handles the cases in which
 403    the effective shift value is >= BITS_PER_WORD.  The arguments and return
 404    value are the same as for the parent routine, except that SUPERWORD_OP1
 405    is the shift count to use when shifting OUTOF_INPUT into INTO_TARGET.
 406    INTO_TARGET may be null if the caller has decided to calculate it.  */
 407
 408 static bool
 409 expand_superword_shift (optab binoptab, rtx outof_input, rtx superword_op1,
 410                         rtx outof_target, rtx into_target,
 411                         int unsignedp, enum optab_methods methods)
 412 {
 413   if (into_target != 0)
 414     if (!force_expand_binop (word_mode, binoptab, outof_input, superword_op1,
 415                              into_target, unsignedp, methods))
 416       return false;
 417
 418   if (outof_target != 0)
 419     {
 420       /* For a signed right shift, we must fill OUTOF_TARGET with copies
 421          of the sign bit, otherwise we must fill it with zeros.  */
 422       if (binoptab != ashr_optab)
 423         emit_move_insn (outof_target, CONST0_RTX (word_mode));
 424       else
 425         if (!force_expand_binop (word_mode, binoptab,
 426                                  outof_input, GEN_INT (BITS_PER_WORD - 1),
 427                                  outof_target, unsignedp, methods))
 428           return false;
 429     }
 430   return true;
 431 }
 432
 433 /* This subroutine of expand_doubleword_shift handles the cases in which
 434    the effective shift value is < BITS_PER_WORD.  The arguments and return
 435    value are the same as for the parent routine.  */
 436
 437 static bool
 438 expand_subword_shift (scalar_int_mode op1_mode, optab binoptab,
 439                       rtx outof_input, rtx into_input, rtx op1,
 440                       rtx outof_target, rtx into_target,
 441                       int unsignedp, enum optab_methods methods,
 442                       unsigned HOST_WIDE_INT shift_mask)
 443 {
 444   optab reverse_unsigned_shift, unsigned_shift;
 445   rtx tmp, carries;
 446
 447   reverse_unsigned_shift = (binoptab == ashl_optab ? lshr_optab : ashl_optab);
 448   unsigned_shift = (binoptab == ashl_optab ? ashl_optab : lshr_optab);
 449
 450   /* The low OP1 bits of INTO_TARGET come from the high bits of OUTOF_INPUT.
 451      We therefore need to shift OUTOF_INPUT by (BITS_PER_WORD - OP1) bits in
 452      the opposite direction to BINOPTAB.  */
 453   if (CONSTANT_P (op1) || shift_mask >= BITS_PER_WORD)
 454     {
 455       carries = outof_input;
 456       tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD,
 457                                             op1_mode), op1_mode);
 458       tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
 459                                    0, true, methods);
 460     }
 461   else
 462     {
 463       /* We must avoid shifting by BITS_PER_WORD bits since that is either
 464          the same as a zero shift (if shift_mask == BITS_PER_WORD - 1) or
 465          has unknown behavior.  Do a single shift first, then shift by the
 466          remainder.  It's OK to use ~OP1 as the remainder if shift counts
 467          are truncated to the mode size.  */
 468       carries = expand_binop (word_mode, reverse_unsigned_shift,
 469                               outof_input, const1_rtx, 0, unsignedp, methods);
 470       if (shift_mask == BITS_PER_WORD - 1)
 471         {
 472           tmp = immed_wide_int_const
 473             (wi::minus_one (GET_MODE_PRECISION (op1_mode)), op1_mode);
 474           tmp = simplify_expand_binop (op1_mode, xor_optab, op1, tmp,
 475                                        0, true, methods);
 476         }
 477       else
 478         {
 479           tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD - 1,
 480                                                 op1_mode), op1_mode);
 481           tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
 482                                        0, true, methods);
 483         }
 484     }
 485   if (tmp == 0 || carries == 0)
 486     return false;
 487   carries = expand_binop (word_mode, reverse_unsigned_shift,
 488                           carries, tmp, 0, unsignedp, methods);
 489   if (carries == 0)
 490     return false;
 491
 492   /* Shift INTO_INPUT logically by OP1.  This is the last use of INTO_INPUT
 493      so the result can go directly into INTO_TARGET if convenient.  */
 494   tmp = expand_binop (word_mode, unsigned_shift, into_input, op1,
 495                       into_target, unsignedp, methods);
 496   if (tmp == 0)
 497     return false;
 498
 499   /* Now OR in the bits carried over from OUTOF_INPUT.  */
 500   if (!force_expand_binop (word_mode, ior_optab, tmp, carries,
 501                            into_target, unsignedp, methods))
 502     return false;
 503
 504   /* Use a standard word_mode shift for the out-of half.  */
 505   if (outof_target != 0)
 506     if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
 507                              outof_target, unsignedp, methods))
 508       return false;
 509
 510   return true;
 511 }
 512
 513
 514 /* Try implementing expand_doubleword_shift using conditional moves.
 515    The shift is by < BITS_PER_WORD if (CMP_CODE CMP1 CMP2) is true,
 516    otherwise it is by >= BITS_PER_WORD.  SUBWORD_OP1 and SUPERWORD_OP1
 517    are the shift counts to use in the former and latter case.  All other
 518    arguments are the same as the parent routine.  */
 519
 520 static bool
 521 expand_doubleword_shift_condmove (scalar_int_mode op1_mode, optab binoptab,
 522                                   enum rtx_code cmp_code, rtx cmp1, rtx cmp2,
 523                                   rtx outof_input, rtx into_input,
 524                                   rtx subword_op1, rtx superword_op1,
 525                                   rtx outof_target, rtx into_target,
 526                                   int unsignedp, enum optab_methods methods,
 527                                   unsigned HOST_WIDE_INT shift_mask)
 528 {
 529   rtx outof_superword, into_superword;
 530
 531   /* Put the superword version of the output into OUTOF_SUPERWORD and
 532      INTO_SUPERWORD.  */
 533   outof_superword = outof_target != 0 ? gen_reg_rtx (word_mode) : 0;
 534   if (outof_target != 0 && subword_op1 == superword_op1)
 535     {
 536       /* The value INTO_TARGET >> SUBWORD_OP1, which we later store in
 537          OUTOF_TARGET, is the same as the value of INTO_SUPERWORD.  */
 538       into_superword = outof_target;
 539       if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 540                                    outof_superword, 0, unsignedp, methods))
 541         return false;
 542     }
 543   else
 544     {
 545       into_superword = gen_reg_rtx (word_mode);
 546       if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 547                                    outof_superword, into_superword,
 548                                    unsignedp, methods))
 549         return false;
 550     }
 551
 552   /* Put the subword version directly in OUTOF_TARGET and INTO_TARGET.  */
 553   if (!expand_subword_shift (op1_mode, binoptab,
 554                              outof_input, into_input, subword_op1,
 555                              outof_target, into_target,
 556                              unsignedp, methods, shift_mask))
 557     return false;
 558
 559   /* Select between them.  Do the INTO half first because INTO_SUPERWORD
 560      might be the current value of OUTOF_TARGET.  */
 561   if (!emit_conditional_move (into_target, cmp_code, cmp1, cmp2, op1_mode,
 562                               into_target, into_superword, word_mode, false))
 563     return false;
 564
 565   if (outof_target != 0)
 566     if (!emit_conditional_move (outof_target, cmp_code, cmp1, cmp2, op1_mode,
 567                                 outof_target, outof_superword,
 568                                 word_mode, false))
 569       return false;
 570
 571   return true;
 572 }
 573
 574 /* Expand a doubleword shift (ashl, ashr or lshr) using word-mode shifts.
 575    OUTOF_INPUT and INTO_INPUT are the two word-sized halves of the first
 576    input operand; the shift moves bits in the direction OUTOF_INPUT->
 577    INTO_TARGET.  OUTOF_TARGET and INTO_TARGET are the equivalent words
 578    of the target.  OP1 is the shift count and OP1_MODE is its mode.
 579    If OP1 is constant, it will have been truncated as appropriate
 580    and is known to be nonzero.
 581
 582    If SHIFT_MASK is zero, the result of word shifts is undefined when the
 583    shift count is outside the range [0, BITS_PER_WORD).  This routine must
 584    avoid generating such shifts for OP1s in the range [0, BITS_PER_WORD * 2).
 585
 586    If SHIFT_MASK is nonzero, all word-mode shift counts are effectively
 587    masked by it and shifts in the range [BITS_PER_WORD, SHIFT_MASK) will
 588    fill with zeros or sign bits as appropriate.
 589
 590    If SHIFT_MASK is BITS_PER_WORD - 1, this routine will synthesize
 591    a doubleword shift whose equivalent mask is BITS_PER_WORD * 2 - 1.
 592    Doing this preserves semantics required by SHIFT_COUNT_TRUNCATED.
 593    In all other cases, shifts by values outside [0, BITS_PER_UNIT * 2)
 594    are undefined.
 595
 596    BINOPTAB, UNSIGNEDP and METHODS are as for expand_binop.  This function
 597    may not use INTO_INPUT after modifying INTO_TARGET, and similarly for
 598    OUTOF_INPUT and OUTOF_TARGET.  OUTOF_TARGET can be null if the parent
 599    function wants to calculate it itself.
 600
 601    Return true if the shift could be successfully synthesized.  */
 602
 603 static bool
 604 expand_doubleword_shift (scalar_int_mode op1_mode, optab binoptab,
 605                          rtx outof_input, rtx into_input, rtx op1,
 606                          rtx outof_target, rtx into_target,
 607                          int unsignedp, enum optab_methods methods,
 608                          unsigned HOST_WIDE_INT shift_mask)
 609 {
 610   rtx superword_op1, tmp, cmp1, cmp2;
 611   enum rtx_code cmp_code;
 612
 613   /* See if word-mode shifts by BITS_PER_WORD...BITS_PER_WORD * 2 - 1 will
 614      fill the result with sign or zero bits as appropriate.  If so, the value
 615      of OUTOF_TARGET will always be (SHIFT OUTOF_INPUT OP1).   Recursively call
 616      this routine to calculate INTO_TARGET (which depends on both OUTOF_INPUT
 617      and INTO_INPUT), then emit code to set up OUTOF_TARGET.
 618
 619      This isn't worthwhile for constant shifts since the optimizers will
 620      cope better with in-range shift counts.  */
 621   if (shift_mask >= BITS_PER_WORD
 622       && outof_target != 0
 623       && !CONSTANT_P (op1))
 624     {
 625       if (!expand_doubleword_shift (op1_mode, binoptab,
 626                                     outof_input, into_input, op1,
 627                                     0, into_target,
 628                                     unsignedp, methods, shift_mask))
 629         return false;
 630       if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
 631                                outof_target, unsignedp, methods))
 632         return false;
 633       return true;
 634     }
 635
 636   /* Set CMP_CODE, CMP1 and CMP2 so that the rtx (CMP_CODE CMP1 CMP2)
 637      is true when the effective shift value is less than BITS_PER_WORD.
 638      Set SUPERWORD_OP1 to the shift count that should be used to shift
 639      OUTOF_INPUT into INTO_TARGET when the condition is false.  */
 640   tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD, op1_mode), op1_mode);
 641   if (!CONSTANT_P (op1) && shift_mask == BITS_PER_WORD - 1)
 642     {
 643       /* Set CMP1 to OP1 & BITS_PER_WORD.  The result is zero iff OP1
 644          is a subword shift count.  */
 645       cmp1 = simplify_expand_binop (op1_mode, and_optab, op1, tmp,
 646                                     0, true, methods);
 647       cmp2 = CONST0_RTX (op1_mode);
 648       cmp_code = EQ;
 649       superword_op1 = op1;
 650     }
 651   else
 652     {
 653       /* Set CMP1 to OP1 - BITS_PER_WORD.  */
 654       cmp1 = simplify_expand_binop (op1_mode, sub_optab, op1, tmp,
 655                                     0, true, methods);
 656       cmp2 = CONST0_RTX (op1_mode);
 657       cmp_code = LT;
 658       superword_op1 = cmp1;
 659     }
 660   if (cmp1 == 0)
 661     return false;
 662
 663   /* If we can compute the condition at compile time, pick the
 664      appropriate subroutine.  */
 665   tmp = simplify_relational_operation (cmp_code, SImode, op1_mode, cmp1, cmp2);
 666   if (tmp != 0 && CONST_INT_P (tmp))
 667     {
 668       if (tmp == const0_rtx)
 669         return expand_superword_shift (binoptab, outof_input, superword_op1,
 670                                        outof_target, into_target,
 671                                        unsignedp, methods);
 672       else
 673         return expand_subword_shift (op1_mode, binoptab,
 674                                      outof_input, into_input, op1,
 675                                      outof_target, into_target,
 676                                      unsignedp, methods, shift_mask);
 677     }
 678
 679   /* Try using conditional moves to generate straight-line code.  */
 680   if (HAVE_conditional_move)
 681     {
 682       rtx_insn *start = get_last_insn ();
 683       if (expand_doubleword_shift_condmove (op1_mode, binoptab,
 684                                             cmp_code, cmp1, cmp2,
 685                                             outof_input, into_input,
 686                                             op1, superword_op1,
 687                                             outof_target, into_target,
 688                                             unsignedp, methods, shift_mask))
 689         return true;
 690       delete_insns_since (start);
 691     }
 692
 693   /* As a last resort, use branches to select the correct alternative.  */
 694   rtx_code_label *subword_label = gen_label_rtx ();
 695   rtx_code_label *done_label = gen_label_rtx ();
 696
 697   NO_DEFER_POP;
 698   do_compare_rtx_and_jump (cmp1, cmp2, cmp_code, false, op1_mode,
 699                            0, 0, subword_label,
 700                            profile_probability::uninitialized ());
 701   OK_DEFER_POP;
 702
 703   if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 704                                outof_target, into_target,
 705                                unsignedp, methods))
 706     return false;
 707
 708   emit_jump_insn (targetm.gen_jump (done_label));
 709   emit_barrier ();
 710   emit_label (subword_label);
 711
 712   if (!expand_subword_shift (op1_mode, binoptab,
 713                              outof_input, into_input, op1,
 714                              outof_target, into_target,
 715                              unsignedp, methods, shift_mask))
 716     return false;
 717
 718   emit_label (done_label);
 719   return true;
 720 }
 721 \f
 722 /* Subroutine of expand_binop.  Perform a double word multiplication of
 723    operands OP0 and OP1 both of mode MODE, which is exactly twice as wide
 724    as the target's word_mode.  This function returns NULL_RTX if anything
 725    goes wrong, in which case it may have already emitted instructions
 726    which need to be deleted.
 727
 728    If we want to multiply two two-word values and have normal and widening
 729    multiplies of single-word values, we can do this with three smaller
 730    multiplications.
 731
 732    The multiplication proceeds as follows:
 733                                  _______________________
 734                                 [__op0_high_|__op0_low__]
 735                                  _______________________
 736         *                       [__op1_high_|__op1_low__]
 737         _______________________________________________
 738                                  _______________________
 739     (1)                         [__op0_low__*__op1_low__]
 740                      _______________________
 741     (2a)            [__op0_low__*__op1_high_]
 742                      _______________________
 743     (2b)            [__op0_high_*__op1_low__]
 744          _______________________
 745     (3) [__op0_high_*__op1_high_]
 746
 747
 748   This gives a 4-word result.  Since we are only interested in the
 749   lower 2 words, partial result (3) and the upper words of (2a) and
 750   (2b) don't need to be calculated.  Hence (2a) and (2b) can be
 751   calculated using non-widening multiplication.
 752
 753   (1), however, needs to be calculated with an unsigned widening
 754   multiplication.  If this operation is not directly supported we
 755   try using a signed widening multiplication and adjust the result.
 756   This adjustment works as follows:
 757
 758       If both operands are positive then no adjustment is needed.
 759
 760       If the operands have different signs, for example op0_low < 0 and
 761       op1_low >= 0, the instruction treats the most significant bit of
 762       op0_low as a sign bit instead of a bit with significance
 763       2**(BITS_PER_WORD-1), i.e. the instruction multiplies op1_low
 764       with 2**BITS_PER_WORD - op0_low, and two's complements the
 765       result.  Conclusion: We need to add op1_low * 2**BITS_PER_WORD to
 766       the result.
 767
 768       Similarly, if both operands are negative, we need to add
 769       (op0_low + op1_low) * 2**BITS_PER_WORD.
 770
 771       We use a trick to adjust quickly.  We logically shift op0_low right
 772       (op1_low) BITS_PER_WORD-1 steps to get 0 or 1, and add this to
 773       op0_high (op1_high) before it is used to calculate 2b (2a).  If no
 774       logical shift exists, we do an arithmetic right shift and subtract
 775       the 0 or -1.  */
 776
 777 static rtx
 778 expand_doubleword_mult (machine_mode mode, rtx op0, rtx op1, rtx target,
 779                        bool umulp, enum optab_methods methods)
 780 {
       /* Subword indices of the low- and high-order words, chosen by
          WORDS_BIG_ENDIAN.  */
 781   int low = (WORDS_BIG_ENDIAN ? 1 : 0);
 782   int high = (WORDS_BIG_ENDIAN ? 0 : 1);
       /* Shift count BITS_PER_WORD - 1, used only by the !UMULP adjustments
          below; left as NULL_RTX when UMULP.  */
 783   rtx wordm1 = umulp ? NULL_RTX : GEN_INT (BITS_PER_WORD - 1);
 784   rtx product, adjust, product_high, temp;
 785
 786   rtx op0_high = operand_subword_force (op0, high, mode);
 787   rtx op0_low = operand_subword_force (op0, low, mode);
 788   rtx op1_high = operand_subword_force (op1, high, mode);
 789   rtx op1_low = operand_subword_force (op1, low, mode);
 790
 791   /* Whichever widening multiply later computes the product of the
 792      low-order words, we begin by making any required adjustments to the
 793      high-order words (signed multiply only), trying the two cross
 794      multiplications, and then computing the appropriate sum.
 795
 796      The required addition is presumably checked for by the caller (no
 797      such check appears in this function).  Full-word addition will
 798      normally always succeed, so we don't worry about its failure.  The
 799      multiplication may well fail, however, so we do handle that.  */
 800
 801   if (!umulp)
 802     {
           /* Fold the top bit of OP0_LOW into OP0_HIGH: add the result of a
              logical right shift (0 or 1) or, if that shift cannot be
              expanded, subtract the result of an arithmetic right shift
              (0 or -1).  */
 803       /* ??? This could be done with emit_store_flag where available.  */
 804       temp = expand_binop (word_mode, lshr_optab, op0_low, wordm1,
 805                            NULL_RTX, 1, methods);
 806       if (temp)
 807         op0_high = expand_binop (word_mode, add_optab, op0_high, temp,
 808                                  NULL_RTX, 0, OPTAB_DIRECT);
 809       else
 810         {
 811           temp = expand_binop (word_mode, ashr_optab, op0_low, wordm1,
 812                                NULL_RTX, 0, methods);
 813           if (!temp)
 814             return NULL_RTX;
 815           op0_high = expand_binop (word_mode, sub_optab, op0_high, temp,
 816                                    NULL_RTX, 0, OPTAB_DIRECT);
 817         }
 818
 819       if (!op0_high)
 820         return NULL_RTX;
 821     }
 822
       /* Partial product (2b): (possibly adjusted) OP0_HIGH times OP1_LOW,
          as a non-widening word_mode multiply.  */
 823   adjust = expand_binop (word_mode, smul_optab, op0_high, op1_low,
 824                          NULL_RTX, 0, OPTAB_DIRECT);
 825   if (!adjust)
 826     return NULL_RTX;
 827
 828   /* OP0_HIGH should now be dead.  */
 829
 830   if (!umulp)
 831     {
           /* Same adjustment as above, this time folding the top bit of
              OP1_LOW into OP1_HIGH.  */
 832       /* ??? This could be done with emit_store_flag where available.  */
 833       temp = expand_binop (word_mode, lshr_optab, op1_low, wordm1,
 834                            NULL_RTX, 1, methods);
 835       if (temp)
 836         op1_high = expand_binop (word_mode, add_optab, op1_high, temp,
 837                                  NULL_RTX, 0, OPTAB_DIRECT);
 838       else
 839         {
 840           temp = expand_binop (word_mode, ashr_optab, op1_low, wordm1,
 841                                NULL_RTX, 0, methods);
 842           if (!temp)
 843             return NULL_RTX;
 844           op1_high = expand_binop (word_mode, sub_optab, op1_high, temp,
 845                                    NULL_RTX, 0, OPTAB_DIRECT);
 846         }
 847
 848       if (!op1_high)
 849         return NULL_RTX;
 850     }
 851
       /* Partial product (2a): (possibly adjusted) OP1_HIGH times OP0_LOW.  */
 852   temp = expand_binop (word_mode, smul_optab, op1_high, op0_low,
 853                        NULL_RTX, 0, OPTAB_DIRECT);
 854   if (!temp)
 855     return NULL_RTX;
 856
 857   /* OP1_HIGH should now be dead.  */
 858
       /* Sum of the two cross products.  NOTE(review): the result of this
          addition is not tested for null, in line with the remark above
          that failure of full-word addition is not expected.  */
 859   adjust = expand_binop (word_mode, add_optab, adjust, temp,
 860                          NULL_RTX, 0, OPTAB_DIRECT);
 861
       /* Offer TARGET to the widening multiply only if it is a register;
          otherwise let expand_binop choose where the product goes.  */
 862   if (target && !REG_P (target))
 863     target = NULL_RTX;
 864
       /* Partial product (1): widening multiply of the two low words,
          producing a MODE value.  UMULP selects the unsigned or signed
          widening optab.  */
 865   if (umulp)
 866     product = expand_binop (mode, umul_widen_optab, op0_low, op1_low,
 867                             target, 1, OPTAB_DIRECT);
 868   else
 869     product = expand_binop (mode, smul_widen_optab, op0_low, op1_low,
 870                             target, 1, OPTAB_DIRECT);
 871
 872   if (!product)
 873     return NULL_RTX;
 874
       /* Add the cross-product sum into the high word of PRODUCT and store
          it back there.  NOTE(review): neither PRODUCT_HIGH nor the result
          of the addition is tested for null before use.  */
 875   product_high = operand_subword (product, high, 1, mode);
 876   adjust = expand_binop (word_mode, add_optab, product_high, adjust,
 877                          NULL_RTX, 0, OPTAB_DIRECT);
 878   emit_move_insn (product_high, adjust);
 879   return product;
 880 }
 881 \f
 882 /* Convenience entry point for callers that hold an rtx CODE instead of
 883    an optab: look up the optab for CODE, insist that one exists, and
 884    hand every other argument to expand_binop unchanged.  */
 885 rtx
 886 expand_simple_binop (machine_mode mode, enum rtx_code code, rtx op0,
 887                      rtx op1, rtx target, int unsignedp,
 888                      enum optab_methods methods)
 889 {
 890   optab tab = code_to_optab (code);
 891
 892   gcc_assert (tab);
 893   return expand_binop (mode, tab, op0, op1, target, unsignedp, methods);
 894 }
 895
 896 /* Decide whether OP0 and OP1, the operands of a commutative binop, should
 897    trade places.  commutative_operand_precedence settles the order when it
 898    can; on a tie, prefer to have TARGET or a register as first operand.  */
 899 static bool
 900 swap_commutative_operands_with_target (rtx target, rtx op0, rtx op1)
 901 {
 902   const int prec0 = commutative_operand_precedence (op0);
 903   const int prec1 = commutative_operand_precedence (op1);
 904
 905   /* Unequal precedences decide alone: swap exactly when OP1 ranks higher.  */
 906   if (prec0 != prec1)
 907     return prec0 < prec1;
 908
 909   /* Tie with a TARGET that is not a register: swap only if OP1 is
 910      rtx_equal_p to TARGET.  */
 911   if (target != 0 && !REG_P (target))
 912     return rtx_equal_p (op1, target);
 913
 914   /* Tie with no TARGET or a register TARGET: swap if OP1 is TARGET itself,
 915      or if that moves a register ahead of a non-register.  */
 916   return target == op1 || (REG_P (op1) && !REG_P (op0));
 917 }
 918
 919 /* Tell whether BINOPTAB stands for one of the shift or rotate rtx codes
 920    tested below.  */
 921 static bool
 922 shift_optab_p (optab binoptab)
 923 {
 924   const enum rtx_code code = optab_to_code (binoptab);
 925
 926   /* The plain left shift and its SS_ and US_ variants.  */
 927   if (code == ASHIFT || code == SS_ASHIFT || code == US_ASHIFT)
 928     return true;
 929
 930   /* The two right shifts.  */
 931   if (code == ASHIFTRT || code == LSHIFTRT)
 932     return true;
 933
 934   /* Finally the rotates, in either direction.  */
 935   if (code == ROTATE || code == ROTATERT)
 936     return true;
 937   return false;
 938 }
 939
 940 /* Tell whether BINOPTAB stands for a commutative binary operation: one of
 941    rtx class RTX_COMM_ARITH, or a widening or highpart multiply.  */
 942 static bool
 943 commutative_optab_p (optab binoptab)
 944 {
 945   if (GET_RTX_CLASS (optab_to_code (binoptab)) == RTX_COMM_ARITH)
 946     return true;
 947   if (binoptab == smul_widen_optab || binoptab == umul_widen_optab)
 948     return true;
 949   return binoptab == smul_highpart_optab || binoptab == umul_highpart_optab;
 950 }
 951
 952 /* X is about to be used in mode MODE as operand OPN of BINOPTAB.  When
 953    optimizing, if X is a constant whose rtx_cost in that position exceeds
 954    its set_src_cost, return a register loaded with X (truncated or converted
 955    to MODE, guided by UNSIGNEDP); otherwise return X as it is.  */
 956 static rtx
 957 avoid_expensive_constant (machine_mode mode, optab binoptab,
 958                           int opn, rtx x, bool unsignedp)
 959 {
 960   const bool for_speed = optimize_insn_for_speed_p ();
 961
 962   /* Leave X alone if there is no mode, no optimization or no constant.  */
 963   if (mode == VOIDmode || !optimize || !CONSTANT_P (x))
 964     return x;
 965   /* Likewise if X is no dearer as an operand than as a set source.  */
 966   if (rtx_cost (x, mode, optab_to_code (binoptab), opn, for_speed)
 967       <= set_src_cost (x, mode, for_speed))
 968     return x;
 969
 970   /* Bring X into MODE, then load it into a register.  */
 971   if (!CONST_INT_P (x))
 972     x = convert_modes (mode, VOIDmode, x, unsignedp);
 973   else
 974     {
 975       const HOST_WIDE_INT narrowed = trunc_int_for_mode (INTVAL (x), mode);
 976       if (narrowed != INTVAL (x))
 977         x = GEN_INT (narrowed);
 978     }
 979   return force_reg (mode, x);
 980 }
 981
 982 /* Helper function for expand_binop: handle the case where there
 983    is an insn that directly implements the indicated operation.
 984    Returns null if this is not possible.

        OP0 and OP1 are converted, where necessary, to the modes that the
        insn found for BINOPTAB and MODE wants for its operands 1 and 2;
        UNSIGNEDP is passed to those conversions.  TARGET is only a suggested
        destination: on success the rtx actually holding the result is
        returned.  On failure every insn emitted after LAST is deleted.
        METHODS is used only if expand_binop has to be re-invoked without a
        target (see the REG_EQUAL note handling at the end).  */
 985 static rtx
 986 expand_binop_directly (machine_mode mode, optab binoptab,
 987                        rtx op0, rtx op1,
 988                        rtx target, int unsignedp, enum optab_methods methods,
 989                        rtx_insn *last)
 990 {
 991   machine_mode from_mode = widened_mode (mode, op0, op1);
       /* NOTE(review): ICODE indexes insn_data below without being compared
          against CODE_FOR_nothing here; callers are presumably expected to
          have checked that a handler exists.  */
 992   enum insn_code icode = find_widening_optab_handler (binoptab, mode,
 993                                                       from_mode, 1);
       /* Modes the insn wants for its two input operands.  */
 994   machine_mode xmode0 = insn_data[(int) icode].operand[1].mode;
 995   machine_mode xmode1 = insn_data[(int) icode].operand[2].mode;
 996   machine_mode mode0, mode1, tmp_mode;
 997   struct expand_operand ops[3];
 998   bool commutative_p;
 999   rtx_insn *pat;
1000   rtx xop0 = op0, xop1 = op1;
1001   bool canonicalize_op1 = false;
1002
1003   /* If it is a commutative operator and the modes would match
1004      if we would swap the operands, we can save the conversions.
          "Would match" means neither operand has the mode wanted in its
          current position, but each has the mode wanted in the other one.  */
1005   commutative_p = commutative_optab_p (binoptab);
1006   if (commutative_p
1007       && GET_MODE (xop0) != xmode0 && GET_MODE (xop1) != xmode1
1008       && GET_MODE (xop0) == xmode1 && GET_MODE (xop1) == xmode0)
1009     std::swap (xop0, xop1);
1010
1011   /* If we are optimizing, force expensive constants into a register.  */
1012   xop0 = avoid_expensive_constant (xmode0, binoptab, 0, xop0, unsignedp);
1013   if (!shift_optab_p (binoptab))
1014     xop1 = avoid_expensive_constant (xmode1, binoptab, 1, xop1, unsignedp);
1015   else
1016     /* Shifts and rotates often use a different mode for op1 from op0;
1017        for VOIDmode constants we don't know the mode, so force it
1018        to be canonicalized using convert_modes.  */
1019     canonicalize_op1 = true;
1020
1021   /* In case the insn wants input operands in modes different from
1022      those of the actual operands, convert the operands.  It would
1023      seem that we don't need to convert CONST_INTs, but we do, so
1024      that they're properly zero-extended, sign-extended or truncated
1025      for their mode.  */
1026
       /* A VOIDmode first operand is treated as being in MODE.  */
1027   mode0 = GET_MODE (xop0) != VOIDmode ? GET_MODE (xop0) : mode;
1028   if (xmode0 != VOIDmode && xmode0 != mode0)
1029     {
1030       xop0 = convert_modes (xmode0, mode0, xop0, unsignedp);
1031       mode0 = xmode0;
1032     }
1033
       /* Likewise for the second operand, except that for shifts and rotates
          (CANONICALIZE_OP1) a VOIDmode operand keeps VOIDmode as its source
          mode for convert_modes.  */
1034   mode1 = ((GET_MODE (xop1) != VOIDmode || canonicalize_op1)
1035            ? GET_MODE (xop1) : mode);
1036   if (xmode1 != VOIDmode && xmode1 != mode1)
1037     {
1038       xop1 = convert_modes (xmode1, mode1, xop1, unsignedp);
1039       mode1 = xmode1;
1040     }
1041
1042   /* If operation is commutative,
1043      try to make the first operand a register.
1044      Even better, try to make it the same as the target.
1045      Also try to make the last operand a constant.  */
1046   if (commutative_p
1047       && swap_commutative_operands_with_target (target, xop0, xop1))
1048     std::swap (xop0, xop1);
1049
1050   /* Now, if insn's predicates don't allow our operands, put them into
1051      pseudo regs.  */
1052
1053   if (binoptab == vec_pack_trunc_optab
1054       || binoptab == vec_pack_usat_optab
1055       || binoptab == vec_pack_ssat_optab
1056       || binoptab == vec_pack_ufix_trunc_optab
1057       || binoptab == vec_pack_sfix_trunc_optab)
1058     {
1059       /* The mode of the result is different than the mode of the
1060          arguments.  Give up unless the result has exactly twice as many
              units as a vector MODE.  */
1061       tmp_mode = insn_data[(int) icode].operand[0].mode;
1062       if (VECTOR_MODE_P (mode)
1063           && GET_MODE_NUNITS (tmp_mode) != 2 * GET_MODE_NUNITS (mode))
1064         {
1065           delete_insns_since (last);
1066           return NULL_RTX;
1067         }
1068     }
1069   else
1070     tmp_mode = mode;
1071
1072   create_output_operand (&ops[0], target, tmp_mode);
1073   create_input_operand (&ops[1], xop0, mode0);
1074   create_input_operand (&ops[2], xop1, mode1);
1075   pat = maybe_gen_insn (icode, 3, ops);
1076   if (pat)
1077     {
1078       /* If PAT is composed of more than one insn, try to add an appropriate
1079          REG_EQUAL note to it.  If we can't because the result conflicts with
1080          an operand, call expand_binop again, this time without a target.  */
1081       if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
1082           && ! add_equal_note (pat, ops[0].value,
1083                                optab_to_code (binoptab),
1084                                ops[1].value, ops[2].value))
1085         {
1086           delete_insns_since (last);
1087           return expand_binop (mode, binoptab, op0, op1, NULL_RTX,
1088                                unsignedp, methods);
1089         }
1090
1091       emit_insn (pat);
1092       return ops[0].value;
1093     }
       /* No insn could be generated: discard anything emitted since LAST.  */
1094   delete_insns_since (last);
1095   return NULL_RTX;
1096 }
1097
1098 /* Generate code to perform an operation specified by BINOPTAB
1099    on operands OP0 and OP1, with result having machine-mode MODE.
1100
1101    UNSIGNEDP is for the case where we have to widen the operands
1102    to perform the operation.  It says to use zero-extension.
1103
1104    If TARGET is nonzero, the value
1105    is generated there, if it is convenient to do so.
1106    In all cases an rtx is returned for the locus of the value;
1107    this may or may not be TARGET.  */
1108
1109 rtx
1110 expand_binop (machine_mode mode, optab binoptab, rtx op0, rtx op1,
1111               rtx target, int unsignedp, enum optab_methods methods)
1112 {
1113   enum optab_methods next_methods
1114     = (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN
1115        ? OPTAB_WIDEN : methods);
1116   enum mode_class mclass;
1117   machine_mode wider_mode;
1118   scalar_int_mode int_mode;
1119   rtx libfunc;
1120   rtx temp;
1121   rtx_insn *entry_last = get_last_insn ();
1122   rtx_insn *last;
1123
1124   mclass = GET_MODE_CLASS (mode);
1125
1126   /* If subtracting an integer constant, convert this into an addition of
1127      the negated constant.  */
1128
1129   if (binoptab == sub_optab && CONST_INT_P (op1))
1130     {
1131       op1 = negate_rtx (mode, op1);
1132       binoptab = add_optab;
1133     }
1134   /* For shifts, constant invalid op1 might be expanded from different
1135      mode than MODE.  As those are invalid, force them to a register
1136      to avoid further problems during expansion.  */
1137   else if (CONST_INT_P (op1)
1138            && shift_optab_p (binoptab)
1139            && UINTVAL (op1) >= GET_MODE_BITSIZE (GET_MODE_INNER (mode)))
1140     {
1141       op1 = gen_int_mode (INTVAL (op1), GET_MODE_INNER (mode));
1142       op1 = force_reg (GET_MODE_INNER (mode), op1);
1143     }
1144
1145   /* Record where to delete back to if we backtrack.  */
1146   last = get_last_insn ();
1147
1148   /* If we can do it with a three-operand insn, do so.  */
1149
1150   if (methods != OPTAB_MUST_WIDEN
1151       && find_widening_optab_handler (binoptab, mode,
1152                                       widened_mode (mode, op0, op1), 1)
1153             != CODE_FOR_nothing)
1154     {
1155       temp = expand_binop_directly (mode, binoptab, op0, op1, target,
1156                                     unsignedp, methods, last);
1157       if (temp)
1158         return temp;
1159     }
1160
1161   /* If we were trying to rotate, and that didn't work, try rotating
1162      the other direction before falling back to shifts and bitwise-or.  */
1163   if (((binoptab == rotl_optab
1164         && optab_handler (rotr_optab, mode) != CODE_FOR_nothing)
1165        || (binoptab == rotr_optab
1166            && optab_handler (rotl_optab, mode) != CODE_FOR_nothing))
1167       && is_int_mode (mode, &int_mode))
1168     {
1169       optab otheroptab = (binoptab == rotl_optab ? rotr_optab : rotl_optab);
1170       rtx newop1;
1171       unsigned int bits = GET_MODE_PRECISION (int_mode);
1172
1173       if (CONST_INT_P (op1))
1174         newop1 = GEN_INT (bits - INTVAL (op1));
1175       else if (targetm.shift_truncation_mask (int_mode) == bits - 1)
1176         newop1 = negate_rtx (GET_MODE (op1), op1);
1177       else
1178         newop1 = expand_binop (GET_MODE (op1), sub_optab,
1179                                gen_int_mode (bits, GET_MODE (op1)), op1,
1180                                NULL_RTX, unsignedp, OPTAB_DIRECT);
1181
1182       temp = expand_binop_directly (int_mode, otheroptab, op0, newop1,
1183                                     target, unsignedp, methods, last);
1184       if (temp)
1185         return temp;
1186     }
1187
1188   /* If this is a multiply, see if we can do a widening operation that
1189      takes operands of this mode and makes a wider mode.  */
1190
1191   if (binoptab == smul_optab
1192       && GET_MODE_2XWIDER_MODE (mode).exists (&wider_mode)
1193       && (convert_optab_handler ((unsignedp
1194                                   ? umul_widen_optab
1195                                   : smul_widen_optab),
1196                                  wider_mode, mode) != CODE_FOR_nothing))
1197     {
1198       temp = expand_binop (wider_mode,
1199                            unsignedp ? umul_widen_optab : smul_widen_optab,
1200                            op0, op1, NULL_RTX, unsignedp, OPTAB_DIRECT);
1201
1202       if (temp != 0)
1203         {
1204           if (GET_MODE_CLASS (mode) == MODE_INT
1205               && TRULY_NOOP_TRUNCATION_MODES_P (mode, GET_MODE (temp)))
1206             return gen_lowpart (mode, temp);
1207           else
1208             return convert_to_mode (mode, temp, unsignedp);
1209         }
1210     }
1211
1212   /* If this is a vector shift by a scalar, see if we can do a vector
1213      shift by a vector.  If so, broadcast the scalar into a vector.  */
1214   if (mclass == MODE_VECTOR_INT)
1215     {
1216       optab otheroptab = unknown_optab;
1217
1218       if (binoptab == ashl_optab)
1219         otheroptab = vashl_optab;
1220       else if (binoptab == ashr_optab)
1221         otheroptab = vashr_optab;
1222       else if (binoptab == lshr_optab)
1223         otheroptab = vlshr_optab;
1224       else if (binoptab == rotl_optab)
1225         otheroptab = vrotl_optab;
1226       else if (binoptab == rotr_optab)
1227         otheroptab = vrotr_optab;
1228
1229       if (otheroptab && optab_handler (otheroptab, mode) != CODE_FOR_nothing)
1230         {
1231           /* The scalar may have been extended to be too wide.  Truncate
1232              it back to the proper size to fit in the broadcast vector.  */
1233           machine_mode inner_mode = GET_MODE_INNER (mode);
1234           if (!CONST_INT_P (op1)
1235               && (GET_MODE_BITSIZE (as_a <scalar_int_mode> (GET_MODE (op1)))
1236                   > GET_MODE_BITSIZE (inner_mode)))
1237             op1 = force_reg (inner_mode,
1238                              simplify_gen_unary (TRUNCATE, inner_mode, op1,
1239                                                  GET_MODE (op1)));
1240           rtx vop1 = expand_vector_broadcast (mode, op1);
1241           if (vop1)
1242             {
1243               temp = expand_binop_directly (mode, otheroptab, op0, vop1,
1244                                             target, unsignedp, methods, last);
1245               if (temp)
1246                 return temp;
1247             }
1248         }
1249     }
1250
1251   /* Look for a wider mode of the same class for which we think we
1252      can open-code the operation.  Check for a widening multiply at the
1253      wider mode as well.  */
1254
1255   if (CLASS_HAS_WIDER_MODES_P (mclass)
1256       && methods != OPTAB_DIRECT && methods != OPTAB_LIB)
1257     FOR_EACH_WIDER_MODE (wider_mode, mode)
1258       {
1259         machine_mode next_mode;
1260         if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing
1261             || (binoptab == smul_optab
1262                 && GET_MODE_WIDER_MODE (wider_mode).exists (&next_mode)
1263                 && (find_widening_optab_handler ((unsignedp
1264                                                   ? umul_widen_optab
1265                                                   : smul_widen_optab),
1266                                                  next_mode, mode, 0)
1267                     != CODE_FOR_nothing)))
1268           {
1269             rtx xop0 = op0, xop1 = op1;
1270             int no_extend = 0;
1271
1272             /* For certain integer operations, we need not actually extend
1273                the narrow operands, as long as we will truncate
1274                the results to the same narrowness.  */
1275
1276             if ((binoptab == ior_optab || binoptab == and_optab
1277                  || binoptab == xor_optab
1278                  || binoptab == add_optab || binoptab == sub_optab
1279                  || binoptab == smul_optab || binoptab == ashl_optab)
1280                 && mclass == MODE_INT)
1281               {
1282                 no_extend = 1;
1283                 xop0 = avoid_expensive_constant (mode, binoptab, 0,
1284                                                  xop0, unsignedp);
1285                 if (binoptab != ashl_optab)
1286                   xop1 = avoid_expensive_constant (mode, binoptab, 1,
1287                                                    xop1, unsignedp);
1288               }
1289
1290             xop0 = widen_operand (xop0, wider_mode, mode, unsignedp, no_extend);
1291
1292             /* The second operand of a shift must always be extended.  */
1293             xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
1294                                   no_extend && binoptab != ashl_optab);
1295
1296             temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
1297                                  unsignedp, OPTAB_DIRECT);
1298             if (temp)
1299               {
1300                 if (mclass != MODE_INT
1301                     || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
1302                   {
1303                     if (target == 0)
1304                       target = gen_reg_rtx (mode);
1305                     convert_move (target, temp, 0);
1306                     return target;
1307                   }
1308                 else
1309                   return gen_lowpart (mode, temp);
1310               }
1311             else
1312               delete_insns_since (last);
1313           }
1314       }
1315
1316   /* If operation is commutative,
1317      try to make the first operand a register.
1318      Even better, try to make it the same as the target.
1319      Also try to make the last operand a constant.  */
1320   if (commutative_optab_p (binoptab)
1321       && swap_commutative_operands_with_target (target, op0, op1))
1322     std::swap (op0, op1);
1323
1324   /* These can be done a word at a time.  */
1325   if ((binoptab == and_optab || binoptab == ior_optab || binoptab == xor_optab)
1326       && is_int_mode (mode, &int_mode)
1327       && GET_MODE_SIZE (int_mode) > UNITS_PER_WORD
1328       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
1329     {
1330       int i;
1331       rtx_insn *insns;
1332
1333       /* If TARGET is the same as one of the operands, the REG_EQUAL note
1334          won't be accurate, so use a new target.  */
1335       if (target == 0
1336           || target == op0
1337           || target == op1
1338           || !valid_multiword_target_p (target))
1339         target = gen_reg_rtx (int_mode);
1340
1341       start_sequence ();
1342
1343       /* Do the actual arithmetic.  */
1344       for (i = 0; i < GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD; i++)
1345         {
1346           rtx target_piece = operand_subword (target, i, 1, int_mode);
1347           rtx x = expand_binop (word_mode, binoptab,
1348                                 operand_subword_force (op0, i, int_mode),
1349                                 operand_subword_force (op1, i, int_mode),
1350                                 target_piece, unsignedp, next_methods);
1351
1352           if (x == 0)
1353             break;
1354
1355           if (target_piece != x)
1356             emit_move_insn (target_piece, x);
1357         }
1358
1359       insns = get_insns ();
1360       end_sequence ();
1361
1362       if (i == GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD)
1363         {
1364           emit_insn (insns);
1365           return target;
1366         }
1367     }
1368
1369   /* Synthesize double word shifts from single word shifts.  */
1370   if ((binoptab == lshr_optab || binoptab == ashl_optab
1371        || binoptab == ashr_optab)
1372       && is_int_mode (mode, &int_mode)
1373       && (CONST_INT_P (op1) || optimize_insn_for_speed_p ())
1374       && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
1375       && GET_MODE_PRECISION (int_mode) == GET_MODE_BITSIZE (int_mode)
1376       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing
1377       && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
1378       && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
1379     {
1380       unsigned HOST_WIDE_INT shift_mask, double_shift_mask;
1381       scalar_int_mode op1_mode;
1382
1383       double_shift_mask = targetm.shift_truncation_mask (int_mode);
1384       shift_mask = targetm.shift_truncation_mask (word_mode);
1385       op1_mode = (GET_MODE (op1) != VOIDmode
1386                   ? as_a <scalar_int_mode> (GET_MODE (op1))
1387                   : word_mode);
1388
1389       /* Apply the truncation to constant shifts.  */
1390       if (double_shift_mask > 0 && CONST_INT_P (op1))
1391         op1 = GEN_INT (INTVAL (op1) & double_shift_mask);
1392
1393       if (op1 == CONST0_RTX (op1_mode))
1394         return op0;
1395
1396       /* Make sure that this is a combination that expand_doubleword_shift
1397          can handle.  See the comments there for details.  */
1398       if (double_shift_mask == 0
1399           || (shift_mask == BITS_PER_WORD - 1
1400               && double_shift_mask == BITS_PER_WORD * 2 - 1))
1401         {
1402           rtx_insn *insns;
1403           rtx into_target, outof_target;
1404           rtx into_input, outof_input;
1405           int left_shift, outof_word;
1406
1407           /* If TARGET is the same as one of the operands, the REG_EQUAL note
1408              won't be accurate, so use a new target.  */
1409           if (target == 0
1410               || target == op0
1411               || target == op1
1412               || !valid_multiword_target_p (target))
1413             target = gen_reg_rtx (int_mode);
1414
1415           start_sequence ();
1416
1417           /* OUTOF_* is the word we are shifting bits away from, and
1418              INTO_* is the word that we are shifting bits towards, thus
1419              they differ depending on the direction of the shift and
1420              WORDS_BIG_ENDIAN.  */
1421
1422           left_shift = binoptab == ashl_optab;
1423           outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;
1424
1425           outof_target = operand_subword (target, outof_word, 1, int_mode);
1426           into_target = operand_subword (target, 1 - outof_word, 1, int_mode);
1427
1428           outof_input = operand_subword_force (op0, outof_word, int_mode);
1429           into_input = operand_subword_force (op0, 1 - outof_word, int_mode);
1430
1431           if (expand_doubleword_shift (op1_mode, binoptab,
1432                                        outof_input, into_input, op1,
1433                                        outof_target, into_target,
1434                                        unsignedp, next_methods, shift_mask))
1435             {
1436               insns = get_insns ();
1437               end_sequence ();
1438
1439               emit_insn (insns);
1440               return target;
1441             }
1442           end_sequence ();
1443         }
1444     }
1445
1446   /* Synthesize double word rotates from single word shifts.  */
1447   if ((binoptab == rotl_optab || binoptab == rotr_optab)
1448       && is_int_mode (mode, &int_mode)
1449       && CONST_INT_P (op1)
1450       && GET_MODE_PRECISION (int_mode) == 2 * BITS_PER_WORD
1451       && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
1452       && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
1453     {
1454       rtx_insn *insns;
1455       rtx into_target, outof_target;
1456       rtx into_input, outof_input;
1457       rtx inter;
1458       int shift_count, left_shift, outof_word;
1459
1460       /* If TARGET is the same as one of the operands, the REG_EQUAL note
1461          won't be accurate, so use a new target. Do this also if target is not
1462          a REG, first because having a register instead may open optimization
1463          opportunities, and second because if target and op0 happen to be MEMs
1464          designating the same location, we would risk clobbering it too early
1465          in the code sequence we generate below.  */
1466       if (target == 0
1467           || target == op0
1468           || target == op1
1469           || !REG_P (target)
1470           || !valid_multiword_target_p (target))
1471         target = gen_reg_rtx (int_mode);
1472
1473       start_sequence ();
1474
1475       shift_count = INTVAL (op1);
1476
1477       /* OUTOF_* is the word we are shifting bits away from, and
1478          INTO_* is the word that we are shifting bits towards, thus
1479          they differ depending on the direction of the shift and
1480          WORDS_BIG_ENDIAN.  */
1481
1482       left_shift = (binoptab == rotl_optab);
1483       outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;
1484
1485       outof_target = operand_subword (target, outof_word, 1, int_mode);
1486       into_target = operand_subword (target, 1 - outof_word, 1, int_mode);
1487
1488       outof_input = operand_subword_force (op0, outof_word, int_mode);
1489       into_input = operand_subword_force (op0, 1 - outof_word, int_mode);
1490
1491       if (shift_count == BITS_PER_WORD)
1492         {
1493           /* This is just a word swap.  */
1494           emit_move_insn (outof_target, into_input);
1495           emit_move_insn (into_target, outof_input);
1496           inter = const0_rtx;
1497         }
1498       else
1499         {
1500           rtx into_temp1, into_temp2, outof_temp1, outof_temp2;
1501           rtx first_shift_count, second_shift_count;
1502           optab reverse_unsigned_shift, unsigned_shift;
1503
1504           reverse_unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
1505                                     ? lshr_optab : ashl_optab);
1506
1507           unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
1508                             ? ashl_optab : lshr_optab);
1509
1510           if (shift_count > BITS_PER_WORD)
1511             {
1512               first_shift_count = GEN_INT (shift_count - BITS_PER_WORD);
1513               second_shift_count = GEN_INT (2 * BITS_PER_WORD - shift_count);
1514             }
1515           else
1516             {
1517               first_shift_count = GEN_INT (BITS_PER_WORD - shift_count);
1518               second_shift_count = GEN_INT (shift_count);
1519             }
1520
1521           into_temp1 = expand_binop (word_mode, unsigned_shift,
1522                                      outof_input, first_shift_count,
1523                                      NULL_RTX, unsignedp, next_methods);
1524           into_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
1525                                      into_input, second_shift_count,
1526                                      NULL_RTX, unsignedp, next_methods);
1527
1528           if (into_temp1 != 0 && into_temp2 != 0)
1529             inter = expand_binop (word_mode, ior_optab, into_temp1, into_temp2,
1530                                   into_target, unsignedp, next_methods);
1531           else
1532             inter = 0;
1533
1534           if (inter != 0 && inter != into_target)
1535             emit_move_insn (into_target, inter);
1536
1537           outof_temp1 = expand_binop (word_mode, unsigned_shift,
1538                                       into_input, first_shift_count,
1539                                       NULL_RTX, unsignedp, next_methods);
1540           outof_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
1541                                       outof_input, second_shift_count,
1542                                       NULL_RTX, unsignedp, next_methods);
1543
1544           if (inter != 0 && outof_temp1 != 0 && outof_temp2 != 0)
1545             inter = expand_binop (word_mode, ior_optab,
1546                                   outof_temp1, outof_temp2,
1547                                   outof_target, unsignedp, next_methods);
1548
1549           if (inter != 0 && inter != outof_target)
1550             emit_move_insn (outof_target, inter);
1551         }
1552
1553       insns = get_insns ();
1554       end_sequence ();
1555
1556       if (inter != 0)
1557         {
1558           emit_insn (insns);
1559           return target;
1560         }
1561     }
1562
1563   /* These can be done a word at a time by propagating carries.  */
1564   if ((binoptab == add_optab || binoptab == sub_optab)
1565       && is_int_mode (mode, &int_mode)
1566       && GET_MODE_SIZE (int_mode) >= 2 * UNITS_PER_WORD
1567       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
1568     {
1569       unsigned int i;
1570       optab otheroptab = binoptab == add_optab ? sub_optab : add_optab;
1571       const unsigned int nwords = GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD;
1572       rtx carry_in = NULL_RTX, carry_out = NULL_RTX;
1573       rtx xop0, xop1, xtarget;
1574
1575       /* We can handle either a 1 or -1 value for the carry.  If STORE_FLAG
1576          value is one of those, use it.  Otherwise, use 1 since it is the
1577          one easiest to get.  */
1578 #if STORE_FLAG_VALUE == 1 || STORE_FLAG_VALUE == -1
1579       int normalizep = STORE_FLAG_VALUE;
1580 #else
1581       int normalizep = 1;
1582 #endif
1583
1584       /* Prepare the operands.  */
1585       xop0 = force_reg (int_mode, op0);
1586       xop1 = force_reg (int_mode, op1);
1587
1588       xtarget = gen_reg_rtx (int_mode);
1589
1590       if (target == 0 || !REG_P (target) || !valid_multiword_target_p (target))
1591         target = xtarget;
1592
1593       /* Indicate for flow that the entire target reg is being set.  */
1594       if (REG_P (target))
1595         emit_clobber (xtarget);
1596
1597       /* Do the actual arithmetic.  */
1598       for (i = 0; i < nwords; i++)
1599         {
1600           int index = (WORDS_BIG_ENDIAN ? nwords - i - 1 : i);
1601           rtx target_piece = operand_subword (xtarget, index, 1, int_mode);
1602           rtx op0_piece = operand_subword_force (xop0, index, int_mode);
1603           rtx op1_piece = operand_subword_force (xop1, index, int_mode);
1604           rtx x;
1605
1606           /* Main add/subtract of the input operands.  */
1607           x = expand_binop (word_mode, binoptab,
1608                             op0_piece, op1_piece,
1609                             target_piece, unsignedp, next_methods);
1610           if (x == 0)
1611             break;
1612
1613           if (i + 1 < nwords)
1614             {
1615               /* Store carry from main add/subtract.  */
1616               carry_out = gen_reg_rtx (word_mode);
1617               carry_out = emit_store_flag_force (carry_out,
1618                                                  (binoptab == add_optab
1619                                                   ? LT : GT),
1620                                                  x, op0_piece,
1621                                                  word_mode, 1, normalizep);
1622             }
1623
1624           if (i > 0)
1625             {
1626               rtx newx;
1627
1628               /* Add/subtract previous carry to main result.  */
1629               newx = expand_binop (word_mode,
1630                                    normalizep == 1 ? binoptab : otheroptab,
1631                                    x, carry_in,
1632                                    NULL_RTX, 1, next_methods);
1633
1634               if (i + 1 < nwords)
1635                 {
1636                   /* Get out carry from adding/subtracting carry in.  */
1637                   rtx carry_tmp = gen_reg_rtx (word_mode);
1638                   carry_tmp = emit_store_flag_force (carry_tmp,
1639                                                      (binoptab == add_optab
1640                                                       ? LT : GT),
1641                                                      newx, x,
1642                                                      word_mode, 1, normalizep);
1643
1644                   /* Logical-ior the two poss. carry together.  */
1645                   carry_out = expand_binop (word_mode, ior_optab,
1646                                             carry_out, carry_tmp,
1647                                             carry_out, 0, next_methods);
1648                   if (carry_out == 0)
1649                     break;
1650                 }
1651               emit_move_insn (target_piece, newx);
1652             }
1653           else
1654             {
1655               if (x != target_piece)
1656                 emit_move_insn (target_piece, x);
1657             }
1658
1659           carry_in = carry_out;
1660         }
1661
1662       if (i == GET_MODE_BITSIZE (int_mode) / (unsigned) BITS_PER_WORD)
1663         {
1664           if (optab_handler (mov_optab, int_mode) != CODE_FOR_nothing
1665               || ! rtx_equal_p (target, xtarget))
1666             {
1667               rtx_insn *temp = emit_move_insn (target, xtarget);
1668
1669               set_dst_reg_note (temp, REG_EQUAL,
1670                                 gen_rtx_fmt_ee (optab_to_code (binoptab),
1671                                                 int_mode, copy_rtx (xop0),
1672                                                 copy_rtx (xop1)),
1673                                 target);
1674             }
1675           else
1676             target = xtarget;
1677
1678           return target;
1679         }
1680
1681       else
1682         delete_insns_since (last);
1683     }
1684
1685   /* Attempt to synthesize double word multiplies using a sequence of word
1686      mode multiplications.  We first attempt to generate a sequence using a
1687      more efficient unsigned widening multiply, and if that fails we then
1688      try using a signed widening multiply.  */
1689
1690   if (binoptab == smul_optab
1691       && is_int_mode (mode, &int_mode)
1692       && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
1693       && optab_handler (smul_optab, word_mode) != CODE_FOR_nothing
1694       && optab_handler (add_optab, word_mode) != CODE_FOR_nothing)
1695     {
1696       rtx product = NULL_RTX;
1697       if (widening_optab_handler (umul_widen_optab, int_mode, word_mode)
1698           != CODE_FOR_nothing)
1699         {
1700           product = expand_doubleword_mult (int_mode, op0, op1, target,
1701                                             true, methods);
1702           if (!product)
1703             delete_insns_since (last);
1704         }
1705
1706       if (product == NULL_RTX
1707           && (widening_optab_handler (smul_widen_optab, int_mode, word_mode)
1708               != CODE_FOR_nothing))
1709         {
1710           product = expand_doubleword_mult (int_mode, op0, op1, target,
1711                                             false, methods);
1712           if (!product)
1713             delete_insns_since (last);
1714         }
1715
1716       if (product != NULL_RTX)
1717         {
1718           if (optab_handler (mov_optab, int_mode) != CODE_FOR_nothing)
1719             {
1720               rtx_insn *move = emit_move_insn (target ? target : product,
1721                                                product);
1722               set_dst_reg_note (move,
1723                                 REG_EQUAL,
1724                                 gen_rtx_fmt_ee (MULT, int_mode,
1725                                                 copy_rtx (op0),
1726                                                 copy_rtx (op1)),
1727                                 target ? target : product);
1728             }
1729           return product;
1730         }
1731     }
1732
1733   /* It can't be open-coded in this mode.
1734      Use a library call if one is available and caller says that's ok.  */
1735
1736   libfunc = optab_libfunc (binoptab, mode);
1737   if (libfunc
1738       && (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN))
1739     {
1740       rtx_insn *insns;
1741       rtx op1x = op1;
1742       machine_mode op1_mode = mode;
1743       rtx value;
1744
1745       start_sequence ();
1746
1747       if (shift_optab_p (binoptab))
1748         {
1749           op1_mode = targetm.libgcc_shift_count_mode ();
1750           /* Specify unsigned here,
1751              since negative shift counts are meaningless.  */
1752           op1x = convert_to_mode (op1_mode, op1, 1);
1753         }
1754
1755       if (GET_MODE (op0) != VOIDmode
1756           && GET_MODE (op0) != mode)
1757         op0 = convert_to_mode (mode, op0, unsignedp);
1758
1759       /* Pass 1 for NO_QUEUE so we don't lose any increments
1760          if the libcall is cse'd or moved.  */
1761       value = emit_library_call_value (libfunc,
1762                                        NULL_RTX, LCT_CONST, mode, 2,
1763                                        op0, mode, op1x, op1_mode);
1764
1765       insns = get_insns ();
1766       end_sequence ();
1767
1768       bool trapv = trapv_binoptab_p (binoptab);
1769       target = gen_reg_rtx (mode);
1770       emit_libcall_block_1 (insns, target, value,
1771                             trapv ? NULL_RTX
1772                             : gen_rtx_fmt_ee (optab_to_code (binoptab),
1773                                               mode, op0, op1), trapv);
1774
1775       return target;
1776     }
1777
1778   delete_insns_since (last);
1779
1780   /* It can't be done in this mode.  Can we do it in a wider mode?  */
1781
1782   if (! (methods == OPTAB_WIDEN || methods == OPTAB_LIB_WIDEN
1783          || methods == OPTAB_MUST_WIDEN))
1784     {
1785       /* Caller says, don't even try.  */
1786       delete_insns_since (entry_last);
1787       return 0;
1788     }
1789
1790   /* Compute the value of METHODS to pass to recursive calls.
1791      Don't allow widening to be tried recursively.  */
1792
1793   methods = (methods == OPTAB_LIB_WIDEN ? OPTAB_LIB : OPTAB_DIRECT);
1794
1795   /* Look for a wider mode of the same class for which it appears we can do
1796      the operation.  */
1797
1798   if (CLASS_HAS_WIDER_MODES_P (mclass))
1799     {
1800       FOR_EACH_WIDER_MODE (wider_mode, mode)
1801         {
1802           if (find_widening_optab_handler (binoptab, wider_mode, mode, 1)
1803                   != CODE_FOR_nothing
1804               || (methods == OPTAB_LIB
1805                   && optab_libfunc (binoptab, wider_mode)))
1806             {
1807               rtx xop0 = op0, xop1 = op1;
1808               int no_extend = 0;
1809
1810               /* For certain integer operations, we need not actually extend
1811                  the narrow operands, as long as we will truncate
1812                  the results to the same narrowness.  */
1813
1814               if ((binoptab == ior_optab || binoptab == and_optab
1815                    || binoptab == xor_optab
1816                    || binoptab == add_optab || binoptab == sub_optab
1817                    || binoptab == smul_optab || binoptab == ashl_optab)
1818                   && mclass == MODE_INT)
1819                 no_extend = 1;
1820
1821               xop0 = widen_operand (xop0, wider_mode, mode,
1822                                     unsignedp, no_extend);
1823
1824               /* The second operand of a shift must always be extended.  */
1825               xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
1826                                     no_extend && binoptab != ashl_optab);
1827
1828               temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
1829                                    unsignedp, methods);
1830               if (temp)
1831                 {
1832                   if (mclass != MODE_INT
1833                       || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
1834                     {
1835                       if (target == 0)
1836                         target = gen_reg_rtx (mode);
1837                       convert_move (target, temp, 0);
1838                       return target;
1839                     }
1840                   else
1841                     return gen_lowpart (mode, temp);
1842                 }
1843               else
1844                 delete_insns_since (last);
1845             }
1846         }
1847     }
1848
1849   delete_insns_since (entry_last);
1850   return 0;
1851 }
1852 \f
1853 /* Expand a binary operator which has both signed and unsigned forms.
1854    UOPTAB is the optab for unsigned operations, and SOPTAB is for
1855    signed operations.
1856
1857    If we widen unsigned operands, we may use a signed wider operation instead
1858    of an unsigned wider operation, since the result would be the same.  */
1859
1860 rtx
1861 sign_expand_binop (machine_mode mode, optab uoptab, optab soptab,
1862                    rtx op0, rtx op1, rtx target, int unsignedp,
1863                    enum optab_methods methods)
1864 {
1865   rtx temp;
1866   optab direct_optab = unsignedp ? uoptab : soptab;
1867   bool save_enable;
1868
1869   /* Do it without widening, if possible.  */
1870   temp = expand_binop (mode, direct_optab, op0, op1, target,
1871                        unsignedp, OPTAB_DIRECT);
1872   if (temp || methods == OPTAB_DIRECT)
1873     return temp;
1874
1875   /* Try widening to a signed int.  Disable any direct use of any
1876      signed insn in the current mode.  */
1877   save_enable = swap_optab_enable (soptab, mode, false);
1878
1879   temp = expand_binop (mode, soptab, op0, op1, target,
1880                        unsignedp, OPTAB_WIDEN);
1881
1882   /* For unsigned operands, try widening to an unsigned int.  */
1883   if (!temp && unsignedp)
1884     temp = expand_binop (mode, uoptab, op0, op1, target,
1885                          unsignedp, OPTAB_WIDEN);
1886   if (temp || methods == OPTAB_WIDEN)
1887     goto egress;
1888
1889   /* Use the right width libcall if that exists.  */
1890   temp = expand_binop (mode, direct_optab, op0, op1, target,
1891                        unsignedp, OPTAB_LIB);
1892   if (temp || methods == OPTAB_LIB)
1893     goto egress;
1894
1895   /* Must widen and use a libcall, use either signed or unsigned.  */
1896   temp = expand_binop (mode, soptab, op0, op1, target,
1897                        unsignedp, methods);
1898   if (!temp && unsignedp)
1899     temp = expand_binop (mode, uoptab, op0, op1, target,
1900                          unsignedp, methods);
1901
1902  egress:
1903   /* Undo the fiddling above.  */
1904   if (save_enable)
1905     swap_optab_enable (soptab, mode, true);
1906   return temp;
1907 }
1908 \f
1909 /* Generate code to perform an operation specified by UNOPPTAB
1910    on operand OP0, with two results to TARG0 and TARG1.
1911    We assume that the order of the operands for the instruction
1912    is TARG0, TARG1, OP0.
1913
1914    Either TARG0 or TARG1 may be zero, but what that means is that
1915    the result is not actually wanted.  We will generate it into
1916    a dummy pseudo-reg and discard it.  They may not both be zero.
1917
1918    Returns 1 if this operation can be performed; 0 if not.  */
1919
1920 int
1921 expand_twoval_unop (optab unoptab, rtx op0, rtx targ0, rtx targ1,
1922                     int unsignedp)
1923 {
1924   machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
1925   enum mode_class mclass;
1926   machine_mode wider_mode;
1927   rtx_insn *entry_last = get_last_insn ();
1928   rtx_insn *last;
1929
1930   mclass = GET_MODE_CLASS (mode);
1931
1932   if (!targ0)
1933     targ0 = gen_reg_rtx (mode);
1934   if (!targ1)
1935     targ1 = gen_reg_rtx (mode);
1936
1937   /* Record where to go back to if we fail.  */
1938   last = get_last_insn ();
1939
1940   if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
1941     {
1942       struct expand_operand ops[3];
1943       enum insn_code icode = optab_handler (unoptab, mode);
1944
1945       create_fixed_operand (&ops[0], targ0);
1946       create_fixed_operand (&ops[1], targ1);
1947       create_convert_operand_from (&ops[2], op0, mode, unsignedp);
1948       if (maybe_expand_insn (icode, 3, ops))
1949         return 1;
1950     }
1951
1952   /* It can't be done in this mode.  Can we do it in a wider mode?  */
1953
1954   if (CLASS_HAS_WIDER_MODES_P (mclass))
1955     {
1956       FOR_EACH_WIDER_MODE (wider_mode, mode)
1957         {
1958           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
1959             {
1960               rtx t0 = gen_reg_rtx (wider_mode);
1961               rtx t1 = gen_reg_rtx (wider_mode);
1962               rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
1963
1964               if (expand_twoval_unop (unoptab, cop0, t0, t1, unsignedp))
1965                 {
1966                   convert_move (targ0, t0, unsignedp);
1967                   convert_move (targ1, t1, unsignedp);
1968                   return 1;
1969                 }
1970               else
1971                 delete_insns_since (last);
1972             }
1973         }
1974     }
1975
1976   delete_insns_since (entry_last);
1977   return 0;
1978 }
1979 \f
1980 /* Generate code to perform an operation specified by BINOPTAB
1981    on operands OP0 and OP1, with two results to TARG1 and TARG2.
1982    We assume that the order of the operands for the instruction
1983    is TARG0, OP0, OP1, TARG1, which would fit a pattern like
1984    [(set TARG0 (operate OP0 OP1)) (set TARG1 (operate ...))].
1985
1986    Either TARG0 or TARG1 may be zero, but what that means is that
1987    the result is not actually wanted.  We will generate it into
1988    a dummy pseudo-reg and discard it.  They may not both be zero.
1989
1990    Returns 1 if this operation can be performed; 0 if not.  */
1991
1992 int
1993 expand_twoval_binop (optab binoptab, rtx op0, rtx op1, rtx targ0, rtx targ1,
1994                      int unsignedp)
1995 {
1996   machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
1997   enum mode_class mclass;
1998   machine_mode wider_mode;
1999   rtx_insn *entry_last = get_last_insn ();
2000   rtx_insn *last;
2001
2002   mclass = GET_MODE_CLASS (mode);
2003
2004   if (!targ0)
2005     targ0 = gen_reg_rtx (mode);
2006   if (!targ1)
2007     targ1 = gen_reg_rtx (mode);
2008
2009   /* Record where to go back to if we fail.  */
2010   last = get_last_insn ();
2011
2012   if (optab_handler (binoptab, mode) != CODE_FOR_nothing)
2013     {
2014       struct expand_operand ops[4];
2015       enum insn_code icode = optab_handler (binoptab, mode);
2016       machine_mode mode0 = insn_data[icode].operand[1].mode;
2017       machine_mode mode1 = insn_data[icode].operand[2].mode;
2018       rtx xop0 = op0, xop1 = op1;
2019
2020       /* If we are optimizing, force expensive constants into a register.  */
2021       xop0 = avoid_expensive_constant (mode0, binoptab, 0, xop0, unsignedp);
2022       xop1 = avoid_expensive_constant (mode1, binoptab, 1, xop1, unsignedp);
2023
2024       create_fixed_operand (&ops[0], targ0);
2025       create_convert_operand_from (&ops[1], op0, mode, unsignedp);
2026       create_convert_operand_from (&ops[2], op1, mode, unsignedp);
2027       create_fixed_operand (&ops[3], targ1);
2028       if (maybe_expand_insn (icode, 4, ops))
2029         return 1;
2030       delete_insns_since (last);
2031     }
2032
2033   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2034
2035   if (CLASS_HAS_WIDER_MODES_P (mclass))
2036     {
2037       FOR_EACH_WIDER_MODE (wider_mode, mode)
2038         {
2039           if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing)
2040             {
2041               rtx t0 = gen_reg_rtx (wider_mode);
2042               rtx t1 = gen_reg_rtx (wider_mode);
2043               rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
2044               rtx cop1 = convert_modes (wider_mode, mode, op1, unsignedp);
2045
2046               if (expand_twoval_binop (binoptab, cop0, cop1,
2047                                        t0, t1, unsignedp))
2048                 {
2049                   convert_move (targ0, t0, unsignedp);
2050                   convert_move (targ1, t1, unsignedp);
2051                   return 1;
2052                 }
2053               else
2054                 delete_insns_since (last);
2055             }
2056         }
2057     }
2058
2059   delete_insns_since (entry_last);
2060   return 0;
2061 }
2062
2063 /* Expand the two-valued library call indicated by BINOPTAB, but
2064    preserve only one of the values.  If TARG0 is non-NULL, the first
2065    value is placed into TARG0; otherwise the second value is placed
2066    into TARG1.  Exactly one of TARG0 and TARG1 must be non-NULL.  The
2067    value stored into TARG0 or TARG1 is equivalent to (CODE OP0 OP1).
2068    This routine assumes that the value returned by the library call is
2069    as if the return value was of an integral mode twice as wide as the
2070    mode of OP0.  Returns 1 if the call was successful.  */
2071
2072 bool
2073 expand_twoval_binop_libfunc (optab binoptab, rtx op0, rtx op1,
2074                              rtx targ0, rtx targ1, enum rtx_code code)
2075 {
2076   machine_mode mode;
2077   machine_mode libval_mode;
2078   rtx libval;
2079   rtx_insn *insns;
2080   rtx libfunc;
2081
2082   /* Exactly one of TARG0 or TARG1 should be non-NULL.  */
2083   gcc_assert (!targ0 != !targ1);
2084
2085   mode = GET_MODE (op0);
2086   libfunc = optab_libfunc (binoptab, mode);
2087   if (!libfunc)
2088     return false;
2089
2090   /* The value returned by the library function will have twice as
2091      many bits as the nominal MODE.  */
2092   libval_mode = smallest_int_mode_for_size (2 * GET_MODE_BITSIZE (mode));
2093   start_sequence ();
2094   libval = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
2095                                     libval_mode, 2,
2096                                     op0, mode,
2097                                     op1, mode);
2098   /* Get the part of VAL containing the value that we want.  */
2099   libval = simplify_gen_subreg (mode, libval, libval_mode,
2100                                 targ0 ? 0 : GET_MODE_SIZE (mode));
2101   insns = get_insns ();
2102   end_sequence ();
2103   /* Move the into the desired location.  */
2104   emit_libcall_block (insns, targ0 ? targ0 : targ1, libval,
2105                       gen_rtx_fmt_ee (code, mode, op0, op1));
2106
2107   return true;
2108 }
2109
2110 \f
2111 /* Wrapper around expand_unop which takes an rtx code to specify
2112    the operation to perform, not an optab pointer.  All other
2113    arguments are the same.  */
2114 rtx
2115 expand_simple_unop (machine_mode mode, enum rtx_code code, rtx op0,
2116                     rtx target, int unsignedp)
2117 {
2118   optab unop = code_to_optab (code);
2119   gcc_assert (unop);
2120
2121   return expand_unop (mode, unop, op0, target, unsignedp);
2122 }
2123
2124 /* Try calculating
2125         (clz:narrow x)
2126    as
2127         (clz:wide (zero_extend:wide x)) - ((width wide) - (width narrow)).
2128
2129    A similar operation can be used for clrsb.  UNOPTAB says which operation
2130    we are trying to expand.  */
2131 static rtx
2132 widen_leading (scalar_int_mode mode, rtx op0, rtx target, optab unoptab)
2133 {
2134   opt_scalar_int_mode wider_mode_iter;
2135   FOR_EACH_WIDER_MODE (wider_mode_iter, mode)
2136     {
2137       scalar_int_mode wider_mode = wider_mode_iter.require ();
2138       if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2139         {
2140           rtx xop0, temp;
2141           rtx_insn *last;
2142
2143           last = get_last_insn ();
2144
2145           if (target == 0)
2146             target = gen_reg_rtx (mode);
2147           xop0 = widen_operand (op0, wider_mode, mode,
2148                                 unoptab != clrsb_optab, false);
2149           temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
2150                               unoptab != clrsb_optab);
2151           if (temp != 0)
2152             temp = expand_binop
2153               (wider_mode, sub_optab, temp,
2154                gen_int_mode (GET_MODE_PRECISION (wider_mode)
2155                              - GET_MODE_PRECISION (mode),
2156                              wider_mode),
2157                target, true, OPTAB_DIRECT);
2158           if (temp == 0)
2159             delete_insns_since (last);
2160
2161           return temp;
2162         }
2163     }
2164   return 0;
2165 }
2166
2167 /* Try calculating clz of a double-word quantity as two clz's of word-sized
2168    quantities, choosing which based on whether the high word is nonzero.  */
2169 static rtx
2170 expand_doubleword_clz (scalar_int_mode mode, rtx op0, rtx target)
2171 {
2172   rtx xop0 = force_reg (mode, op0);
2173   rtx subhi = gen_highpart (word_mode, xop0);
2174   rtx sublo = gen_lowpart (word_mode, xop0);
2175   rtx_code_label *hi0_label = gen_label_rtx ();
2176   rtx_code_label *after_label = gen_label_rtx ();
2177   rtx_insn *seq;
2178   rtx temp, result;
2179
2180   /* If we were not given a target, use a word_mode register, not a
2181      'mode' register.  The result will fit, and nobody is expecting
2182      anything bigger (the return type of __builtin_clz* is int).  */
2183   if (!target)
2184     target = gen_reg_rtx (word_mode);
2185
2186   /* In any case, write to a word_mode scratch in both branches of the
2187      conditional, so we can ensure there is a single move insn setting
2188      'target' to tag a REG_EQUAL note on.  */
2189   result = gen_reg_rtx (word_mode);
2190
2191   start_sequence ();
2192
2193   /* If the high word is not equal to zero,
2194      then clz of the full value is clz of the high word.  */
2195   emit_cmp_and_jump_insns (subhi, CONST0_RTX (word_mode), EQ, 0,
2196                            word_mode, true, hi0_label);
2197
2198   temp = expand_unop_direct (word_mode, clz_optab, subhi, result, true);
2199   if (!temp)
2200     goto fail;
2201
2202   if (temp != result)
2203     convert_move (result, temp, true);
2204
2205   emit_jump_insn (targetm.gen_jump (after_label));
2206   emit_barrier ();
2207
2208   /* Else clz of the full value is clz of the low word plus the number
2209      of bits in the high word.  */
2210   emit_label (hi0_label);
2211
2212   temp = expand_unop_direct (word_mode, clz_optab, sublo, 0, true);
2213   if (!temp)
2214     goto fail;
2215   temp = expand_binop (word_mode, add_optab, temp,
2216                        gen_int_mode (GET_MODE_BITSIZE (word_mode), word_mode),
2217                        result, true, OPTAB_DIRECT);
2218   if (!temp)
2219     goto fail;
2220   if (temp != result)
2221     convert_move (result, temp, true);
2222
2223   emit_label (after_label);
2224   convert_move (target, result, true);
2225
2226   seq = get_insns ();
2227   end_sequence ();
2228
2229   add_equal_note (seq, target, CLZ, xop0, 0);
2230   emit_insn (seq);
2231   return target;
2232
2233  fail:
2234   end_sequence ();
2235   return 0;
2236 }
2237
2238 /* Try calculating popcount of a double-word quantity as two popcount's of
2239    word-sized quantities and summing up the results.  */
2240 static rtx
2241 expand_doubleword_popcount (scalar_int_mode mode, rtx op0, rtx target)
2242 {
2243   rtx t0, t1, t;
2244   rtx_insn *seq;
2245
2246   start_sequence ();
2247
2248   t0 = expand_unop_direct (word_mode, popcount_optab,
2249                            operand_subword_force (op0, 0, mode), NULL_RTX,
2250                            true);
2251   t1 = expand_unop_direct (word_mode, popcount_optab,
2252                            operand_subword_force (op0, 1, mode), NULL_RTX,
2253                            true);
2254   if (!t0 || !t1)
2255     {
2256       end_sequence ();
2257       return NULL_RTX;
2258     }
2259
2260   /* If we were not given a target, use a word_mode register, not a
2261      'mode' register.  The result will fit, and nobody is expecting
2262      anything bigger (the return type of __builtin_popcount* is int).  */
2263   if (!target)
2264     target = gen_reg_rtx (word_mode);
2265
2266   t = expand_binop (word_mode, add_optab, t0, t1, target, 0, OPTAB_DIRECT);
2267
2268   seq = get_insns ();
2269   end_sequence ();
2270
2271   add_equal_note (seq, t, POPCOUNT, op0, 0);
2272   emit_insn (seq);
2273   return t;
2274 }
2275
2276 /* Try calculating
2277         (parity:wide x)
2278    as
2279         (parity:narrow (low (x) ^ high (x))) */
2280 static rtx
2281 expand_doubleword_parity (scalar_int_mode mode, rtx op0, rtx target)
2282 {
2283   rtx t = expand_binop (word_mode, xor_optab,
2284                         operand_subword_force (op0, 0, mode),
2285                         operand_subword_force (op0, 1, mode),
2286                         NULL_RTX, 0, OPTAB_DIRECT);
2287   return expand_unop (word_mode, parity_optab, t, target, true);
2288 }
2289
2290 /* Try calculating
2291         (bswap:narrow x)
2292    as
2293         (lshiftrt:wide (bswap:wide x) ((width wide) - (width narrow))).

        MODE is the narrow mode of OP0.  The first wider integer mode that
        has a bswap handler is used.  On success the narrowed result is moved
        into TARGET (a new MODE register when TARGET is null) and that rtx is
        returned.  Returns NULL_RTX when no wider mode has a handler, or when
        the wide expansion fails; in the latter case every insn emitted here
        is deleted again.  */
2294 static rtx
2295 widen_bswap (scalar_int_mode mode, rtx op0, rtx target)
2296 {
2297   rtx x;
2298   rtx_insn *last;
2299   opt_scalar_int_mode wider_mode_iter;
2300 
       /* Stop at the first wider mode that has a bswap pattern.  */
2301   FOR_EACH_WIDER_MODE (wider_mode_iter, mode)
2302     if (optab_handler (bswap_optab, wider_mode_iter.require ())
2303         != CODE_FOR_nothing)
2304       break;
2305 
2306   if (!wider_mode_iter.exists ())
2307     return NULL_RTX;
2308 
2309   scalar_int_mode wider_mode = wider_mode_iter.require ();
       /* Remember where we started so a failed attempt can be undone.  */
2310   last = get_last_insn ();
2311 
2312   x = widen_operand (op0, wider_mode, mode, true, true);
2313   x = expand_unop (wider_mode, bswap_optab, x, NULL_RTX, true);
2314 
2315   gcc_assert (GET_MODE_PRECISION (wider_mode) == GET_MODE_BITSIZE (wider_mode)
2316               && GET_MODE_PRECISION (mode) == GET_MODE_BITSIZE (mode));
       /* After the wide swap the bytes of interest sit in the high part;
          shift them down by the difference in width.  */
2317   if (x != 0)
2318     x = expand_shift (RSHIFT_EXPR, wider_mode, x,
2319                       GET_MODE_BITSIZE (wider_mode)
2320                       - GET_MODE_BITSIZE (mode),
2321                       NULL_RTX, true);
2322 
2323   if (x == 0)
2324     {
           /* Report failure explicitly.  Returning the caller's TARGET here
              would look like success, because callers test the result for
              being non-null.  */
2325       delete_insns_since (last);
2326       return NULL_RTX;
2327     }
2328 
2329   if (target == 0)
2330     target = gen_reg_rtx (mode);
2331   emit_move_insn (target, gen_lowpart (mode, x));
2332   return target;
2333 }
2334
2335 /* Byte-swap the double-word value OP of mode MODE by byte-swapping each
2336    word_mode half and storing the two results in exchanged word positions.  */
2337 static rtx
2338 expand_doubleword_bswap (machine_mode mode, rtx op, rtx target)
2339 {
2340   /* Swap the bytes of word 0 first, then of word 1; no target is suggested.  */
2341   rtx swapped_word0 = expand_unop (word_mode, bswap_optab,
2342                                    operand_subword_force (op, 0, mode),
2343                                    NULL_RTX, true);
2344   rtx swapped_word1 = expand_unop (word_mode, bswap_optab,
2345                                    operand_subword_force (op, 1, mode),
2346                                    NULL_RTX, true);
2347   if (!target || !valid_multiword_target_p (target))
2348     target = gen_reg_rtx (mode);
2349   if (REG_P (target))
2350     emit_clobber (target);
2351   /* Word 1's swapped bytes land in word 0 of TARGET, and vice versa.  */
2352   emit_move_insn (operand_subword (target, 0, 1, mode), swapped_word1);
2353   emit_move_insn (operand_subword (target, 1, 1, mode), swapped_word0);
2354   return target;
2355 }
2356
2357 /* Try calculating (parity x) as (and (popcount x) 1), where
2358    popcount can also be done in a wider mode.

        MODE is the mode of OP0.  Candidate modes are visited with
        FOR_EACH_MODE_FROM starting at MODE; the first one that has a
        popcount handler and whose expansion succeeds is used, and its
        result is converted back to MODE before being returned.  TARGET is
        only used when it already has the mode the AND is performed in.
        Returns 0 if no candidate mode worked.  */
2359 static rtx
2360 expand_parity (scalar_int_mode mode, rtx op0, rtx target)
2361 {
2362   enum mode_class mclass = GET_MODE_CLASS (mode);
2363   opt_scalar_int_mode wider_mode_iter;
2364   FOR_EACH_MODE_FROM (wider_mode_iter, mode)
2365     {
2366       scalar_int_mode wider_mode = wider_mode_iter.require ();
2367       if (optab_handler (popcount_optab, wider_mode) != CODE_FOR_nothing)
2368         {
2369           rtx xop0, temp;
2370           rtx_insn *last;
2371 
               /* Remember the insn stream position so a failed attempt can
                  be rolled back.  */
2372           last = get_last_insn ();
2373 
               /* The AND below is done in WIDER_MODE, so it needs a target
                  of that mode.  */
2374           if (target == 0 || GET_MODE (target) != wider_mode)
2375             target = gen_reg_rtx (wider_mode);
2376 
2377           xop0 = widen_operand (op0, wider_mode, mode, true, false);
2378           temp = expand_unop (wider_mode, popcount_optab, xop0, NULL_RTX,
2379                               true);
               /* Keep only the low bit of the population count.  */
2380           if (temp != 0)
2381             temp = expand_binop (wider_mode, and_optab, temp, const1_rtx,
2382                                  target, true, OPTAB_DIRECT);
2383 
2384           if (temp)
2385             {
                   /* Bring the WIDER_MODE result back to MODE.  */
2386               if (mclass != MODE_INT
2387                   || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
2388                 return convert_to_mode (mode, temp, 0);
2389               else
2390                 return gen_lowpart (mode, temp);
2391             }
2392           else
                 /* Discard the partial expansion and try the next mode.  */
2393             delete_insns_since (last);
2394         }
2395     }
2396   return 0;
2397 }
2398
2399 /* Try calculating ctz(x) as K - clz(x & -x) ,
2400    where K is GET_MODE_PRECISION(mode) - 1.
2401 
2402    Both __builtin_ctz and __builtin_clz are undefined at zero, so we
2403    don't have to worry about what the hardware does in that case.  (If
2404    the clz instruction yields K + 1 (the mode's precision) at 0, the
2405    result of this code sequence will be -1; expand_ffs, below, relies
2406    on this.  It might be nice to have it be K instead, for consistency
2407    with the (very few) processors that provide a ctz with a defined
2408    value, but that would take one more instruction, and it would be
2409    less convenient for expand_ffs anyway.)

        MODE is the mode of OP0; the final subtraction is expanded into
        TARGET if convenient.  Returns the rtx holding the result, or 0 if
        MODE has no clz handler or any step of the sequence cannot be
        expanded directly.  */
2410 
2411 static rtx
2412 expand_ctz (scalar_int_mode mode, rtx op0, rtx target)
2413 {
2414   rtx_insn *seq;
2415   rtx temp;
2416 
2417   if (optab_handler (clz_optab, mode) == CODE_FOR_nothing)
2418     return 0;
2419 
       /* Collect the insns in a sequence of their own so that the
          REG_EQUAL note can be added before they are emitted.  */
2420   start_sequence ();
2421 
       /* temp = -x  */
2422   temp = expand_unop_direct (mode, neg_optab, op0, NULL_RTX, true);
       /* temp = x & -x  */
2423   if (temp)
2424     temp = expand_binop (mode, and_optab, op0, temp, NULL_RTX,
2425                          true, OPTAB_DIRECT);
       /* temp = clz (x & -x)  */
2426   if (temp)
2427     temp = expand_unop_direct (mode, clz_optab, temp, NULL_RTX, true);
       /* temp = K - clz (x & -x)  */
2428   if (temp)
2429     temp = expand_binop (mode, sub_optab,
2430                          gen_int_mode (GET_MODE_PRECISION (mode) - 1, mode),
2431                          temp, target,
2432                          true, OPTAB_DIRECT);
       /* Any failed step abandons the whole sequence.  */
2433   if (temp == 0)
2434     {
2435       end_sequence ();
2436       return 0;
2437     }
2438 
2439   seq = get_insns ();
2440   end_sequence ();
2441 
2442   add_equal_note (seq, temp, CTZ, op0, 0);
2443   emit_insn (seq);
2444   return temp;
2445 }
2446
2447
2448 /* Try calculating ffs(x) using ctz(x) if we have that instruction, or
2449    else with the sequence used by expand_ctz.
2450 
2451    The ffs builtin promises to return zero for a zero value and ctz/clz
2452    may have an undefined value in that case.  If they do not give us a
2453    convenient value, we have to generate a test and branch.

        MODE is the mode of OP0; the final addition is expanded into TARGET
        if convenient.  Returns the rtx holding the result, or 0 if MODE has
        neither a ctz nor a clz handler or if an expansion step fails.  */
2454 static rtx
2455 expand_ffs (scalar_int_mode mode, rtx op0, rtx target)
2456 {
       /* VAL receives the value the target defines for a zero operand,
          expressed (after the adjustment below) as a ctz result.  */
2457   HOST_WIDE_INT val = 0;
2458   bool defined_at_zero = false;
2459   rtx temp;
2460   rtx_insn *seq;
2461 
2462   if (optab_handler (ctz_optab, mode) != CODE_FOR_nothing)
2463     {
2464       start_sequence ();
2465 
2466       temp = expand_unop_direct (mode, ctz_optab, op0, 0, true);
2467       if (!temp)
2468         goto fail;
2469 
2470       defined_at_zero = (CTZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2);
2471     }
2472   else if (optab_handler (clz_optab, mode) != CODE_FOR_nothing)
2473     {
2474       start_sequence ();
2475       temp = expand_ctz (mode, op0, 0);
2476       if (!temp)
2477         goto fail;
2478 
2479       if (CLZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2)
2480         {
2481           defined_at_zero = true;
               /* Translate the clz value at zero into what the
                  K - clz (x & -x) sequence of expand_ctz produces.  */
2482           val = (GET_MODE_PRECISION (mode) - 1) - val;
2483         }
2484     }
2485   else
         /* No sequence has been started on this path, so return directly
            rather than through the fail label.  */
2486     return 0;
2487 
2488   if (defined_at_zero && val == -1)
2489     /* No correction needed at zero.  */;
2490   else
2491     {
2492       /* We don't try to do anything clever with the situation found
2493          on some processors (eg Alpha) where ctz(0:mode) ==
2494          bitsize(mode).  If someone can think of a way to send N to -1
2495          and leave alone all values in the range 0..N-1 (where N is a
2496          power of two), cheaper than this test-and-branch, please add it.
2497 
2498          The test-and-branch is done after the operation itself, in case
2499          the operation sets condition codes that can be recycled for this.
2500          (This is true on i386, for instance.)  */
2501 
2502       rtx_code_label *nonzero_label = gen_label_rtx ();
2503       emit_cmp_and_jump_insns (op0, CONST0_RTX (mode), NE, 0,
2504                                mode, true, nonzero_label);
2505 
           /* Reached only when OP0 is zero: force the intermediate result
              to -1 so that the increment below yields 0.  */
2506       convert_move (temp, GEN_INT (-1), false);
2507       emit_label (nonzero_label);
2508     }
2509 
2510   /* temp now has a value in the range -1..bitsize-1.  ffs is supposed
2511      to produce a value in the range 0..bitsize.  */
2512   temp = expand_binop (mode, add_optab, temp, gen_int_mode (1, mode),
2513                        target, false, OPTAB_DIRECT);
2514   if (!temp)
2515     goto fail;
2516 
2517   seq = get_insns ();
2518   end_sequence ();
2519 
2520   add_equal_note (seq, temp, FFS, op0, 0);
2521   emit_insn (seq);
2522   return temp;
2523 
       /* Close the pending sequence without emitting its insns.  */
2524  fail:
2525   end_sequence ();
2526   return 0;
2527 }
2528
2529 /* Return the low-order OMODE part of VAL, whose mode is IMODE.  A direct
2530    lowpart SUBREG cannot always be formed (for instance when VAL is itself
2531    a SUBREG); when the first attempt yields nothing, VAL is forced into an
2532    IMODE register and the SUBREG is taken of that register instead.  */
2533 
2534 static rtx
2535 lowpart_subreg_maybe_copy (machine_mode omode, rtx val,
2536                            machine_mode imode)
2537 {
2538   rtx lowpart = lowpart_subreg (omode, val, imode);
2539   if (lowpart != NULL)
2540     return lowpart;
2541 
2542   /* Direct extraction failed: retry on a register copy, which must work.  */
2543   rtx copy = force_reg (imode, val);
2544   lowpart = lowpart_subreg (omode, copy, imode);
2545   gcc_assert (lowpart != NULL);
2546   return lowpart;
2547 }
2548
2549 /* Expand a floating point absolute value or negation operation via a
2550    logical operation on the sign bit.

        CODE selects the operation: for ABS the sign bit is cleared with an
        AND, otherwise it is flipped with an XOR.  MODE is the float mode of
        OP0; the result goes to TARGET if convenient.  Returns the rtx
        holding the result, or NULL_RTX when the format is unknown or has no
        simple sign bit, when CODE is NEG and the format has no signed zero,
        or when a value of at most one word has no matching integer mode.  */
2551 
2552 static rtx
2553 expand_absneg_bit (enum rtx_code code, scalar_float_mode mode,
2554                    rtx op0, rtx target)
2555 {
2556   const struct real_format *fmt;
2557   int bitpos, word, nwords, i;
2558   scalar_int_mode imode;
2559   rtx temp;
2560   rtx_insn *insns;
2561 
2562   /* The format has to have a simple sign bit.  */
2563   fmt = REAL_MODE_FORMAT (mode);
2564   if (fmt == NULL)
2565     return NULL_RTX;
2566 
2567   bitpos = fmt->signbit_rw;
2568   if (bitpos < 0)
2569     return NULL_RTX;
2570 
2571   /* Don't create negative zeros if the format doesn't support them.  */
2572   if (code == NEG && !fmt->has_signed_zero)
2573     return NULL_RTX;
2574 
2575   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
2576     {
           /* The value fits in one word: operate on it as a single integer
              of the corresponding integer mode.  */
2577       if (!int_mode_for_mode (mode).exists (&imode))
2578         return NULL_RTX;
2579       word = 0;
2580       nwords = 1;
2581     }
2582   else
2583     {
           /* Multi-word value: work a word at a time.  WORD becomes the
              index of the word holding the sign bit and BITPOS the bit
              position within that word.  */
2584       imode = word_mode;
2585 
2586       if (FLOAT_WORDS_BIG_ENDIAN)
2587         word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
2588       else
2589         word = bitpos / BITS_PER_WORD;
2590       bitpos = bitpos % BITS_PER_WORD;
2591       nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
2592     }
2593 
       /* MASK has only the sign bit set; for ABS it is inverted so that the
          AND clears just that bit.  */
2594   wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
2595   if (code == ABS)
2596     mask = ~mask;
2597 
       /* Use a new register when no target was given, when TARGET is OP0
          itself, or when TARGET cannot serve as a multiword target.  */
2598   if (target == 0
2599       || target == op0
2600       || (nwords > 1 && !valid_multiword_target_p (target)))
2601     target = gen_reg_rtx (mode);
2602 
2603   if (nwords > 1)
2604     {
2605       start_sequence ();
2606 
2607       for (i = 0; i < nwords; ++i)
2608         {
2609           rtx targ_piece = operand_subword (target, i, 1, mode);
2610           rtx op0_piece = operand_subword_force (op0, i, mode);
2611 
               /* Only the word containing the sign bit is modified; every
                  other word is copied unchanged.  */
2612           if (i == word)
2613             {
2614               temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
2615                                    op0_piece,
2616                                    immed_wide_int_const (mask, imode),
2617                                    targ_piece, 1, OPTAB_LIB_WIDEN);
2618               if (temp != targ_piece)
2619                 emit_move_insn (targ_piece, temp);
2620             }
2621           else
2622             emit_move_insn (targ_piece, op0_piece);
2623         }
2624 
2625       insns = get_insns ();
2626       end_sequence ();
2627 
2628       emit_insn (insns);
2629     }
2630   else
2631     {
           /* Single-word case: apply the mask to the integer view of OP0,
              then view the integer result in MODE again.  */
2632       temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
2633                            gen_lowpart (imode, op0),
2634                            immed_wide_int_const (mask, imode),
2635                            gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
2636       target = lowpart_subreg_maybe_copy (mode, temp, imode);
2637 
           /* Record on the last insn that TARGET equals (CODE OP0).  */
2638       set_dst_reg_note (get_last_insn (), REG_EQUAL,
2639                         gen_rtx_fmt_e (code, mode, copy_rtx (op0)),
2640                         target);
2641     }
2642 
2643   return target;
2644 }
2645
2646 /* As expand_unop, but will fail rather than attempt the operation in a
2647    different mode or with a libcall.

        MODE, UNOPTAB, OP0, TARGET and UNSIGNEDP are as for expand_unop.
        Returns the rtx of the output operand on success, or 0 if MODE has no
        handler for UNOPTAB or the insn could not be generated.  In one case
        (a multi-insn expansion that cannot take a REG_EQUAL note) the
        operation is retried through expand_unop with no target.  */
2648 static rtx
2649 expand_unop_direct (machine_mode mode, optab unoptab, rtx op0, rtx target,
2650                     int unsignedp)
2651 {
2652   if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
2653     {
2654       struct expand_operand ops[2];
2655       enum insn_code icode = optab_handler (unoptab, mode);
2656       rtx_insn *last = get_last_insn ();
2657       rtx_insn *pat;
2658 
           /* Operand 0 is the result, operand 1 the (possibly converted)
              input.  */
2659       create_output_operand (&ops[0], target, mode);
2660       create_convert_operand_from (&ops[1], op0, mode, unsignedp);
2661       pat = maybe_gen_insn (icode, 2, ops);
2662       if (pat)
2663         {
               /* When the pattern expanded to more than one insn, try to
                  describe the overall result with a REG_EQUAL note; if the
                  note cannot be added, undo and retry without TARGET.  */
2664           if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
2665               && ! add_equal_note (pat, ops[0].value,
2666                                    optab_to_code (unoptab),
2667                                    ops[1].value, NULL_RTX))
2668             {
2669               delete_insns_since (last);
2670               return expand_unop (mode, unoptab, op0, NULL_RTX, unsignedp);
2671             }
2672 
2673           emit_insn (pat);
2674 
2675           return ops[0].value;
2676         }
2677     }
2678   return 0;
2679 }
2680
2681 /* Generate code to perform an operation specified by UNOPTAB
2682    on operand OP0, with result having machine-mode MODE.
2683 
2684    UNSIGNEDP is for the case where we have to widen the operands
2685    to perform the operation.  It says to use zero-extension.
2686 
2687    If TARGET is nonzero, the value
2688    is generated there, if it is convenient to do so.
2689    In all cases an rtx is returned for the locus of the value;
2690    this may or may not be TARGET.

        Strategies are tried in this order: a direct insn in MODE; special
        handling for clz, clrsb, popcount, parity and bswap; open-coding in a
        wider mode; word-at-a-time one's complement; sign-bit or subtraction
        tricks for negation; parity, ffs and ctz synthesized from other
        operations; a library call in MODE; a wider mode with an insn or a
        library call; and finally negation by a widening subtraction.
        Returns 0 if every strategy fails.  */
2691 
2692 rtx
2693 expand_unop (machine_mode mode, optab unoptab, rtx op0, rtx target,
2694              int unsignedp)
2695 {
2696   enum mode_class mclass = GET_MODE_CLASS (mode);
2697   machine_mode wider_mode;
2698   scalar_int_mode int_mode;
2699   scalar_float_mode float_mode;
2700   rtx temp;
2701   rtx libfunc;
2702 
2703   temp = expand_unop_direct (mode, unoptab, op0, target, unsignedp);
2704   if (temp)
2705     return temp;
2706 
2707   /* It can't be done in this mode.  Can we open-code it in a wider mode?  */
2708 
2709   /* Widening (or narrowing) clz needs special treatment.  */
2710   if (unoptab == clz_optab)
2711     {
2712       if (is_a <scalar_int_mode> (mode, &int_mode))
2713         {
2714           temp = widen_leading (int_mode, op0, target, unoptab);
2715           if (temp)
2716             return temp;
2717 
2718           if (GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2719               && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
2720             {
2721               temp = expand_doubleword_clz (int_mode, op0, target);
2722               if (temp)
2723                 return temp;
2724             }
2725         }
2726 
           /* Skip the generic widening code below; it does not apply the
              adjustment clz needs.  */
2727       goto try_libcall;
2728     }
2729 
2730   if (unoptab == clrsb_optab)
2731     {
2732       if (is_a <scalar_int_mode> (mode, &int_mode))
2733         {
2734           temp = widen_leading (int_mode, op0, target, unoptab);
2735           if (temp)
2736             return temp;
2737         }
2738       goto try_libcall;
2739     }
2740 
       /* Double-word popcount from word_mode popcount, only when
          optimizing this insn for speed.  */
2741   if (unoptab == popcount_optab
2742       && is_a <scalar_int_mode> (mode, &int_mode)
2743       && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2744       && optab_handler (unoptab, word_mode) != CODE_FOR_nothing
2745       && optimize_insn_for_speed_p ())
2746     {
2747       temp = expand_doubleword_popcount (int_mode, op0, target);
2748       if (temp)
2749         return temp;
2750     }
2751 
       /* Double-word parity needs either a word_mode parity or a word_mode
          popcount to build on.  */
2752   if (unoptab == parity_optab
2753       && is_a <scalar_int_mode> (mode, &int_mode)
2754       && GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2755       && (optab_handler (unoptab, word_mode) != CODE_FOR_nothing
2756           || optab_handler (popcount_optab, word_mode) != CODE_FOR_nothing)
2757       && optimize_insn_for_speed_p ())
2758     {
2759       temp = expand_doubleword_parity (int_mode, op0, target);
2760       if (temp)
2761         return temp;
2762     }
2763 
2764   /* Widening (or narrowing) bswap needs special treatment.  */
2765   if (unoptab == bswap_optab)
2766     {
2767       /* HImode is special because in this mode BSWAP is equivalent to ROTATE
2768          or ROTATERT.  First try these directly; if this fails, then try the
2769          obvious pair of shifts with allowed widening, as this will probably
2770          be always more efficient than the other fallback methods.  */
2771       if (mode == HImode)
2772         {
2773           rtx_insn *last;
2774           rtx temp1, temp2;
2775 
2776           if (optab_handler (rotl_optab, mode) != CODE_FOR_nothing)
2777             {
2778               temp = expand_binop (mode, rotl_optab, op0, GEN_INT (8), target,
2779                                    unsignedp, OPTAB_DIRECT);
2780               if (temp)
2781                 return temp;
2782              }
2783 
2784           if (optab_handler (rotr_optab, mode) != CODE_FOR_nothing)
2785             {
2786               temp = expand_binop (mode, rotr_optab, op0, GEN_INT (8), target,
2787                                    unsignedp, OPTAB_DIRECT);
2788               if (temp)
2789                 return temp;
2790             }
2791 
2792           last = get_last_insn ();
2793 
               /* (x << 8) | (x >> 8), each step allowed to widen.  */
2794           temp1 = expand_binop (mode, ashl_optab, op0, GEN_INT (8), NULL_RTX,
2795                                 unsignedp, OPTAB_WIDEN);
2796           temp2 = expand_binop (mode, lshr_optab, op0, GEN_INT (8), NULL_RTX,
2797                                 unsignedp, OPTAB_WIDEN);
2798           if (temp1 && temp2)
2799             {
2800               temp = expand_binop (mode, ior_optab, temp1, temp2, target,
2801                                    unsignedp, OPTAB_WIDEN);
2802               if (temp)
2803                 return temp;
2804             }
2805 
2806           delete_insns_since (last);
2807         }
2808 
2809       if (is_a <scalar_int_mode> (mode, &int_mode))
2810         {
2811           temp = widen_bswap (int_mode, op0, target);
2812           if (temp)
2813             return temp;
2814 
2815           if (GET_MODE_SIZE (int_mode) == 2 * UNITS_PER_WORD
2816               && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
2817             {
2818               temp = expand_doubleword_bswap (mode, op0, target);
2819               if (temp)
2820                 return temp;
2821             }
2822         }
2823 
2824       goto try_libcall;
2825     }
2826 
       /* Generic case: look for a wider mode with an insn for UNOPTAB.  */
2827   if (CLASS_HAS_WIDER_MODES_P (mclass))
2828     FOR_EACH_WIDER_MODE (wider_mode, mode)
2829       {
2830         if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2831           {
2832             rtx xop0 = op0;
2833             rtx_insn *last = get_last_insn ();
2834 
2835             /* For certain operations, we need not actually extend
2836                the narrow operand, as long as we will truncate the
2837                results to the same narrowness.  */
2838 
2839             xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
2840                                   (unoptab == neg_optab
2841                                    || unoptab == one_cmpl_optab)
2842                                   && mclass == MODE_INT);
2843 
2844             temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
2845                                 unsignedp);
2846 
2847             if (temp)
2848               {
                     /* Narrow the wide result back to MODE.  */
2849                 if (mclass != MODE_INT
2850                     || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
2851                   {
2852                     if (target == 0)
2853                       target = gen_reg_rtx (mode);
2854                     convert_move (target, temp, 0);
2855                     return target;
2856                   }
2857                 else
2858                   return gen_lowpart (mode, temp);
2859               }
2860             else
2861               delete_insns_since (last);
2862           }
2863       }
2864 
2865   /* These can be done a word at a time.  */
2866   if (unoptab == one_cmpl_optab
2867       && is_int_mode (mode, &int_mode)
2868       && GET_MODE_SIZE (int_mode) > UNITS_PER_WORD
2869       && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
2870     {
2871       int i;
2872       rtx_insn *insns;
2873 
2874       if (target == 0 || target == op0 || !valid_multiword_target_p (target))
2875         target = gen_reg_rtx (int_mode);
2876 
2877       start_sequence ();
2878 
2879       /* Do the actual arithmetic.  */
2880       for (i = 0; i < GET_MODE_BITSIZE (int_mode) / BITS_PER_WORD; i++)
2881         {
2882           rtx target_piece = operand_subword (target, i, 1, int_mode);
2883           rtx x = expand_unop (word_mode, unoptab,
2884                                operand_subword_force (op0, i, int_mode),
2885                                target_piece, unsignedp);
2886 
2887           if (target_piece != x)
2888             emit_move_insn (target_piece, x);
2889         }
2890 
2891       insns = get_insns ();
2892       end_sequence ();
2893 
2894       emit_insn (insns);
2895       return target;
2896     }
2897 
2898   if (optab_to_code (unoptab) == NEG)
2899     {
2900       /* Try negating floating point values by flipping the sign bit.  */
2901       if (is_a <scalar_float_mode> (mode, &float_mode))
2902         {
2903           temp = expand_absneg_bit (NEG, float_mode, op0, target);
2904           if (temp)
2905             return temp;
2906         }
2907 
2908       /* If there is no negation pattern, and we have no negative zero,
2909          try subtracting from zero.  */
2910       if (!HONOR_SIGNED_ZEROS (mode))
2911         {
2912           temp = expand_binop (mode, (unoptab == negv_optab
2913                                       ? subv_optab : sub_optab),
2914                                CONST0_RTX (mode), op0, target,
2915                                unsignedp, OPTAB_DIRECT);
2916           if (temp)
2917             return temp;
2918         }
2919     }
2920 
2921   /* Try calculating parity (x) as popcount (x) % 2.  */
2922   if (unoptab == parity_optab && is_a <scalar_int_mode> (mode, &int_mode))
2923     {
2924       temp = expand_parity (int_mode, op0, target);
2925       if (temp)
2926         return temp;
2927     }
2928 
2929   /* Try implementing ffs (x) in terms of clz (x).  */
2930   if (unoptab == ffs_optab && is_a <scalar_int_mode> (mode, &int_mode))
2931     {
2932       temp = expand_ffs (int_mode, op0, target);
2933       if (temp)
2934         return temp;
2935     }
2936 
2937   /* Try implementing ctz (x) in terms of clz (x).  */
2938   if (unoptab == ctz_optab && is_a <scalar_int_mode> (mode, &int_mode))
2939     {
2940       temp = expand_ctz (int_mode, op0, target);
2941       if (temp)
2942         return temp;
2943     }
2944 
2945  try_libcall:
2946   /* Now try a library call in this mode.  */
2947   libfunc = optab_libfunc (unoptab, mode);
2948   if (libfunc)
2949     {
2950       rtx_insn *insns;
2951       rtx value;
2952       rtx eq_value;
2953       machine_mode outmode = mode;
2954 
2955       /* All of these functions return small values.  Thus we choose to
2956          have them return something that isn't a double-word.  */
2957       if (unoptab == ffs_optab || unoptab == clz_optab || unoptab == ctz_optab
2958           || unoptab == clrsb_optab || unoptab == popcount_optab
2959           || unoptab == parity_optab)
2960         outmode
2961           = GET_MODE (hard_libcall_value (TYPE_MODE (integer_type_node),
2962                                           optab_libfunc (unoptab, mode)));
2963 
2964       start_sequence ();
2965 
2966       /* Pass 1 for NO_QUEUE so we don't lose any increments
2967          if the libcall is cse'd or moved.  */
           /* NOTE(review): exactly one operand/mode pair (OP0, MODE) follows
              the literal 1 below, so it looks like an argument count; the
              NO_QUEUE wording above may be stale -- confirm against the
              declaration of emit_library_call_value.  */
2968       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, outmode,
2969                                        1, op0, mode);
2970       insns = get_insns ();
2971       end_sequence ();
2972 
2973       target = gen_reg_rtx (outmode);
2974       bool trapv = trapv_unoptab_p (unoptab);
           /* For non-trapping operations build an rtx equivalent to the call
              result, adjusted to OUTMODE when that differs in size.  */
2975       if (trapv)
2976         eq_value = NULL_RTX;
2977       else
2978         {
2979           eq_value = gen_rtx_fmt_e (optab_to_code (unoptab), mode, op0);
2980           if (GET_MODE_SIZE (outmode) < GET_MODE_SIZE (mode))
2981             eq_value = simplify_gen_unary (TRUNCATE, outmode, eq_value, mode);
2982           else if (GET_MODE_SIZE (outmode) > GET_MODE_SIZE (mode))
2983             eq_value = simplify_gen_unary (ZERO_EXTEND,
2984                                            outmode, eq_value, mode);
2985         }
2986       emit_libcall_block_1 (insns, target, value, eq_value, trapv);
2987 
2988       return target;
2989     }
2990 
2991   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2992 
2993   if (CLASS_HAS_WIDER_MODES_P (mclass))
2994     {
2995       FOR_EACH_WIDER_MODE (wider_mode, mode)
2996         {
               /* Unlike the earlier widening loop, a library function for
                  the wider mode is acceptable here too.  */
2997           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing
2998               || optab_libfunc (unoptab, wider_mode))
2999             {
3000               rtx xop0 = op0;
3001               rtx_insn *last = get_last_insn ();
3002 
3003               /* For certain operations, we need not actually extend
3004                  the narrow operand, as long as we will truncate the
3005                  results to the same narrowness.  */
3006               xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
3007                                     (unoptab == neg_optab
3008                                      || unoptab == one_cmpl_optab
3009                                      || unoptab == bswap_optab)
3010                                     && mclass == MODE_INT);
3011 
3012               temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
3013                                   unsignedp);
3014 
3015               /* If we are generating clz using wider mode, adjust the
3016                  result.  Similarly for clrsb.  */
3017               if ((unoptab == clz_optab || unoptab == clrsb_optab)
3018                   && temp != 0)
3019                 {
3020                   scalar_int_mode wider_int_mode
3021                     = as_a <scalar_int_mode> (wider_mode);
3022                   int_mode = as_a <scalar_int_mode> (mode);
3023                   temp = expand_binop
3024                     (wider_mode, sub_optab, temp,
3025                      gen_int_mode (GET_MODE_PRECISION (wider_int_mode)
3026                                    - GET_MODE_PRECISION (int_mode),
3027                                    wider_int_mode),
3028                      target, true, OPTAB_DIRECT);
3029                 }
3030 
3031               /* Likewise for bswap.  */
3032               if (unoptab == bswap_optab && temp != 0)
3033                 {
3034                   scalar_int_mode wider_int_mode
3035                     = as_a <scalar_int_mode> (wider_mode);
3036                   int_mode = as_a <scalar_int_mode> (mode);
3037                   gcc_assert (GET_MODE_PRECISION (wider_int_mode)
3038                               == GET_MODE_BITSIZE (wider_int_mode)
3039                               && GET_MODE_PRECISION (int_mode)
3040                                  == GET_MODE_BITSIZE (int_mode));
3041 
3042                   temp = expand_shift (RSHIFT_EXPR, wider_int_mode, temp,
3043                                        GET_MODE_BITSIZE (wider_int_mode)
3044                                        - GET_MODE_BITSIZE (int_mode),
3045                                        NULL_RTX, true);
3046                 }
3047 
3048               if (temp)
3049                 {
3050                   if (mclass != MODE_INT)
3051                     {
3052                       if (target == 0)
3053                         target = gen_reg_rtx (mode);
3054                       convert_move (target, temp, 0);
3055                       return target;
3056                     }
3057                   else
3058                     return gen_lowpart (mode, temp);
3059                 }
3060               else
3061                 delete_insns_since (last);
3062             }
3063         }
3064     }
3065 
3066   /* One final attempt at implementing negation via subtraction,
3067      this time allowing widening of the operand.  */
3068   if (optab_to_code (unoptab) == NEG && !HONOR_SIGNED_ZEROS (mode))
3069     {
3070       rtx temp;
3071       temp = expand_binop (mode,
3072                            unoptab == negv_optab ? subv_optab : sub_optab,
3073                            CONST0_RTX (mode), op0,
3074                            target, unsignedp, OPTAB_LIB_WIDEN);
3075       if (temp)
3076         return temp;
3077     }
3078 
3079   return 0;
3080 }
3081 \f
3082 /* Emit code to compute the absolute value of OP0, with result to
3083    TARGET if convenient.  (TARGET may be 0.)  The return value says
3084    where the result actually is to be found.
3085 
3086    MODE is the mode of the operand; the mode of the result is
3087    different but can be deduced from MODE.
3088 
        RESULT_UNSIGNEDP is forced to 1 unless MODE is an integer mode and
        flag_trapv is set; when it is zero the trapping optabs (absv, negv,
        subv) are used instead of the plain ones.

        No jump is emitted by this function: it returns NULL_RTX when none
        of the branch-free strategies below succeeds.
3089  */
3090 
3091 rtx
3092 expand_abs_nojump (machine_mode mode, rtx op0, rtx target,
3093                    int result_unsignedp)
3094 {
3095   rtx temp;
3096 
3097   if (GET_MODE_CLASS (mode) != MODE_INT
3098       || ! flag_trapv)
3099     result_unsignedp = 1;
3100 
3101   /* First try to do it with a special abs instruction.  */
3102   temp = expand_unop (mode, result_unsignedp ? abs_optab : absv_optab,
3103                       op0, target, 0);
3104   if (temp != 0)
3105     return temp;
3106 
3107   /* For floating point modes, try clearing the sign bit.  */
3108   scalar_float_mode float_mode;
3109   if (is_a <scalar_float_mode> (mode, &float_mode))
3110     {
3111       temp = expand_absneg_bit (ABS, float_mode, op0, target);
3112       if (temp)
3113         return temp;
3114     }
3115 
3116   /* If we have a MAX insn, we can do this as MAX (x, -x).  */
3117   if (optab_handler (smax_optab, mode) != CODE_FOR_nothing
3118       && !HONOR_SIGNED_ZEROS (mode))
3119     {
3120       rtx_insn *last = get_last_insn ();
3121 
3122       temp = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3123                           op0, NULL_RTX, 0);
3124       if (temp != 0)
3125         temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3126                              OPTAB_WIDEN);
3127 
3128       if (temp != 0)
3129         return temp;
3130 
           /* Undo the negation if the MAX could not be expanded.  */
3131       delete_insns_since (last);
3132     }
3133 
3134   /* If this machine has expensive jumps, we can do integer absolute
3135      value of X as (((signed) x >> (W-1)) ^ x) - ((signed) x >> (W-1)),
3136      where W is the width of MODE.  */
3137 
3138   scalar_int_mode int_mode;
3139   if (is_int_mode (mode, &int_mode)
3140       && BRANCH_COST (optimize_insn_for_speed_p (),
3141                       false) >= 2)
3142     {
           /* EXTENDED is the arithmetic shift of OP0 by W-1, i.e. the sign
              of OP0 replicated into every bit.  */
3143       rtx extended = expand_shift (RSHIFT_EXPR, int_mode, op0,
3144                                    GET_MODE_PRECISION (int_mode) - 1,
3145                                    NULL_RTX, 0);
3146 
3147       temp = expand_binop (int_mode, xor_optab, extended, op0, target, 0,
3148                            OPTAB_LIB_WIDEN);
3149       if (temp != 0)
3150         temp = expand_binop (int_mode,
3151                              result_unsignedp ? sub_optab : subv_optab,
3152                              temp, extended, target, 0, OPTAB_LIB_WIDEN);
3153 
3154       if (temp != 0)
3155         return temp;
3156     }
3157 
3158   return NULL_RTX;
3159 }
3160
/* Emit code to compute the absolute value of OP0 in mode MODE and return
   the rtx holding the result.  The branch-free strategies of
   expand_abs_nojump are tried first; if they all fail, OP0 is copied to
   the result location and negated there under a conditional jump that
   skips the negation when the value is >= 0.

   RESULT_UNSIGNEDP is forced to 1 unless MODE is an integer mode and
   flag_trapv is set; when it is zero the trapping negv_optab is used.
   SAFE nonzero allows TARGET itself to be used as the result location of
   the jump sequence; it is also set here when TARGET is OP0 and a pseudo
   register.  Otherwise, or when TARGET is null, of the wrong mode, a
   volatile MEM or a hard register, a new pseudo is used.  */
3161 rtx
3162 expand_abs (machine_mode mode, rtx op0, rtx target,
3163             int result_unsignedp, int safe)
3164 {
3165   rtx temp;
3166   rtx_code_label *op1;
3167 
3168   if (GET_MODE_CLASS (mode) != MODE_INT
3169       || ! flag_trapv)
3170     result_unsignedp = 1;
3171 
3172   temp = expand_abs_nojump (mode, op0, target, result_unsignedp);
3173   if (temp != 0)
3174     return temp;
3175 
3176   /* If that does not win, use conditional jump and negate.  */
3177 
3178   /* It is safe to use the target if it is the same
3179      as the source if this is also a pseudo register */
3180   if (op0 == target && REG_P (op0)
3181       && REGNO (op0) >= FIRST_PSEUDO_REGISTER)
3182     safe = 1;
3183 
       /* OP1 labels the point just after the negation.  */
3184   op1 = gen_label_rtx ();
3185   if (target == 0 || ! safe
3186       || GET_MODE (target) != mode
3187       || (MEM_P (target) && MEM_VOLATILE_P (target))
3188       || (REG_P (target)
3189           && REGNO (target) < FIRST_PSEUDO_REGISTER))
3190     target = gen_reg_rtx (mode);
3191 
3192   emit_move_insn (target, op0);
3193   NO_DEFER_POP;
3194 
       /* Jump to OP1, skipping the negation, when TARGET >= 0.  */
3195   do_compare_rtx_and_jump (target, CONST0_RTX (mode), GE, 0, mode,
3196                            NULL_RTX, NULL, op1,
3197                            profile_probability::uninitialized ());
3198 
       /* OP0 is reused here to hold the rtx of the negated value.  */
3199   op0 = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3200                      target, target, 0);
3201   if (op0 != target)
3202     emit_move_insn (target, op0);
3203   emit_label (op1);
3204   OK_DEFER_POP;
3205   return target;
3206 }
3207
3208 /* Emit code to compute the one's complement absolute value of OP0
3209    (if (OP0 < 0) OP0 = ~OP0), with result to TARGET if convenient.
3210    (TARGET may be NULL_RTX.)  The return value says where the result
3211    actually is to be found.
3212
3213    MODE is the mode of the operand; the mode of the result is
3214    different but can be deduced from MODE.  */
3215
3216 rtx
3217 expand_one_cmpl_abs_nojump (machine_mode mode, rtx op0, rtx target)
3218 {
3219   rtx temp;
3220
3221   /* Not applicable for floating point modes.  */
3222   if (FLOAT_MODE_P (mode))
3223     return NULL_RTX;
3224
3225   /* If we have a MAX insn, we can do this as MAX (x, ~x).  */
3226   if (optab_handler (smax_optab, mode) != CODE_FOR_nothing)
3227     {
3228       rtx_insn *last = get_last_insn ();
3229
3230       temp = expand_unop (mode, one_cmpl_optab, op0, NULL_RTX, 0);
3231       if (temp != 0)
3232         temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3233                              OPTAB_WIDEN);
3234
3235       if (temp != 0)
3236         return temp;
3237
3238       delete_insns_since (last);
3239     }
3240
3241   /* If this machine has expensive jumps, we can do one's complement
3242      absolute value of X as (((signed) x >> (W-1)) ^ x).  */
3243
3244   scalar_int_mode int_mode;
3245   if (is_int_mode (mode, &int_mode)
3246       && BRANCH_COST (optimize_insn_for_speed_p (),
3247                      false) >= 2)
3248     {
3249       rtx extended = expand_shift (RSHIFT_EXPR, int_mode, op0,
3250                                    GET_MODE_PRECISION (int_mode) - 1,
3251                                    NULL_RTX, 0);
3252
3253       temp = expand_binop (int_mode, xor_optab, extended, op0, target, 0,
3254                            OPTAB_LIB_WIDEN);
3255
3256       if (temp != 0)
3257         return temp;
3258     }
3259
3260   return NULL_RTX;
3261 }
3262
3263 /* A subroutine of expand_copysign, perform the copysign operation using the
3264    abs and neg primitives advertised to exist on the target.  The assumption
3265    is that we have a split register file, and leaving op0 in fp registers,
3266    and not playing with subregs so much, will help the register allocator.  */
3267
3268 static rtx
3269 expand_copysign_absneg (scalar_float_mode mode, rtx op0, rtx op1, rtx target,
3270                         int bitpos, bool op0_is_abs)
3271 {
3272   scalar_int_mode imode;
3273   enum insn_code icode;
3274   rtx sign;
3275   rtx_code_label *label;
3276
3277   if (target == op1)
3278     target = NULL_RTX;
3279
3280   /* Check if the back end provides an insn that handles signbit for the
3281      argument's mode. */
3282   icode = optab_handler (signbit_optab, mode);
3283   if (icode != CODE_FOR_nothing)
3284     {
3285       imode = as_a <scalar_int_mode> (insn_data[(int) icode].operand[0].mode);
3286       sign = gen_reg_rtx (imode);
3287       emit_unop_insn (icode, sign, op1, UNKNOWN);
3288     }
3289   else
3290     {
3291       if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3292         {
3293           if (!int_mode_for_mode (mode).exists (&imode))
3294             return NULL_RTX;
3295           op1 = gen_lowpart (imode, op1);
3296         }
3297       else
3298         {
3299           int word;
3300
3301           imode = word_mode;
3302           if (FLOAT_WORDS_BIG_ENDIAN)
3303             word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3304           else
3305             word = bitpos / BITS_PER_WORD;
3306           bitpos = bitpos % BITS_PER_WORD;
3307           op1 = operand_subword_force (op1, word, mode);
3308         }
3309
3310       wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3311       sign = expand_binop (imode, and_optab, op1,
3312                            immed_wide_int_const (mask, imode),
3313                            NULL_RTX, 1, OPTAB_LIB_WIDEN);
3314     }
3315
3316   if (!op0_is_abs)
3317     {
3318       op0 = expand_unop (mode, abs_optab, op0, target, 0);
3319       if (op0 == NULL)
3320         return NULL_RTX;
3321       target = op0;
3322     }
3323   else
3324     {
3325       if (target == NULL_RTX)
3326         target = copy_to_reg (op0);
3327       else
3328         emit_move_insn (target, op0);
3329     }
3330
3331   label = gen_label_rtx ();
3332   emit_cmp_and_jump_insns (sign, const0_rtx, EQ, NULL_RTX, imode, 1, label);
3333
3334   if (CONST_DOUBLE_AS_FLOAT_P (op0))
3335     op0 = simplify_unary_operation (NEG, mode, op0, mode);
3336   else
3337     op0 = expand_unop (mode, neg_optab, op0, target, 0);
3338   if (op0 != target)
3339     emit_move_insn (target, op0);
3340
3341   emit_label (label);
3342
3343   return target;
3344 }
3345
3346
3347 /* A subroutine of expand_copysign, perform the entire copysign operation
3348    with integer bitmasks.  BITPOS is the position of the sign bit; OP0_IS_ABS
3349    is true if op0 is known to have its sign bit clear.  */
3350
3351 static rtx
3352 expand_copysign_bit (scalar_float_mode mode, rtx op0, rtx op1, rtx target,
3353                      int bitpos, bool op0_is_abs)
3354 {
3355   scalar_int_mode imode;
3356   int word, nwords, i;
3357   rtx temp;
3358   rtx_insn *insns;
3359
3360   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3361     {
3362       if (!int_mode_for_mode (mode).exists (&imode))
3363         return NULL_RTX;
3364       word = 0;
3365       nwords = 1;
3366     }
3367   else
3368     {
3369       imode = word_mode;
3370
3371       if (FLOAT_WORDS_BIG_ENDIAN)
3372         word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3373       else
3374         word = bitpos / BITS_PER_WORD;
3375       bitpos = bitpos % BITS_PER_WORD;
3376       nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
3377     }
3378
3379   wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3380
3381   if (target == 0
3382       || target == op0
3383       || target == op1
3384       || (nwords > 1 && !valid_multiword_target_p (target)))
3385     target = gen_reg_rtx (mode);
3386
3387   if (nwords > 1)
3388     {
3389       start_sequence ();
3390
3391       for (i = 0; i < nwords; ++i)
3392         {
3393           rtx targ_piece = operand_subword (target, i, 1, mode);
3394           rtx op0_piece = operand_subword_force (op0, i, mode);
3395
3396           if (i == word)
3397             {
3398               if (!op0_is_abs)
3399                 op0_piece
3400                   = expand_binop (imode, and_optab, op0_piece,
3401                                   immed_wide_int_const (~mask, imode),
3402                                   NULL_RTX, 1, OPTAB_LIB_WIDEN);
3403               op1 = expand_binop (imode, and_optab,
3404                                   operand_subword_force (op1, i, mode),
3405                                   immed_wide_int_const (mask, imode),
3406                                   NULL_RTX, 1, OPTAB_LIB_WIDEN);
3407
3408               temp = expand_binop (imode, ior_optab, op0_piece, op1,
3409                                    targ_piece, 1, OPTAB_LIB_WIDEN);
3410               if (temp != targ_piece)
3411                 emit_move_insn (targ_piece, temp);
3412             }
3413           else
3414             emit_move_insn (targ_piece, op0_piece);
3415         }
3416
3417       insns = get_insns ();
3418       end_sequence ();
3419
3420       emit_insn (insns);
3421     }
3422   else
3423     {
3424       op1 = expand_binop (imode, and_optab, gen_lowpart (imode, op1),
3425                           immed_wide_int_const (mask, imode),
3426                           NULL_RTX, 1, OPTAB_LIB_WIDEN);
3427
3428       op0 = gen_lowpart (imode, op0);
3429       if (!op0_is_abs)
3430         op0 = expand_binop (imode, and_optab, op0,
3431                             immed_wide_int_const (~mask, imode),
3432                             NULL_RTX, 1, OPTAB_LIB_WIDEN);
3433
3434       temp = expand_binop (imode, ior_optab, op0, op1,
3435                            gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
3436       target = lowpart_subreg_maybe_copy (mode, temp, imode);
3437     }
3438
3439   return target;
3440 }
3441
3442 /* Expand the C99 copysign operation.  OP0 and OP1 must be the same
3443    scalar floating point mode.  Return NULL if we do not know how to
3444    expand the operation inline.  */
3445
3446 rtx
3447 expand_copysign (rtx op0, rtx op1, rtx target)
3448 {
3449   scalar_float_mode mode;
3450   const struct real_format *fmt;
3451   bool op0_is_abs;
3452   rtx temp;
3453
3454   mode = as_a <scalar_float_mode> (GET_MODE (op0));
3455   gcc_assert (GET_MODE (op1) == mode);
3456
3457   /* First try to do it with a special instruction.  */
3458   temp = expand_binop (mode, copysign_optab, op0, op1,
3459                        target, 0, OPTAB_DIRECT);
3460   if (temp)
3461     return temp;
3462
3463   fmt = REAL_MODE_FORMAT (mode);
3464   if (fmt == NULL || !fmt->has_signed_zero)
3465     return NULL_RTX;
3466
3467   op0_is_abs = false;
3468   if (CONST_DOUBLE_AS_FLOAT_P (op0))
3469     {
3470       if (real_isneg (CONST_DOUBLE_REAL_VALUE (op0)))
3471         op0 = simplify_unary_operation (ABS, mode, op0, mode);
3472       op0_is_abs = true;
3473     }
3474
3475   if (fmt->signbit_ro >= 0
3476       && (CONST_DOUBLE_AS_FLOAT_P (op0)
3477           || (optab_handler (neg_optab, mode) != CODE_FOR_nothing
3478               && optab_handler (abs_optab, mode) != CODE_FOR_nothing)))
3479     {
3480       temp = expand_copysign_absneg (mode, op0, op1, target,
3481                                      fmt->signbit_ro, op0_is_abs);
3482       if (temp)
3483         return temp;
3484     }
3485
3486   if (fmt->signbit_rw < 0)
3487     return NULL_RTX;
3488   return expand_copysign_bit (mode, op0, op1, target,
3489                               fmt->signbit_rw, op0_is_abs);
3490 }
3491 \f
3492 /* Generate an instruction whose insn-code is INSN_CODE,
3493    with two operands: an output TARGET and an input OP0.
3494    TARGET *must* be nonzero, and the output is always stored there.
3495    CODE is an rtx code such that (CODE OP0) is an rtx that describes
3496    the value that is stored into TARGET.
3497
3498    Return false if expansion failed.  */
3499
3500 bool
3501 maybe_emit_unop_insn (enum insn_code icode, rtx target, rtx op0,
3502                       enum rtx_code code)
3503 {
3504   struct expand_operand ops[2];
3505   rtx_insn *pat;
3506
3507   create_output_operand (&ops[0], target, GET_MODE (target));
3508   create_input_operand (&ops[1], op0, GET_MODE (op0));
3509   pat = maybe_gen_insn (icode, 2, ops);
3510   if (!pat)
3511     return false;
3512
3513   if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
3514       && code != UNKNOWN)
3515     add_equal_note (pat, ops[0].value, code, ops[1].value, NULL_RTX);
3516
3517   emit_insn (pat);
3518
3519   if (ops[0].value != target)
3520     emit_move_insn (target, ops[0].value);
3521   return true;
3522 }
3523 /* Generate an instruction whose insn-code is INSN_CODE,
3524    with two operands: an output TARGET and an input OP0.
3525    TARGET *must* be nonzero, and the output is always stored there.
3526    CODE is an rtx code such that (CODE OP0) is an rtx that describes
3527    the value that is stored into TARGET.  */
3528
3529 void
3530 emit_unop_insn (enum insn_code icode, rtx target, rtx op0, enum rtx_code code)
3531 {
3532   bool ok = maybe_emit_unop_insn (icode, target, op0, code);
3533   gcc_assert (ok);
3534 }
3535 \f
3536 struct no_conflict_data
3537 {
3538   rtx target;
3539   rtx_insn *first, *insn;
3540   bool must_stay;
3541 };
3542
3543 /* Called via note_stores by emit_libcall_block.  Set P->must_stay if
3544    the currently examined clobber / store has to stay in the list of
3545    insns that constitute the actual libcall block.  */
3546 static void
3547 no_conflict_move_test (rtx dest, const_rtx set, void *p0)
3548 {
3549   struct no_conflict_data *p= (struct no_conflict_data *) p0;
3550
3551   /* If this inns directly contributes to setting the target, it must stay.  */
3552   if (reg_overlap_mentioned_p (p->target, dest))
3553     p->must_stay = true;
3554   /* If we haven't committed to keeping any other insns in the list yet,
3555      there is nothing more to check.  */
3556   else if (p->insn == p->first)
3557     return;
3558   /* If this insn sets / clobbers a register that feeds one of the insns
3559      already in the list, this insn has to stay too.  */
3560   else if (reg_overlap_mentioned_p (dest, PATTERN (p->first))
3561            || (CALL_P (p->first) && (find_reg_fusage (p->first, USE, dest)))
3562            || reg_used_between_p (dest, p->first, p->insn)
3563            /* Likewise if this insn depends on a register set by a previous
3564               insn in the list, or if it sets a result (presumably a hard
3565               register) that is set or clobbered by a previous insn.
3566               N.B. the modified_*_p (SET_DEST...) tests applied to a MEM
3567               SET_DEST perform the former check on the address, and the latter
3568               check on the MEM.  */
3569            || (GET_CODE (set) == SET
3570                && (modified_in_p (SET_SRC (set), p->first)
3571                    || modified_in_p (SET_DEST (set), p->first)
3572                    || modified_between_p (SET_SRC (set), p->first, p->insn)
3573                    || modified_between_p (SET_DEST (set), p->first, p->insn))))
3574     p->must_stay = true;
3575 }
3576
3577 \f
3578 /* Emit code to make a call to a constant function or a library call.
3579
3580    INSNS is a list containing all insns emitted in the call.
3581    These insns leave the result in RESULT.  Our block is to copy RESULT
3582    to TARGET, which is logically equivalent to EQUIV.
3583
3584    We first emit any insns that set a pseudo on the assumption that these are
3585    loading constants into registers; doing so allows them to be safely cse'ed
3586    between blocks.  Then we emit all the other insns in the block, followed by
3587    an insn to move RESULT to TARGET.  This last insn will have a REQ_EQUAL
3588    note with an operand of EQUIV.  */
3589
3590 static void
3591 emit_libcall_block_1 (rtx_insn *insns, rtx target, rtx result, rtx equiv,
3592                       bool equiv_may_trap)
3593 {
3594   rtx final_dest = target;
3595   rtx_insn *next, *last, *insn;
3596
3597   /* If this is a reg with REG_USERVAR_P set, then it could possibly turn
3598      into a MEM later.  Protect the libcall block from this change.  */
3599   if (! REG_P (target) || REG_USERVAR_P (target))
3600     target = gen_reg_rtx (GET_MODE (target));
3601
3602   /* If we're using non-call exceptions, a libcall corresponding to an
3603      operation that may trap may also trap.  */
3604   /* ??? See the comment in front of make_reg_eh_region_note.  */
3605   if (cfun->can_throw_non_call_exceptions
3606       && (equiv_may_trap || may_trap_p (equiv)))
3607     {
3608       for (insn = insns; insn; insn = NEXT_INSN (insn))
3609         if (CALL_P (insn))
3610           {
3611             rtx note = find_reg_note (insn, REG_EH_REGION, NULL_RTX);
3612             if (note)
3613               {
3614                 int lp_nr = INTVAL (XEXP (note, 0));
3615                 if (lp_nr == 0 || lp_nr == INT_MIN)
3616                   remove_note (insn, note);
3617               }
3618           }
3619     }
3620   else
3621     {
3622       /* Look for any CALL_INSNs in this sequence, and attach a REG_EH_REGION
3623          reg note to indicate that this call cannot throw or execute a nonlocal
3624          goto (unless there is already a REG_EH_REGION note, in which case
3625          we update it).  */
3626       for (insn = insns; insn; insn = NEXT_INSN (insn))
3627         if (CALL_P (insn))
3628           make_reg_eh_region_note_nothrow_nononlocal (insn);
3629     }
3630
3631   /* First emit all insns that set pseudos.  Remove them from the list as
3632      we go.  Avoid insns that set pseudos which were referenced in previous
3633      insns.  These can be generated by move_by_pieces, for example,
3634      to update an address.  Similarly, avoid insns that reference things
3635      set in previous insns.  */
3636
3637   for (insn = insns; insn; insn = next)
3638     {
3639       rtx set = single_set (insn);
3640
3641       next = NEXT_INSN (insn);
3642
3643       if (set != 0 && REG_P (SET_DEST (set))
3644           && REGNO (SET_DEST (set)) >= FIRST_PSEUDO_REGISTER)
3645         {
3646           struct no_conflict_data data;
3647
3648           data.target = const0_rtx;
3649           data.first = insns;
3650           data.insn = insn;
3651           data.must_stay = 0;
3652           note_stores (PATTERN (insn), no_conflict_move_test, &data);
3653           if (! data.must_stay)
3654             {
3655               if (PREV_INSN (insn))
3656                 SET_NEXT_INSN (PREV_INSN (insn)) = next;
3657               else
3658                 insns = next;
3659
3660               if (next)
3661                 SET_PREV_INSN (next) = PREV_INSN (insn);
3662
3663               add_insn (insn);
3664             }
3665         }
3666
3667       /* Some ports use a loop to copy large arguments onto the stack.
3668          Don't move anything outside such a loop.  */
3669       if (LABEL_P (insn))
3670         break;
3671     }
3672
3673   /* Write the remaining insns followed by the final copy.  */
3674   for (insn = insns; insn; insn = next)
3675     {
3676       next = NEXT_INSN (insn);
3677
3678       add_insn (insn);
3679     }
3680
3681   last = emit_move_insn (target, result);
3682   if (equiv)
3683     set_dst_reg_note (last, REG_EQUAL, copy_rtx (equiv), target);
3684
3685   if (final_dest != target)
3686     emit_move_insn (final_dest, target);
3687 }
3688
3689 void
3690 emit_libcall_block (rtx_insn *insns, rtx target, rtx result, rtx equiv)
3691 {
3692   emit_libcall_block_1 (insns, target, result, equiv, false);
3693 }
3694 \f
3695 /* Nonzero if we can perform a comparison of mode MODE straightforwardly.
3696    PURPOSE describes how this comparison will be used.  CODE is the rtx
3697    comparison code we will be using.
3698
3699    ??? Actually, CODE is slightly weaker than that.  A target is still
3700    required to implement all of the normal bcc operations, but not
3701    required to implement all (or any) of the unordered bcc operations.  */
3702
3703 int
3704 can_compare_p (enum rtx_code code, machine_mode mode,
3705                enum can_compare_purpose purpose)
3706 {
3707   rtx test;
3708   test = gen_rtx_fmt_ee (code, mode, const0_rtx, const0_rtx);
3709   do
3710     {
3711       enum insn_code icode;
3712
3713       if (purpose == ccp_jump
3714           && (icode = optab_handler (cbranch_optab, mode)) != CODE_FOR_nothing
3715           && insn_operand_matches (icode, 0, test))
3716         return 1;
3717       if (purpose == ccp_store_flag
3718           && (icode = optab_handler (cstore_optab, mode)) != CODE_FOR_nothing
3719           && insn_operand_matches (icode, 1, test))
3720         return 1;
3721       if (purpose == ccp_cmov
3722           && optab_handler (cmov_optab, mode) != CODE_FOR_nothing)
3723         return 1;
3724
3725       mode = GET_MODE_WIDER_MODE (mode).else_void ();
3726       PUT_MODE (test, mode);
3727     }
3728   while (mode != VOIDmode);
3729
3730   return 0;
3731 }
3732
3733 /* This function is called when we are going to emit a compare instruction that
3734    compares the values found in X and Y, using the rtl operator COMPARISON.
3735
3736    If they have mode BLKmode, then SIZE specifies the size of both operands.
3737
3738    UNSIGNEDP nonzero says that the operands are unsigned;
3739    this matters if they need to be widened (as given by METHODS).
3740
3741    *PTEST is where the resulting comparison RTX is returned or NULL_RTX
3742    if we failed to produce one.
3743
3744    *PMODE is the mode of the inputs (in case they are const_int).
3745
3746    This function performs all the setup necessary so that the caller only has
3747    to emit a single comparison insn.  This setup can involve doing a BLKmode
3748    comparison or emitting a library call to perform the comparison if no insn
3749    is available to handle it.
3750    The values which are passed in through pointers can be modified; the caller
3751    should perform the comparison on the modified values.  Constant
3752    comparisons must have already been folded.  */
3753
3754 static void
3755 prepare_cmp_insn (rtx x, rtx y, enum rtx_code comparison, rtx size,
3756                   int unsignedp, enum optab_methods methods,
3757                   rtx *ptest, machine_mode *pmode)
3758 {
3759   machine_mode mode = *pmode;
3760   rtx libfunc, test;
3761   machine_mode cmp_mode;
3762   enum mode_class mclass;
3763
3764   /* The other methods are not needed.  */
3765   gcc_assert (methods == OPTAB_DIRECT || methods == OPTAB_WIDEN
3766               || methods == OPTAB_LIB_WIDEN);
3767
3768   /* If we are optimizing, force expensive constants into a register.  */
3769   if (CONSTANT_P (x) && optimize
3770       && (rtx_cost (x, mode, COMPARE, 0, optimize_insn_for_speed_p ())
3771           > COSTS_N_INSNS (1)))
3772     x = force_reg (mode, x);
3773
3774   if (CONSTANT_P (y) && optimize
3775       && (rtx_cost (y, mode, COMPARE, 1, optimize_insn_for_speed_p ())
3776           > COSTS_N_INSNS (1)))
3777     y = force_reg (mode, y);
3778
3779 #if HAVE_cc0
3780   /* Make sure if we have a canonical comparison.  The RTL
3781      documentation states that canonical comparisons are required only
3782      for targets which have cc0.  */
3783   gcc_assert (!CONSTANT_P (x) || CONSTANT_P (y));
3784 #endif
3785
3786   /* Don't let both operands fail to indicate the mode.  */
3787   if (GET_MODE (x) == VOIDmode && GET_MODE (y) == VOIDmode)
3788     x = force_reg (mode, x);
3789   if (mode == VOIDmode)
3790     mode = GET_MODE (x) != VOIDmode ? GET_MODE (x) : GET_MODE (y);
3791
3792   /* Handle all BLKmode compares.  */
3793
3794   if (mode == BLKmode)
3795     {
3796       machine_mode result_mode;
3797       enum insn_code cmp_code;
3798       rtx result;
3799       rtx opalign
3800         = GEN_INT (MIN (MEM_ALIGN (x), MEM_ALIGN (y)) / BITS_PER_UNIT);
3801
3802       gcc_assert (size);
3803
3804       /* Try to use a memory block compare insn - either cmpstr
3805          or cmpmem will do.  */
3806       opt_scalar_int_mode cmp_mode_iter;
3807       FOR_EACH_MODE_IN_CLASS (cmp_mode_iter, MODE_INT)
3808         {
3809           scalar_int_mode cmp_mode = cmp_mode_iter.require ();
3810           cmp_code = direct_optab_handler (cmpmem_optab, cmp_mode);
3811           if (cmp_code == CODE_FOR_nothing)
3812             cmp_code = direct_optab_handler (cmpstr_optab, cmp_mode);
3813           if (cmp_code == CODE_FOR_nothing)
3814             cmp_code = direct_optab_handler (cmpstrn_optab, cmp_mode);
3815           if (cmp_code == CODE_FOR_nothing)
3816             continue;
3817
3818           /* Must make sure the size fits the insn's mode.  */
3819           if (CONST_INT_P (size)
3820               ? INTVAL (size) >= (1 << GET_MODE_BITSIZE (cmp_mode))
3821               : (GET_MODE_BITSIZE (as_a <scalar_int_mode> (GET_MODE (size)))
3822                  > GET_MODE_BITSIZE (cmp_mode)))
3823             continue;
3824
3825           result_mode = insn_data[cmp_code].operand[0].mode;
3826           result = gen_reg_rtx (result_mode);
3827           size = convert_to_mode (cmp_mode, size, 1);
3828           emit_insn (GEN_FCN (cmp_code) (result, x, y, size, opalign));
3829
3830           *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, result, const0_rtx);
3831           *pmode = result_mode;
3832           return;
3833         }
3834
3835       if (methods != OPTAB_LIB && methods != OPTAB_LIB_WIDEN)
3836         goto fail;
3837
3838       /* Otherwise call a library function.  */
3839       result = emit_block_comp_via_libcall (XEXP (x, 0), XEXP (y, 0), size);
3840
3841       x = result;
3842       y = const0_rtx;
3843       mode = TYPE_MODE (integer_type_node);
3844       methods = OPTAB_LIB_WIDEN;
3845       unsignedp = false;
3846     }
3847
3848   /* Don't allow operands to the compare to trap, as that can put the
3849      compare and branch in different basic blocks.  */
3850   if (cfun->can_throw_non_call_exceptions)
3851     {
3852       if (may_trap_p (x))
3853         x = copy_to_reg (x);
3854       if (may_trap_p (y))
3855         y = copy_to_reg (y);
3856     }
3857
3858   if (GET_MODE_CLASS (mode) == MODE_CC)
3859     {
3860       enum insn_code icode = optab_handler (cbranch_optab, CCmode);
3861       test = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
3862       gcc_assert (icode != CODE_FOR_nothing
3863                   && insn_operand_matches (icode, 0, test));
3864       *ptest = test;
3865       return;
3866     }
3867
3868   mclass = GET_MODE_CLASS (mode);
3869   test = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
3870   FOR_EACH_MODE_FROM (cmp_mode, mode)
3871     {
3872       enum insn_code icode;
3873       icode = optab_handler (cbranch_optab, cmp_mode);
3874       if (icode != CODE_FOR_nothing
3875           && insn_operand_matches (icode, 0, test))
3876         {
3877           rtx_insn *last = get_last_insn ();
3878           rtx op0 = prepare_operand (icode, x, 1, mode, cmp_mode, unsignedp);
3879           rtx op1 = prepare_operand (icode, y, 2, mode, cmp_mode, unsignedp);
3880           if (op0 && op1
3881               && insn_operand_matches (icode, 1, op0)
3882               && insn_operand_matches (icode, 2, op1))
3883             {
3884               XEXP (test, 0) = op0;
3885               XEXP (test, 1) = op1;
3886               *ptest = test;
3887               *pmode = cmp_mode;
3888               return;
3889             }
3890           delete_insns_since (last);
3891         }
3892
3893       if (methods == OPTAB_DIRECT || !CLASS_HAS_WIDER_MODES_P (mclass))
3894         break;
3895     }
3896
3897   if (methods != OPTAB_LIB_WIDEN)
3898     goto fail;
3899
3900   if (!SCALAR_FLOAT_MODE_P (mode))
3901     {
3902       rtx result;
3903       machine_mode ret_mode;
3904
3905       /* Handle a libcall just for the mode we are using.  */
3906       libfunc = optab_libfunc (cmp_optab, mode);
3907       gcc_assert (libfunc);
3908
3909       /* If we want unsigned, and this mode has a distinct unsigned
3910          comparison routine, use that.  */
3911       if (unsignedp)
3912         {
3913           rtx ulibfunc = optab_libfunc (ucmp_optab, mode);
3914           if (ulibfunc)
3915             libfunc = ulibfunc;
3916         }
3917
3918       ret_mode = targetm.libgcc_cmp_return_mode ();
3919       result = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
3920                                         ret_mode, 2, x, mode, y, mode);
3921
3922       /* There are two kinds of comparison routines. Biased routines
3923          return 0/1/2, and unbiased routines return -1/0/1. Other parts
3924          of gcc expect that the comparison operation is equivalent
3925          to the modified comparison. For signed comparisons compare the
3926          result against 1 in the biased case, and zero in the unbiased
3927          case. For unsigned comparisons always compare against 1 after
3928          biasing the unbiased result by adding 1. This gives us a way to
3929          represent LTU.
3930          The comparisons in the fixed-point helper library are always
3931          biased.  */
3932       x = result;
3933       y = const1_rtx;
3934
3935       if (!TARGET_LIB_INT_CMP_BIASED && !ALL_FIXED_POINT_MODE_P (mode))
3936         {
3937           if (unsignedp)
3938             x = plus_constant (ret_mode, result, 1);
3939           else
3940             y = const0_rtx;
3941         }
3942
3943       *pmode = ret_mode;
3944       prepare_cmp_insn (x, y, comparison, NULL_RTX, unsignedp, methods,
3945                         ptest, pmode);
3946     }
3947   else
3948     prepare_float_lib_cmp (x, y, comparison, ptest, pmode);
3949
3950   return;
3951
3952  fail:
3953   *ptest = NULL_RTX;
3954 }
3955
3956 /* Before emitting an insn with code ICODE, make sure that X, which is going
3957    to be used for operand OPNUM of the insn, is converted from mode MODE to
3958    WIDER_MODE (UNSIGNEDP determines whether it is an unsigned conversion), and
3959    that it is accepted by the operand predicate.  Return the new value.  */
3960
3961 rtx
3962 prepare_operand (enum insn_code icode, rtx x, int opnum, machine_mode mode,
3963                  machine_mode wider_mode, int unsignedp)
3964 {
3965   if (mode != wider_mode)
3966     x = convert_modes (wider_mode, mode, x, unsignedp);
3967
3968   if (!insn_operand_matches (icode, opnum, x))
3969     {
3970       machine_mode op_mode = insn_data[(int) icode].operand[opnum].mode;
3971       if (reload_completed)
3972         return NULL_RTX;
3973       if (GET_MODE (x) != op_mode && GET_MODE (x) != VOIDmode)
3974         return NULL_RTX;
3975       x = copy_to_mode_reg (op_mode, x);
3976     }
3977
3978   return x;
3979 }
3980
3981 /* Subroutine of emit_cmp_and_jump_insns; this function is called when we know
3982    we can do the branch.  */
3983
3984 static void
3985 emit_cmp_and_jump_insn_1 (rtx test, machine_mode mode, rtx label,
3986                           profile_probability prob)
3987 {
3988   machine_mode optab_mode;
3989   enum mode_class mclass;
3990   enum insn_code icode;
3991   rtx_insn *insn;
3992
3993   mclass = GET_MODE_CLASS (mode);
3994   optab_mode = (mclass == MODE_CC) ? CCmode : mode;
3995   icode = optab_handler (cbranch_optab, optab_mode);
3996
3997   gcc_assert (icode != CODE_FOR_nothing);
3998   gcc_assert (insn_operand_matches (icode, 0, test));
3999   insn = emit_jump_insn (GEN_FCN (icode) (test, XEXP (test, 0),
4000                                           XEXP (test, 1), label));
4001   if (prob.initialized_p ()
4002       && profile_status_for_fn (cfun) != PROFILE_ABSENT
4003       && insn
4004       && JUMP_P (insn)
4005       && any_condjump_p (insn)
4006       && !find_reg_note (insn, REG_BR_PROB, 0))
4007     add_reg_br_prob_note (insn, prob);
4008 }
4009
4010 /* Generate code to compare X with Y so that the condition codes are
4011    set and to jump to LABEL if the condition is true.  If X is a
4012    constant and Y is not a constant, then the comparison is swapped to
4013    ensure that the comparison RTL has the canonical form.
4014
4015    UNSIGNEDP nonzero says that X and Y are unsigned; this matters if they
4016    need to be widened.  UNSIGNEDP is also used to select the proper
4017    branch condition code.
4018
4019    If X and Y have mode BLKmode, then SIZE specifies the size of both X and Y.
4020
4021    MODE is the mode of the inputs (in case they are const_int).
4022
4023    COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).
4024    It will be potentially converted into an unsigned variant based on
4025    UNSIGNEDP to select a proper jump instruction.
4026
4027    PROB is the probability of jumping to LABEL.  */
4028
4029 void
4030 emit_cmp_and_jump_insns (rtx x, rtx y, enum rtx_code comparison, rtx size,
4031                          machine_mode mode, int unsignedp, rtx label,
4032                          profile_probability prob)
4033 {
4034   rtx op0 = x, op1 = y;
4035   rtx test;
4036
4037   /* Swap operands and condition to ensure canonical RTL.  */
4038   if (swap_commutative_operands_p (x, y)
4039       && can_compare_p (swap_condition (comparison), mode, ccp_jump))
4040     {
4041       op0 = y, op1 = x;
4042       comparison = swap_condition (comparison);
4043     }
4044
4045   /* If OP0 is still a constant, then both X and Y must be constants
4046      or the opposite comparison is not supported.  Force X into a register
4047      to create canonical RTL.  */
4048   if (CONSTANT_P (op0))
4049     op0 = force_reg (mode, op0);
4050
4051   if (unsignedp)
4052     comparison = unsigned_condition (comparison);
4053
4054   prepare_cmp_insn (op0, op1, comparison, size, unsignedp, OPTAB_LIB_WIDEN,
4055                     &test, &mode);
4056   emit_cmp_and_jump_insn_1 (test, mode, label, prob);
4057 }
4058
4059 \f
4060 /* Emit a library call comparison between floating point X and Y.
4061    COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).  */
4062
4063 static void
4064 prepare_float_lib_cmp (rtx x, rtx y, enum rtx_code comparison,
4065                        rtx *ptest, machine_mode *pmode)
4066 {
4067   enum rtx_code swapped = swap_condition (comparison);
4068   enum rtx_code reversed = reverse_condition_maybe_unordered (comparison);
4069   machine_mode orig_mode = GET_MODE (x);
4070   machine_mode mode;
4071   rtx true_rtx, false_rtx;
4072   rtx value, target, equiv;
4073   rtx_insn *insns;
4074   rtx libfunc = 0;
4075   bool reversed_p = false;
4076   scalar_int_mode cmp_mode = targetm.libgcc_cmp_return_mode ();
4077
4078   FOR_EACH_MODE_FROM (mode, orig_mode)
4079     {
4080       if (code_to_optab (comparison)
4081           && (libfunc = optab_libfunc (code_to_optab (comparison), mode)))
4082         break;
4083
4084       if (code_to_optab (swapped)
4085           && (libfunc = optab_libfunc (code_to_optab (swapped), mode)))
4086         {
4087           std::swap (x, y);
4088           comparison = swapped;
4089           break;
4090         }
4091
4092       if (code_to_optab (reversed)
4093           && (libfunc = optab_libfunc (code_to_optab (reversed), mode)))
4094         {
4095           comparison = reversed;
4096           reversed_p = true;
4097           break;
4098         }
4099     }
4100
4101   gcc_assert (mode != VOIDmode);
4102
4103   if (mode != orig_mode)
4104     {
4105       x = convert_to_mode (mode, x, 0);
4106       y = convert_to_mode (mode, y, 0);
4107     }
4108
4109   /* Attach a REG_EQUAL note describing the semantics of the libcall to
4110      the RTL.  The allows the RTL optimizers to delete the libcall if the
4111      condition can be determined at compile-time.  */
4112   if (comparison == UNORDERED
4113       || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4114     {
4115       true_rtx = const_true_rtx;
4116       false_rtx = const0_rtx;
4117     }
4118   else
4119     {
4120       switch (comparison)
4121         {
4122         case EQ:
4123           true_rtx = const0_rtx;
4124           false_rtx = const_true_rtx;
4125           break;
4126
4127         case NE:
4128           true_rtx = const_true_rtx;
4129           false_rtx = const0_rtx;
4130           break;
4131
4132         case GT:
4133           true_rtx = const1_rtx;
4134           false_rtx = const0_rtx;
4135           break;
4136
4137         case GE:
4138           true_rtx = const0_rtx;
4139           false_rtx = constm1_rtx;
4140           break;
4141
4142         case LT:
4143           true_rtx = constm1_rtx;
4144           false_rtx = const0_rtx;
4145           break;
4146
4147         case LE:
4148           true_rtx = const0_rtx;
4149           false_rtx = const1_rtx;
4150           break;
4151
4152         default:
4153           gcc_unreachable ();
4154         }
4155     }
4156
4157   if (comparison == UNORDERED)
4158     {
4159       rtx temp = simplify_gen_relational (NE, cmp_mode, mode, x, x);
4160       equiv = simplify_gen_relational (NE, cmp_mode, mode, y, y);
4161       equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4162                                     temp, const_true_rtx, equiv);
4163     }
4164   else
4165     {
4166       equiv = simplify_gen_relational (comparison, cmp_mode, mode, x, y);
4167       if (! FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4168         equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4169                                       equiv, true_rtx, false_rtx);
4170     }
4171
4172   start_sequence ();
4173   value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4174                                    cmp_mode, 2, x, mode, y, mode);
4175   insns = get_insns ();
4176   end_sequence ();
4177
4178   target = gen_reg_rtx (cmp_mode);
4179   emit_libcall_block (insns, target, value, equiv);
4180
4181   if (comparison == UNORDERED
4182       || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison)
4183       || reversed_p)
4184     *ptest = gen_rtx_fmt_ee (reversed_p ? EQ : NE, VOIDmode, target, false_rtx);
4185   else
4186     *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, target, const0_rtx);
4187
4188   *pmode = cmp_mode;
4189 }
4190 \f
4191 /* Generate code to indirectly jump to a location given in the rtx LOC.  */
4192
4193 void
4194 emit_indirect_jump (rtx loc)
4195 {
4196   if (!targetm.have_indirect_jump ())
4197     sorry ("indirect jumps are not available on this target");
4198   else
4199     {
4200       struct expand_operand ops[1];
4201       create_address_operand (&ops[0], loc);
4202       expand_jump_insn (targetm.code_for_indirect_jump, 1, ops);
4203       emit_barrier ();
4204     }
4205 }
4206 \f
4207
4208 /* Emit a conditional move instruction if the machine supports one for that
4209    condition and machine mode.
4210
4211    OP0 and OP1 are the operands that should be compared using CODE.  CMODE is
4212    the mode to use should they be constants.  If it is VOIDmode, they cannot
4213    both be constants.
4214
4215    OP2 should be stored in TARGET if the comparison is true, otherwise OP3
4216    should be stored there.  MODE is the mode to use should they be constants.
4217    If it is VOIDmode, they cannot both be constants.
4218
4219    The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4220    is not supported.  */
4221
4222 rtx
4223 emit_conditional_move (rtx target, enum rtx_code code, rtx op0, rtx op1,
4224                        machine_mode cmode, rtx op2, rtx op3,
4225                        machine_mode mode, int unsignedp)
4226 {
4227   rtx comparison;
4228   rtx_insn *last;
4229   enum insn_code icode;
4230   enum rtx_code reversed;
4231
4232   /* If the two source operands are identical, that's just a move.  */
4233
4234   if (rtx_equal_p (op2, op3))
4235     {
4236       if (!target)
4237         target = gen_reg_rtx (mode);
4238
4239       emit_move_insn (target, op3);
4240       return target;
4241     }
4242
4243   /* If one operand is constant, make it the second one.  Only do this
4244      if the other operand is not constant as well.  */
4245
4246   if (swap_commutative_operands_p (op0, op1))
4247     {
4248       std::swap (op0, op1);
4249       code = swap_condition (code);
4250     }
4251
4252   /* get_condition will prefer to generate LT and GT even if the old
4253      comparison was against zero, so undo that canonicalization here since
4254      comparisons against zero are cheaper.  */
4255   if (code == LT && op1 == const1_rtx)
4256     code = LE, op1 = const0_rtx;
4257   else if (code == GT && op1 == constm1_rtx)
4258     code = GE, op1 = const0_rtx;
4259
4260   if (cmode == VOIDmode)
4261     cmode = GET_MODE (op0);
4262
4263   enum rtx_code orig_code = code;
4264   bool swapped = false;
4265   if (swap_commutative_operands_p (op2, op3)
4266       && ((reversed = reversed_comparison_code_parts (code, op0, op1, NULL))
4267           != UNKNOWN))
4268     {
4269       std::swap (op2, op3);
4270       code = reversed;
4271       swapped = true;
4272     }
4273
4274   if (mode == VOIDmode)
4275     mode = GET_MODE (op2);
4276
4277   icode = direct_optab_handler (movcc_optab, mode);
4278
4279   if (icode == CODE_FOR_nothing)
4280     return NULL_RTX;
4281
4282   if (!target)
4283     target = gen_reg_rtx (mode);
4284
4285   for (int pass = 0; ; pass++)
4286     {
4287       code = unsignedp ? unsigned_condition (code) : code;
4288       comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4289
4290       /* We can get const0_rtx or const_true_rtx in some circumstances.  Just
4291          punt and let the caller figure out how best to deal with this
4292          situation.  */
4293       if (COMPARISON_P (comparison))
4294         {
4295           saved_pending_stack_adjust save;
4296           save_pending_stack_adjust (&save);
4297           last = get_last_insn ();
4298           do_pending_stack_adjust ();
4299           prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4300                             GET_CODE (comparison), NULL_RTX, unsignedp,
4301                             OPTAB_WIDEN, &comparison, &cmode);
4302           if (comparison)
4303             {
4304               struct expand_operand ops[4];
4305
4306               create_output_operand (&ops[0], target, mode);
4307               create_fixed_operand (&ops[1], comparison);
4308               create_input_operand (&ops[2], op2, mode);
4309               create_input_operand (&ops[3], op3, mode);
4310               if (maybe_expand_insn (icode, 4, ops))
4311                 {
4312                   if (ops[0].value != target)
4313                     convert_move (target, ops[0].value, false);
4314                   return target;
4315                 }
4316             }
4317           delete_insns_since (last);
4318           restore_pending_stack_adjust (&save);
4319         }
4320
4321       if (pass == 1)
4322         return NULL_RTX;
4323
4324       /* If the preferred op2/op3 order is not usable, retry with other
4325          operand order, perhaps it will expand successfully.  */
4326       if (swapped)
4327         code = orig_code;
4328       else if ((reversed = reversed_comparison_code_parts (orig_code, op0, op1,
4329                                                            NULL))
4330                != UNKNOWN)
4331         code = reversed;
4332       else
4333         return NULL_RTX;
4334       std::swap (op2, op3);
4335     }
4336 }
4337
4338
4339 /* Emit a conditional negate or bitwise complement using the
4340    negcc or notcc optabs if available.  Return NULL_RTX if such operations
4341    are not available.  Otherwise return the RTX holding the result.
4342    TARGET is the desired destination of the result.  COMP is the comparison
4343    on which to negate.  If COND is true move into TARGET the negation
4344    or bitwise complement of OP1.  Otherwise move OP2 into TARGET.
4345    CODE is either NEG or NOT.  MODE is the machine mode in which the
4346    operation is performed.  */
4347
4348 rtx
4349 emit_conditional_neg_or_complement (rtx target, rtx_code code,
4350                                      machine_mode mode, rtx cond, rtx op1,
4351                                      rtx op2)
4352 {
4353   optab op = unknown_optab;
4354   if (code == NEG)
4355     op = negcc_optab;
4356   else if (code == NOT)
4357     op = notcc_optab;
4358   else
4359     gcc_unreachable ();
4360
4361   insn_code icode = direct_optab_handler (op, mode);
4362
4363   if (icode == CODE_FOR_nothing)
4364     return NULL_RTX;
4365
4366   if (!target)
4367     target = gen_reg_rtx (mode);
4368
4369   rtx_insn *last = get_last_insn ();
4370   struct expand_operand ops[4];
4371
4372   create_output_operand (&ops[0], target, mode);
4373   create_fixed_operand (&ops[1], cond);
4374   create_input_operand (&ops[2], op1, mode);
4375   create_input_operand (&ops[3], op2, mode);
4376
4377   if (maybe_expand_insn (icode, 4, ops))
4378     {
4379       if (ops[0].value != target)
4380         convert_move (target, ops[0].value, false);
4381
4382       return target;
4383     }
4384   delete_insns_since (last);
4385   return NULL_RTX;
4386 }
4387
4388 /* Emit a conditional addition instruction if the machine supports one for that
4389    condition and machine mode.
4390
4391    OP0 and OP1 are the operands that should be compared using CODE.  CMODE is
4392    the mode to use should they be constants.  If it is VOIDmode, they cannot
4393    both be constants.
4394
4395    OP2 should be stored in TARGET if the comparison is false, otherwise OP2+OP3
4396    should be stored there.  MODE is the mode to use should they be constants.
4397    If it is VOIDmode, they cannot both be constants.
4398
4399    The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4400    is not supported.  */
4401
4402 rtx
4403 emit_conditional_add (rtx target, enum rtx_code code, rtx op0, rtx op1,
4404                       machine_mode cmode, rtx op2, rtx op3,
4405                       machine_mode mode, int unsignedp)
4406 {
4407   rtx comparison;
4408   rtx_insn *last;
4409   enum insn_code icode;
4410
4411   /* If one operand is constant, make it the second one.  Only do this
4412      if the other operand is not constant as well.  */
4413
4414   if (swap_commutative_operands_p (op0, op1))
4415     {
4416       std::swap (op0, op1);
4417       code = swap_condition (code);
4418     }
4419
4420   /* get_condition will prefer to generate LT and GT even if the old
4421      comparison was against zero, so undo that canonicalization here since
4422      comparisons against zero are cheaper.  */
4423   if (code == LT && op1 == const1_rtx)
4424     code = LE, op1 = const0_rtx;
4425   else if (code == GT && op1 == constm1_rtx)
4426     code = GE, op1 = const0_rtx;
4427
4428   if (cmode == VOIDmode)
4429     cmode = GET_MODE (op0);
4430
4431   if (mode == VOIDmode)
4432     mode = GET_MODE (op2);
4433
4434   icode = optab_handler (addcc_optab, mode);
4435
4436   if (icode == CODE_FOR_nothing)
4437     return 0;
4438
4439   if (!target)
4440     target = gen_reg_rtx (mode);
4441
4442   code = unsignedp ? unsigned_condition (code) : code;
4443   comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4444
4445   /* We can get const0_rtx or const_true_rtx in some circumstances.  Just
4446      return NULL and let the caller figure out how best to deal with this
4447      situation.  */
4448   if (!COMPARISON_P (comparison))
4449     return NULL_RTX;
4450
4451   do_pending_stack_adjust ();
4452   last = get_last_insn ();
4453   prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4454                     GET_CODE (comparison), NULL_RTX, unsignedp, OPTAB_WIDEN,
4455                     &comparison, &cmode);
4456   if (comparison)
4457     {
4458       struct expand_operand ops[4];
4459
4460       create_output_operand (&ops[0], target, mode);
4461       create_fixed_operand (&ops[1], comparison);
4462       create_input_operand (&ops[2], op2, mode);
4463       create_input_operand (&ops[3], op3, mode);
4464       if (maybe_expand_insn (icode, 4, ops))
4465         {
4466           if (ops[0].value != target)
4467             convert_move (target, ops[0].value, false);
4468           return target;
4469         }
4470     }
4471   delete_insns_since (last);
4472   return NULL_RTX;
4473 }
4474 \f
4475 /* These functions attempt to generate an insn body, rather than
4476    emitting the insn, but if the gen function already emits them, we
4477    make no attempt to turn them back into naked patterns.  */
4478
4479 /* Generate and return an insn body to add Y to X.  */
4480
4481 rtx_insn *
4482 gen_add2_insn (rtx x, rtx y)
4483 {
4484   enum insn_code icode = optab_handler (add_optab, GET_MODE (x));
4485
4486   gcc_assert (insn_operand_matches (icode, 0, x));
4487   gcc_assert (insn_operand_matches (icode, 1, x));
4488   gcc_assert (insn_operand_matches (icode, 2, y));
4489
4490   return GEN_FCN (icode) (x, x, y);
4491 }
4492
4493 /* Generate and return an insn body to add r1 and c,
4494    storing the result in r0.  */
4495
4496 rtx_insn *
4497 gen_add3_insn (rtx r0, rtx r1, rtx c)
4498 {
4499   enum insn_code icode = optab_handler (add_optab, GET_MODE (r0));
4500
4501   if (icode == CODE_FOR_nothing
4502       || !insn_operand_matches (icode, 0, r0)
4503       || !insn_operand_matches (icode, 1, r1)
4504       || !insn_operand_matches (icode, 2, c))
4505     return NULL;
4506
4507   return GEN_FCN (icode) (r0, r1, c);
4508 }
4509
4510 int
4511 have_add2_insn (rtx x, rtx y)
4512 {
4513   enum insn_code icode;
4514
4515   gcc_assert (GET_MODE (x) != VOIDmode);
4516
4517   icode = optab_handler (add_optab, GET_MODE (x));
4518
4519   if (icode == CODE_FOR_nothing)
4520     return 0;
4521
4522   if (!insn_operand_matches (icode, 0, x)
4523       || !insn_operand_matches (icode, 1, x)
4524       || !insn_operand_matches (icode, 2, y))
4525     return 0;
4526
4527   return 1;
4528 }
4529
4530 /* Generate and return an insn body to add Y to X.  */
4531
4532 rtx_insn *
4533 gen_addptr3_insn (rtx x, rtx y, rtx z)
4534 {
4535   enum insn_code icode = optab_handler (addptr3_optab, GET_MODE (x));
4536
4537   gcc_assert (insn_operand_matches (icode, 0, x));
4538   gcc_assert (insn_operand_matches (icode, 1, y));
4539   gcc_assert (insn_operand_matches (icode, 2, z));
4540
4541   return GEN_FCN (icode) (x, y, z);
4542 }
4543
4544 /* Return true if the target implements an addptr pattern and X, Y,
4545    and Z are valid for the pattern predicates.  */
4546
4547 int
4548 have_addptr3_insn (rtx x, rtx y, rtx z)
4549 {
4550   enum insn_code icode;
4551
4552   gcc_assert (GET_MODE (x) != VOIDmode);
4553
4554   icode = optab_handler (addptr3_optab, GET_MODE (x));
4555
4556   if (icode == CODE_FOR_nothing)
4557     return 0;
4558
4559   if (!insn_operand_matches (icode, 0, x)
4560       || !insn_operand_matches (icode, 1, y)
4561       || !insn_operand_matches (icode, 2, z))
4562     return 0;
4563
4564   return 1;
4565 }
4566
4567 /* Generate and return an insn body to subtract Y from X.  */
4568
4569 rtx_insn *
4570 gen_sub2_insn (rtx x, rtx y)
4571 {
4572   enum insn_code icode = optab_handler (sub_optab, GET_MODE (x));
4573
4574   gcc_assert (insn_operand_matches (icode, 0, x));
4575   gcc_assert (insn_operand_matches (icode, 1, x));
4576   gcc_assert (insn_operand_matches (icode, 2, y));
4577
4578   return GEN_FCN (icode) (x, x, y);
4579 }
4580
4581 /* Generate and return an insn body to subtract r1 and c,
4582    storing the result in r0.  */
4583
4584 rtx_insn *
4585 gen_sub3_insn (rtx r0, rtx r1, rtx c)
4586 {
4587   enum insn_code icode = optab_handler (sub_optab, GET_MODE (r0));
4588
4589   if (icode == CODE_FOR_nothing
4590       || !insn_operand_matches (icode, 0, r0)
4591       || !insn_operand_matches (icode, 1, r1)
4592       || !insn_operand_matches (icode, 2, c))
4593     return NULL;
4594
4595   return GEN_FCN (icode) (r0, r1, c);
4596 }
4597
4598 int
4599 have_sub2_insn (rtx x, rtx y)
4600 {
4601   enum insn_code icode;
4602
4603   gcc_assert (GET_MODE (x) != VOIDmode);
4604
4605   icode = optab_handler (sub_optab, GET_MODE (x));
4606
4607   if (icode == CODE_FOR_nothing)
4608     return 0;
4609
4610   if (!insn_operand_matches (icode, 0, x)
4611       || !insn_operand_matches (icode, 1, x)
4612       || !insn_operand_matches (icode, 2, y))
4613     return 0;
4614
4615   return 1;
4616 }
4617 \f
4618 /* Generate the body of an insn to extend Y (with mode MFROM)
4619    into X (with mode MTO).  Do zero-extension if UNSIGNEDP is nonzero.  */
4620
4621 rtx_insn *
4622 gen_extend_insn (rtx x, rtx y, machine_mode mto,
4623                  machine_mode mfrom, int unsignedp)
4624 {
4625   enum insn_code icode = can_extend_p (mto, mfrom, unsignedp);
4626   return GEN_FCN (icode) (x, y);
4627 }
4628 \f
4629 /* Generate code to convert FROM to floating point
4630    and store in TO.  FROM must be fixed point and not VOIDmode.
4631    UNSIGNEDP nonzero means regard FROM as unsigned.
4632    Normally this is done by correcting the final value
4633    if it is negative.  */
4634
4635 void
4636 expand_float (rtx to, rtx from, int unsignedp)
4637 {
4638   enum insn_code icode;
4639   rtx target = to;
4640   machine_mode fmode, imode;
4641   bool can_do_signed = false;
4642
4643   /* Crash now, because we won't be able to decide which mode to use.  */
4644   gcc_assert (GET_MODE (from) != VOIDmode);
4645
4646   /* Look for an insn to do the conversion.  Do it in the specified
4647      modes if possible; otherwise convert either input, output or both to
4648      wider mode.  If the integer mode is wider than the mode of FROM,
4649      we can do the conversion signed even if the input is unsigned.  */
4650
4651   FOR_EACH_MODE_FROM (fmode, GET_MODE (to))
4652     FOR_EACH_MODE_FROM (imode, GET_MODE (from))
4653       {
4654         int doing_unsigned = unsignedp;
4655
4656         if (fmode != GET_MODE (to)
4657             && significand_size (fmode) < GET_MODE_PRECISION (GET_MODE (from)))
4658           continue;
4659
4660         icode = can_float_p (fmode, imode, unsignedp);
4661         if (icode == CODE_FOR_nothing && unsignedp)
4662           {
4663             enum insn_code scode = can_float_p (fmode, imode, 0);
4664             if (scode != CODE_FOR_nothing)
4665               can_do_signed = true;
4666             if (imode != GET_MODE (from))
4667               icode = scode, doing_unsigned = 0;
4668           }
4669
4670         if (icode != CODE_FOR_nothing)
4671           {
4672             if (imode != GET_MODE (from))
4673               from = convert_to_mode (imode, from, unsignedp);
4674
4675             if (fmode != GET_MODE (to))
4676               target = gen_reg_rtx (fmode);
4677
4678             emit_unop_insn (icode, target, from,
4679                             doing_unsigned ? UNSIGNED_FLOAT : FLOAT);
4680
4681             if (target != to)
4682               convert_move (to, target, 0);
4683             return;
4684           }
4685       }
4686
4687   /* Unsigned integer, and no way to convert directly.  Convert as signed,
4688      then unconditionally adjust the result.  */
4689   if (unsignedp && can_do_signed)
4690     {
4691       rtx_code_label *label = gen_label_rtx ();
4692       rtx temp;
4693       REAL_VALUE_TYPE offset;
4694
4695       /* Look for a usable floating mode FMODE wider than the source and at
4696          least as wide as the target.  Using FMODE will avoid rounding woes
4697          with unsigned values greater than the signed maximum value.  */
4698
4699       FOR_EACH_MODE_FROM (fmode, GET_MODE (to))
4700         if (GET_MODE_PRECISION (GET_MODE (from)) < GET_MODE_BITSIZE (fmode)
4701             && can_float_p (fmode, GET_MODE (from), 0) != CODE_FOR_nothing)
4702           break;
4703
4704       if (fmode == VOIDmode)
4705         {
4706           /* There is no such mode.  Pretend the target is wide enough.  */
4707           fmode = GET_MODE (to);
4708
4709           /* Avoid double-rounding when TO is narrower than FROM.  */
4710           if ((significand_size (fmode) + 1)
4711               < GET_MODE_PRECISION (GET_MODE (from)))
4712             {
4713               rtx temp1;
4714               rtx_code_label *neglabel = gen_label_rtx ();
4715
4716               /* Don't use TARGET if it isn't a register, is a hard register,
4717                  or is the wrong mode.  */
4718               if (!REG_P (target)
4719                   || REGNO (target) < FIRST_PSEUDO_REGISTER
4720                   || GET_MODE (target) != fmode)
4721                 target = gen_reg_rtx (fmode);
4722
4723               imode = GET_MODE (from);
4724               do_pending_stack_adjust ();
4725
4726               /* Test whether the sign bit is set.  */
4727               emit_cmp_and_jump_insns (from, const0_rtx, LT, NULL_RTX, imode,
4728                                        0, neglabel);
4729
4730               /* The sign bit is not set.  Convert as signed.  */
4731               expand_float (target, from, 0);
4732               emit_jump_insn (targetm.gen_jump (label));
4733               emit_barrier ();
4734
4735               /* The sign bit is set.
4736                  Convert to a usable (positive signed) value by shifting right
4737                  one bit, while remembering if a nonzero bit was shifted
4738                  out; i.e., compute  (from & 1) | (from >> 1).  */
4739
4740               emit_label (neglabel);
4741               temp = expand_binop (imode, and_optab, from, const1_rtx,
4742                                    NULL_RTX, 1, OPTAB_LIB_WIDEN);
4743               temp1 = expand_shift (RSHIFT_EXPR, imode, from, 1, NULL_RTX, 1);
4744               temp = expand_binop (imode, ior_optab, temp, temp1, temp, 1,
4745                                    OPTAB_LIB_WIDEN);
4746               expand_float (target, temp, 0);
4747
4748               /* Multiply by 2 to undo the shift above.  */
4749               temp = expand_binop (fmode, add_optab, target, target,
4750                                    target, 0, OPTAB_LIB_WIDEN);
4751               if (temp != target)
4752                 emit_move_insn (target, temp);
4753
4754               do_pending_stack_adjust ();
4755               emit_label (label);
4756               goto done;
4757             }
4758         }
4759
4760       /* If we are about to do some arithmetic to correct for an
4761          unsigned operand, do it in a pseudo-register.  */
4762
4763       if (GET_MODE (to) != fmode
4764           || !REG_P (to) || REGNO (to) < FIRST_PSEUDO_REGISTER)
4765         target = gen_reg_rtx (fmode);
4766
4767       /* Convert as signed integer to floating.  */
4768       expand_float (target, from, 0);
4769
4770       /* If FROM is negative (and therefore TO is negative),
4771          correct its value by 2**bitwidth.  */
4772
4773       do_pending_stack_adjust ();
4774       emit_cmp_and_jump_insns (from, const0_rtx, GE, NULL_RTX, GET_MODE (from),
4775                                0, label);
4776
4777
4778       real_2expN (&offset, GET_MODE_PRECISION (GET_MODE (from)), fmode);
4779       temp = expand_binop (fmode, add_optab, target,
4780                            const_double_from_real_value (offset, fmode),
4781                            target, 0, OPTAB_LIB_WIDEN);
4782       if (temp != target)
4783         emit_move_insn (target, temp);
4784
4785       do_pending_stack_adjust ();
4786       emit_label (label);
4787       goto done;
4788     }
4789
4790   /* No hardware instruction available; call a library routine.  */
4791     {
4792       rtx libfunc;
4793       rtx_insn *insns;
4794       rtx value;
4795       convert_optab tab = unsignedp ? ufloat_optab : sfloat_optab;
4796
4797       if (GET_MODE_PRECISION (GET_MODE (from)) < GET_MODE_PRECISION (SImode))
4798         from = convert_to_mode (SImode, from, unsignedp);
4799
4800       libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
4801       gcc_assert (libfunc);
4802
4803       start_sequence ();
4804
4805       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4806                                        GET_MODE (to), 1, from,
4807                                        GET_MODE (from));
4808       insns = get_insns ();
4809       end_sequence ();
4810
4811       emit_libcall_block (insns, target, value,
4812                           gen_rtx_fmt_e (unsignedp ? UNSIGNED_FLOAT : FLOAT,
4813                                          GET_MODE (to), from));
4814     }
4815
4816  done:
4817
4818   /* Copy result to requested destination
4819      if we have been computing in a temp location.  */
4820
4821   if (target != to)
4822     {
4823       if (GET_MODE (target) == GET_MODE (to))
4824         emit_move_insn (to, target);
4825       else
4826         convert_move (to, target, 0);
4827     }
4828 }
4829 \f
4830 /* Generate code to convert FROM to fixed point and store in TO.  FROM
4831    must be floating point.  */
4832
4833 void
4834 expand_fix (rtx to, rtx from, int unsignedp)
4835 {
4836   enum insn_code icode;
4837   rtx target = to;
4838   machine_mode fmode, imode;
4839   bool must_trunc = false;
4840
4841   /* We first try to find a pair of modes, one real and one integer, at
4842      least as wide as FROM and TO, respectively, in which we can open-code
4843      this conversion.  If the integer mode is wider than the mode of TO,
4844      we can do the conversion either signed or unsigned.  */
4845
4846   FOR_EACH_MODE_FROM (fmode, GET_MODE (from))
4847     FOR_EACH_MODE_FROM (imode, GET_MODE (to))
4848       {
4849         int doing_unsigned = unsignedp;
4850
4851         icode = can_fix_p (imode, fmode, unsignedp, &must_trunc);
4852         if (icode == CODE_FOR_nothing && imode != GET_MODE (to) && unsignedp)
4853           icode = can_fix_p (imode, fmode, 0, &must_trunc), doing_unsigned = 0;
4854
4855         if (icode != CODE_FOR_nothing)
4856           {
4857             rtx_insn *last = get_last_insn ();
4858             if (fmode != GET_MODE (from))
4859               from = convert_to_mode (fmode, from, 0);
4860
4861             if (must_trunc)
4862               {
4863                 rtx temp = gen_reg_rtx (GET_MODE (from));
4864                 from = expand_unop (GET_MODE (from), ftrunc_optab, from,
4865                                     temp, 0);
4866               }
4867
4868             if (imode != GET_MODE (to))
4869               target = gen_reg_rtx (imode);
4870
4871             if (maybe_emit_unop_insn (icode, target, from,
4872                                       doing_unsigned ? UNSIGNED_FIX : FIX))
4873               {
4874                 if (target != to)
4875                   convert_move (to, target, unsignedp);
4876                 return;
4877               }
4878             delete_insns_since (last);
4879           }
4880       }
4881
4882   /* For an unsigned conversion, there is one more way to do it.
4883      If we have a signed conversion, we generate code that compares
     the real value to the largest representable positive number.  If it
4885      is smaller, the conversion is done normally.  Otherwise, subtract
4886      one plus the highest signed number, convert, and add it back.
4887
4888      We only need to check all real modes, since we know we didn't find
4889      anything with a wider integer mode.
4890
4891      This code used to extend FP value into mode wider than the destination.
4892      This is needed for decimal float modes which cannot accurately
4893      represent one plus the highest signed number of the same size, but
4894      not for binary modes.  Consider, for instance conversion from SFmode
4895      into DImode.
4896
4897      The hot path through the code is dealing with inputs smaller than 2^63
4898      and doing just the conversion, so there is no bits to lose.
4899
4900      In the other path we know the value is positive in the range 2^63..2^64-1
4901      inclusive.  (as for other input overflow happens and result is undefined)
4902      So we know that the most important bit set in mantissa corresponds to
4903      2^63.  The subtraction of 2^63 should not generate any rounding as it
4904      simply clears out that bit.  The rest is trivial.  */
4905
4906   if (unsignedp && GET_MODE_PRECISION (GET_MODE (to)) <= HOST_BITS_PER_WIDE_INT)
4907     FOR_EACH_MODE_FROM (fmode, GET_MODE (from))
4908       if (CODE_FOR_nothing != can_fix_p (GET_MODE (to), fmode, 0, &must_trunc)
4909           && (!DECIMAL_FLOAT_MODE_P (fmode)
4910               || GET_MODE_BITSIZE (fmode) > GET_MODE_PRECISION (GET_MODE (to))))
4911         {
4912           int bitsize;
4913           REAL_VALUE_TYPE offset;
4914           rtx limit;
4915           rtx_code_label *lab1, *lab2;
4916           rtx_insn *insn;
4917
4918           bitsize = GET_MODE_PRECISION (GET_MODE (to));
4919           real_2expN (&offset, bitsize - 1, fmode);
4920           limit = const_double_from_real_value (offset, fmode);
4921           lab1 = gen_label_rtx ();
4922           lab2 = gen_label_rtx ();
4923
4924           if (fmode != GET_MODE (from))
4925             from = convert_to_mode (fmode, from, 0);
4926
4927           /* See if we need to do the subtraction.  */
4928           do_pending_stack_adjust ();
4929           emit_cmp_and_jump_insns (from, limit, GE, NULL_RTX, GET_MODE (from),
4930                                    0, lab1);
4931
4932           /* If not, do the signed "fix" and branch around fixup code.  */
4933           expand_fix (to, from, 0);
4934           emit_jump_insn (targetm.gen_jump (lab2));
4935           emit_barrier ();
4936
4937           /* Otherwise, subtract 2**(N-1), convert to signed number,
4938              then add 2**(N-1).  Do the addition using XOR since this
4939              will often generate better code.  */
4940           emit_label (lab1);
4941           target = expand_binop (GET_MODE (from), sub_optab, from, limit,
4942                                  NULL_RTX, 0, OPTAB_LIB_WIDEN);
4943           expand_fix (to, target, 0);
4944           target = expand_binop (GET_MODE (to), xor_optab, to,
4945                                  gen_int_mode
4946                                  (HOST_WIDE_INT_1 << (bitsize - 1),
4947                                   GET_MODE (to)),
4948                                  to, 1, OPTAB_LIB_WIDEN);
4949
4950           if (target != to)
4951             emit_move_insn (to, target);
4952
4953           emit_label (lab2);
4954
4955           if (optab_handler (mov_optab, GET_MODE (to)) != CODE_FOR_nothing)
4956             {
4957               /* Make a place for a REG_NOTE and add it.  */
4958               insn = emit_move_insn (to, to);
4959               set_dst_reg_note (insn, REG_EQUAL,
4960                                 gen_rtx_fmt_e (UNSIGNED_FIX, GET_MODE (to),
4961                                                copy_rtx (from)),
4962                                 to);
4963             }
4964
4965           return;
4966         }
4967
4968   /* We can't do it with an insn, so use a library call.  But first ensure
4969      that the mode of TO is at least as wide as SImode, since those are the
4970      only library calls we know about.  */
4971
4972   if (GET_MODE_PRECISION (GET_MODE (to)) < GET_MODE_PRECISION (SImode))
4973     {
4974       target = gen_reg_rtx (SImode);
4975
4976       expand_fix (target, from, unsignedp);
4977     }
4978   else
4979     {
4980       rtx_insn *insns;
4981       rtx value;
4982       rtx libfunc;
4983
4984       convert_optab tab = unsignedp ? ufix_optab : sfix_optab;
4985       libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
4986       gcc_assert (libfunc);
4987
4988       start_sequence ();
4989
4990       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4991                                        GET_MODE (to), 1, from,
4992                                        GET_MODE (from));
4993       insns = get_insns ();
4994       end_sequence ();
4995
4996       emit_libcall_block (insns, target, value,
4997                           gen_rtx_fmt_e (unsignedp ? UNSIGNED_FIX : FIX,
4998                                          GET_MODE (to), from));
4999     }
5000
5001   if (target != to)
5002     {
5003       if (GET_MODE (to) == GET_MODE (target))
5004         emit_move_insn (to, target);
5005       else
5006         convert_move (to, target, 0);
5007     }
5008 }
5009
5010
5011 /* Promote integer arguments for a libcall if necessary.
5012    emit_library_call_value cannot do the promotion because it does not
5013    know if it should do a signed or unsigned promotion.  This is because
5014    there are no tree types defined for libcalls.  */
5015
5016 static rtx
5017 prepare_libcall_arg (rtx arg, int uintp)
5018 {
5019   scalar_int_mode mode;
5020   machine_mode arg_mode;
5021   if (is_a <scalar_int_mode> (GET_MODE (arg), &mode))
5022     {
5023       /*  If we need to promote the integer function argument we need to do
5024           it here instead of inside emit_library_call_value because in
5025           emit_library_call_value we don't know if we should do a signed or
5026           unsigned promotion.  */
5027
5028       int unsigned_p = 0;
5029       arg_mode = promote_function_mode (NULL_TREE, mode,
5030                                         &unsigned_p, NULL_TREE, 0);
5031       if (arg_mode != mode)
5032         return convert_to_mode (arg_mode, arg, uintp);
5033     }
5034     return arg;
5035 }
5036
5037 /* Generate code to convert FROM or TO a fixed-point.
5038    If UINTP is true, either TO or FROM is an unsigned integer.
5039    If SATP is true, we need to saturate the result.  */
5040
5041 void
5042 expand_fixed_convert (rtx to, rtx from, int uintp, int satp)
5043 {
5044   machine_mode to_mode = GET_MODE (to);
5045   machine_mode from_mode = GET_MODE (from);
5046   convert_optab tab;
5047   enum rtx_code this_code;
5048   enum insn_code code;
5049   rtx_insn *insns;
5050   rtx value;
5051   rtx libfunc;
5052
5053   if (to_mode == from_mode)
5054     {
5055       emit_move_insn (to, from);
5056       return;
5057     }
5058
5059   if (uintp)
5060     {
5061       tab = satp ? satfractuns_optab : fractuns_optab;
5062       this_code = satp ? UNSIGNED_SAT_FRACT : UNSIGNED_FRACT_CONVERT;
5063     }
5064   else
5065     {
5066       tab = satp ? satfract_optab : fract_optab;
5067       this_code = satp ? SAT_FRACT : FRACT_CONVERT;
5068     }
5069   code = convert_optab_handler (tab, to_mode, from_mode);
5070   if (code != CODE_FOR_nothing)
5071     {
5072       emit_unop_insn (code, to, from, this_code);
5073       return;
5074     }
5075
5076   libfunc = convert_optab_libfunc (tab, to_mode, from_mode);
5077   gcc_assert (libfunc);
5078
5079   from = prepare_libcall_arg (from, uintp);
5080   from_mode = GET_MODE (from);
5081
5082   start_sequence ();
5083   value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, to_mode,
5084                                    1, from, from_mode);
5085   insns = get_insns ();
5086   end_sequence ();
5087
5088   emit_libcall_block (insns, to, value,
5089                       gen_rtx_fmt_e (optab_to_code (tab), to_mode, from));
5090 }
5091
5092 /* Generate code to convert FROM to fixed point and store in TO.  FROM
5093    must be floating point, TO must be signed.  Use the conversion optab
5094    TAB to do the conversion.  */
5095
5096 bool
5097 expand_sfix_optab (rtx to, rtx from, convert_optab tab)
5098 {
5099   enum insn_code icode;
5100   rtx target = to;
5101   machine_mode fmode, imode;
5102
5103   /* We first try to find a pair of modes, one real and one integer, at
5104      least as wide as FROM and TO, respectively, in which we can open-code
5105      this conversion.  If the integer mode is wider than the mode of TO,
5106      we can do the conversion either signed or unsigned.  */
5107
5108   FOR_EACH_MODE_FROM (fmode, GET_MODE (from))
5109     FOR_EACH_MODE_FROM (imode, GET_MODE (to))
5110       {
5111         icode = convert_optab_handler (tab, imode, fmode);
5112         if (icode != CODE_FOR_nothing)
5113           {
5114             rtx_insn *last = get_last_insn ();
5115             if (fmode != GET_MODE (from))
5116               from = convert_to_mode (fmode, from, 0);
5117
5118             if (imode != GET_MODE (to))
5119               target = gen_reg_rtx (imode);
5120
5121             if (!maybe_emit_unop_insn (icode, target, from, UNKNOWN))
5122               {
5123                 delete_insns_since (last);
5124                 continue;
5125               }
5126             if (target != to)
5127               convert_move (to, target, 0);
5128             return true;
5129           }
5130       }
5131
5132   return false;
5133 }
5134 \f
5135 /* Report whether we have an instruction to perform the operation
5136    specified by CODE on operands of mode MODE.  */
5137 int
5138 have_insn_for (enum rtx_code code, machine_mode mode)
5139 {
5140   return (code_to_optab (code)
5141           && (optab_handler (code_to_optab (code), mode)
5142               != CODE_FOR_nothing));
5143 }
5144
5145 /* Print information about the current contents of the optabs on
5146    STDERR.  */
5147
5148 DEBUG_FUNCTION void
5149 debug_optab_libfuncs (void)
5150 {
5151   int i, j, k;
5152
5153   /* Dump the arithmetic optabs.  */
5154   for (i = FIRST_NORM_OPTAB; i <= LAST_NORMLIB_OPTAB; ++i)
5155     for (j = 0; j < NUM_MACHINE_MODES; ++j)
5156       {
5157         rtx l = optab_libfunc ((optab) i, (machine_mode) j);
5158         if (l)
5159           {
5160             gcc_assert (GET_CODE (l) == SYMBOL_REF);
5161             fprintf (stderr, "%s\t%s:\t%s\n",
5162                      GET_RTX_NAME (optab_to_code ((optab) i)),
5163                      GET_MODE_NAME (j),
5164                      XSTR (l, 0));
5165           }
5166       }
5167
5168   /* Dump the conversion optabs.  */
5169   for (i = FIRST_CONV_OPTAB; i <= LAST_CONVLIB_OPTAB; ++i)
5170     for (j = 0; j < NUM_MACHINE_MODES; ++j)
5171       for (k = 0; k < NUM_MACHINE_MODES; ++k)
5172         {
5173           rtx l = convert_optab_libfunc ((optab) i, (machine_mode) j,
5174                                          (machine_mode) k);
5175           if (l)
5176             {
5177               gcc_assert (GET_CODE (l) == SYMBOL_REF);
5178               fprintf (stderr, "%s\t%s\t%s:\t%s\n",
5179                        GET_RTX_NAME (optab_to_code ((optab) i)),
5180                        GET_MODE_NAME (j),
5181                        GET_MODE_NAME (k),
5182                        XSTR (l, 0));
5183             }
5184         }
5185 }
5186
5187 /* Generate insns to trap with code TCODE if OP1 and OP2 satisfy condition
5188    CODE.  Return 0 on failure.  */
5189
5190 rtx_insn *
5191 gen_cond_trap (enum rtx_code code, rtx op1, rtx op2, rtx tcode)
5192 {
5193   machine_mode mode = GET_MODE (op1);
5194   enum insn_code icode;
5195   rtx_insn *insn;
5196   rtx trap_rtx;
5197
5198   if (mode == VOIDmode)
5199     return 0;
5200
5201   icode = optab_handler (ctrap_optab, mode);
5202   if (icode == CODE_FOR_nothing)
5203     return 0;
5204
5205   /* Some targets only accept a zero trap code.  */
5206   if (!insn_operand_matches (icode, 3, tcode))
5207     return 0;
5208
5209   do_pending_stack_adjust ();
5210   start_sequence ();
5211   prepare_cmp_insn (op1, op2, code, NULL_RTX, false, OPTAB_DIRECT,
5212                     &trap_rtx, &mode);
5213   if (!trap_rtx)
5214     insn = NULL;
5215   else
5216     insn = GEN_FCN (icode) (trap_rtx, XEXP (trap_rtx, 0), XEXP (trap_rtx, 1),
5217                             tcode);
5218
5219   /* If that failed, then give up.  */
5220   if (insn == 0)
5221     {
5222       end_sequence ();
5223       return 0;
5224     }
5225
5226   emit_insn (insn);
5227   insn = get_insns ();
5228   end_sequence ();
5229   return insn;
5230 }
5231
5232 /* Return rtx code for TCODE. Use UNSIGNEDP to select signed
5233    or unsigned operation code.  */
5234
5235 enum rtx_code
5236 get_rtx_code (enum tree_code tcode, bool unsignedp)
5237 {
5238   enum rtx_code code;
5239   switch (tcode)
5240     {
5241     case EQ_EXPR:
5242       code = EQ;
5243       break;
5244     case NE_EXPR:
5245       code = NE;
5246       break;
5247     case LT_EXPR:
5248       code = unsignedp ? LTU : LT;
5249       break;
5250     case LE_EXPR:
5251       code = unsignedp ? LEU : LE;
5252       break;
5253     case GT_EXPR:
5254       code = unsignedp ? GTU : GT;
5255       break;
5256     case GE_EXPR:
5257       code = unsignedp ? GEU : GE;
5258       break;
5259
5260     case UNORDERED_EXPR:
5261       code = UNORDERED;
5262       break;
5263     case ORDERED_EXPR:
5264       code = ORDERED;
5265       break;
5266     case UNLT_EXPR:
5267       code = UNLT;
5268       break;
5269     case UNLE_EXPR:
5270       code = UNLE;
5271       break;
5272     case UNGT_EXPR:
5273       code = UNGT;
5274       break;
5275     case UNGE_EXPR:
5276       code = UNGE;
5277       break;
5278     case UNEQ_EXPR:
5279       code = UNEQ;
5280       break;
5281     case LTGT_EXPR:
5282       code = LTGT;
5283       break;
5284
5285     case BIT_AND_EXPR:
5286       code = AND;
5287       break;
5288
5289     case BIT_IOR_EXPR:
5290       code = IOR;
5291       break;
5292
5293     default:
5294       gcc_unreachable ();
5295     }
5296   return code;
5297 }
5298
5299 /* Return a comparison rtx of mode CMP_MODE for COND.  Use UNSIGNEDP to
5300    select signed or unsigned operators.  OPNO holds the index of the
5301    first comparison operand for insn ICODE.  Do not generate the
5302    compare instruction itself.  */
5303
5304 static rtx
5305 vector_compare_rtx (machine_mode cmp_mode, enum tree_code tcode,
5306                     tree t_op0, tree t_op1, bool unsignedp,
5307                     enum insn_code icode, unsigned int opno)
5308 {
5309   struct expand_operand ops[2];
5310   rtx rtx_op0, rtx_op1;
5311   machine_mode m0, m1;
5312   enum rtx_code rcode = get_rtx_code (tcode, unsignedp);
5313
5314   gcc_assert (TREE_CODE_CLASS (tcode) == tcc_comparison);
5315
5316   /* Expand operands.  For vector types with scalar modes, e.g. where int64x1_t
5317      has mode DImode, this can produce a constant RTX of mode VOIDmode; in such
5318      cases, use the original mode.  */
5319   rtx_op0 = expand_expr (t_op0, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op0)),
5320                          EXPAND_STACK_PARM);
5321   m0 = GET_MODE (rtx_op0);
5322   if (m0 == VOIDmode)
5323     m0 = TYPE_MODE (TREE_TYPE (t_op0));
5324
5325   rtx_op1 = expand_expr (t_op1, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op1)),
5326                          EXPAND_STACK_PARM);
5327   m1 = GET_MODE (rtx_op1);
5328   if (m1 == VOIDmode)
5329     m1 = TYPE_MODE (TREE_TYPE (t_op1));
5330
5331   create_input_operand (&ops[0], rtx_op0, m0);
5332   create_input_operand (&ops[1], rtx_op1, m1);
5333   if (!maybe_legitimize_operands (icode, opno, 2, ops))
5334     gcc_unreachable ();
5335   return gen_rtx_fmt_ee (rcode, cmp_mode, ops[0].value, ops[1].value);
5336 }
5337
5338 /* Checks if vec_perm mask SEL is a constant equivalent to a shift of the first
5339    vec_perm operand, assuming the second operand is a constant vector of zeroes.
5340    Return the shift distance in bits if so, or NULL_RTX if the vec_perm is not a
5341    shift.  */
5342 static rtx
5343 shift_amt_for_vec_perm_mask (rtx sel)
5344 {
5345   unsigned int i, first, nelt = GET_MODE_NUNITS (GET_MODE (sel));
5346   unsigned int bitsize = GET_MODE_UNIT_BITSIZE (GET_MODE (sel));
5347
5348   if (GET_CODE (sel) != CONST_VECTOR)
5349     return NULL_RTX;
5350
5351   first = INTVAL (CONST_VECTOR_ELT (sel, 0));
5352   if (first >= nelt)
5353     return NULL_RTX;
5354   for (i = 1; i < nelt; i++)
5355     {
5356       int idx = INTVAL (CONST_VECTOR_ELT (sel, i));
5357       unsigned int expected = i + first;
5358       /* Indices into the second vector are all equivalent.  */
5359       if (idx < 0 || (MIN (nelt, (unsigned) idx) != MIN (nelt, expected)))
5360         return NULL_RTX;
5361     }
5362
5363   return GEN_INT (first * bitsize);
5364 }
5365
5366 /* A subroutine of expand_vec_perm for expanding one vec_perm insn.  */
5367
5368 static rtx
5369 expand_vec_perm_1 (enum insn_code icode, rtx target,
5370                    rtx v0, rtx v1, rtx sel)
5371 {
5372   machine_mode tmode = GET_MODE (target);
5373   machine_mode smode = GET_MODE (sel);
5374   struct expand_operand ops[4];
5375
5376   create_output_operand (&ops[0], target, tmode);
5377   create_input_operand (&ops[3], sel, smode);
5378
5379   /* Make an effort to preserve v0 == v1.  The target expander is able to
5380      rely on this to determine if we're permuting a single input operand.  */
5381   if (rtx_equal_p (v0, v1))
5382     {
5383       if (!insn_operand_matches (icode, 1, v0))
5384         v0 = force_reg (tmode, v0);
5385       gcc_checking_assert (insn_operand_matches (icode, 1, v0));
5386       gcc_checking_assert (insn_operand_matches (icode, 2, v0));
5387
5388       create_fixed_operand (&ops[1], v0);
5389       create_fixed_operand (&ops[2], v0);
5390     }
5391   else
5392     {
5393       create_input_operand (&ops[1], v0, tmode);
5394       create_input_operand (&ops[2], v1, tmode);
5395     }
5396
5397   if (maybe_expand_insn (icode, 4, ops))
5398     return ops[0].value;
5399   return NULL_RTX;
5400 }
5401
5402 /* Generate instructions for vec_perm optab given its mode
5403    and three operands.

        MODE is the vector mode of the result, V0 and V1 are the two input
        vectors and SEL is the selector, which must have an integer vector
        mode.  TARGET is used for the result when it is non-null and already
        has mode MODE; otherwise a fresh pseudo is allocated.

        A constant SEL is tried first as a vec_shr (only when V1 is all
        zeroes), then with vec_perm_const in MODE, then with vec_perm_const
        on the vector mode with byte elements of the same size.  After that,
        or for a variable SEL, the variable vec_perm pattern is tried in MODE
        and finally on the byte vector mode.  Return the rtx holding the
        result, or NULL_RTX if none of these strategies succeeds.  */
5404
5405 rtx
5406 expand_vec_perm (machine_mode mode, rtx v0, rtx v1, rtx sel, rtx target)
5407 {
5408   enum insn_code icode;
5409   machine_mode qimode;
5410   unsigned int i, w, e, u;
5411   rtx tmp, sel_qi = NULL;
5412   rtvec vec;
5413
5414   if (!target || GET_MODE (target) != mode)
5415     target = gen_reg_rtx (mode);
5416
       /* W is the size of MODE, E its number of elements and U the size of
          one element.  */
5417   w = GET_MODE_SIZE (mode);
5418   e = GET_MODE_NUNITS (mode);
5419   u = GET_MODE_UNIT_SIZE (mode);
5420
5421   /* Set QIMODE to a different vector mode with byte elements.
5422      If no such mode, or if MODE already has byte elements, use VOIDmode.  */
5423   qimode = VOIDmode;
5424   if (GET_MODE_INNER (mode) != QImode)
5425     {
5426       qimode = mode_for_vector (QImode, w);
5427       if (!VECTOR_MODE_P (qimode))
5428         qimode = VOIDmode;
5429     }
5430
5431   /* If the input is a constant, expand it specially.  */
5432   gcc_assert (GET_MODE_CLASS (GET_MODE (sel)) == MODE_VECTOR_INT);
5433   if (GET_CODE (sel) == CONST_VECTOR)
5434     {
5435       /* See if this can be handled with a vec_shr.  We only do this if the
5436          second vector is all zeroes.  */
5437       enum insn_code shift_code = optab_handler (vec_shr_optab, mode);
5438       enum insn_code shift_code_qi = ((qimode != VOIDmode && qimode != mode)
5439                                       ? optab_handler (vec_shr_optab, qimode)
5440                                       : CODE_FOR_nothing);
5441       rtx shift_amt = NULL_RTX;
5442       if (v1 == CONST0_RTX (GET_MODE (v1))
5443           && (shift_code != CODE_FOR_nothing
5444               || shift_code_qi != CODE_FOR_nothing))
5445         {
5446           shift_amt = shift_amt_for_vec_perm_mask (sel);
5447           if (shift_amt)
5448             {
5449               struct expand_operand ops[3];
                   /* Prefer a shift in MODE itself.  */
5450               if (shift_code != CODE_FOR_nothing)
5451                 {
5452                   create_output_operand (&ops[0], target, mode);
5453                   create_input_operand (&ops[1], v0, mode);
5454                   create_convert_operand_from_type (&ops[2], shift_amt,
5455                                                     sizetype);
5456                   if (maybe_expand_insn (shift_code, 3, ops))
5457                     return ops[0].value;
5458                 }
                   /* Otherwise shift the byte-vector view of V0 and view the
                      result back in MODE.  */
5459               if (shift_code_qi != CODE_FOR_nothing)
5460                 {
5461                   tmp = gen_reg_rtx (qimode);
5462                   create_output_operand (&ops[0], tmp, qimode);
5463                   create_input_operand (&ops[1], gen_lowpart (qimode, v0),
5464                                         qimode);
5465                   create_convert_operand_from_type (&ops[2], shift_amt,
5466                                                     sizetype);
5467                   if (maybe_expand_insn (shift_code_qi, 3, ops))
5468                     return gen_lowpart (mode, ops[0].value);
5469                 }
5470             }
5471         }
5472
           /* Next try the constant-selector permutation pattern in MODE.  */
5473       icode = direct_optab_handler (vec_perm_const_optab, mode);
5474       if (icode != CODE_FOR_nothing)
5475         {
5476           tmp = expand_vec_perm_1 (icode, target, v0, v1, sel);
5477           if (tmp)
5478             return tmp;
5479         }
5480
5481       /* Fall back to a constant byte-based permutation.  */
5482       if (qimode != VOIDmode)
5483         {
5484           vec = rtvec_alloc (w);
5485           for (i = 0; i < e; ++i)
5486             {
5487               unsigned int j, this_e;
5488
                   /* Mask the element index to the 2*E elements of the two
                      inputs and scale it to the index of its first byte.
                      NOTE(review): the mask is an exact modulo only when
                      2*E is a power of two -- confirm.  */
5489               this_e = INTVAL (CONST_VECTOR_ELT (sel, i));
5490               this_e &= 2 * e - 1;
5491               this_e *= u;
5492
                   /* Select the U consecutive bytes of that element.  */
5493               for (j = 0; j < u; ++j)
5494                 RTVEC_ELT (vec, i * u + j) = GEN_INT (this_e + j);
5495             }
5496           sel_qi = gen_rtx_CONST_VECTOR (qimode, vec);
5497
5498           icode = direct_optab_handler (vec_perm_const_optab, qimode);
5499           if (icode != CODE_FOR_nothing)
5500             {
5501               tmp = mode != qimode ? gen_reg_rtx (qimode) : target;
5502               tmp = expand_vec_perm_1 (icode, tmp, gen_lowpart (qimode, v0),
5503                                        gen_lowpart (qimode, v1), sel_qi);
5504               if (tmp)
5505                 return gen_lowpart (mode, tmp);
5506             }
5507         }
5508     }
5509
5510   /* Otherwise expand as a fully variable permutation.  */
5511   icode = direct_optab_handler (vec_perm_optab, mode);
5512   if (icode != CODE_FOR_nothing)
5513     {
5514       tmp = expand_vec_perm_1 (icode, target, v0, v1, sel);
5515       if (tmp)
5516         return tmp;
5517     }
5518
5519   /* As a special case to aid several targets, lower the element-based
5520      permutation to a byte-based permutation and try again.  */
5521   if (qimode == VOIDmode)
5522     return NULL_RTX;
5523   icode = direct_optab_handler (vec_perm_optab, qimode);
5524   if (icode == CODE_FOR_nothing)
5525     return NULL_RTX;
5526
       /* SEL_QI is already set if a constant byte selector was built above;
          otherwise compute the byte selector from SEL with emitted code.  */
5527   if (sel_qi == NULL)
5528     {
5529       /* Multiply each element by its byte size.  */
5530       machine_mode selmode = GET_MODE (sel);
5531       if (u == 2)
5532         sel = expand_simple_binop (selmode, PLUS, sel, sel,
5533                                    NULL, 0, OPTAB_DIRECT);
5534       else
5535         sel = expand_simple_binop (selmode, ASHIFT, sel,
5536                                    GEN_INT (exact_log2 (u)),
5537                                    NULL, 0, OPTAB_DIRECT);
5538       gcc_assert (sel != NULL);
5539
5540       /* Broadcast the low byte of each element into each of its bytes.  */
5541       vec = rtvec_alloc (w);
5542       for (i = 0; i < w; ++i)
5543         {
5544           int this_e = i / u * u;
5545           if (BYTES_BIG_ENDIAN)
5546             this_e += u - 1;
5547           RTVEC_ELT (vec, i) = GEN_INT (this_e);
5548         }
5549       tmp = gen_rtx_CONST_VECTOR (qimode, vec);
5550       sel = gen_lowpart (qimode, sel);
           /* The broadcast is itself a byte permutation of SEL with a
              constant selector, so recurse to expand it.  */
5551       sel = expand_vec_perm (qimode, sel, sel, tmp, NULL);
5552       gcc_assert (sel != NULL);
5553
5554       /* Add the byte offset to each byte element.  */
5555       /* Note that the definition of the indices here is memory ordering,
5556          so there should be no difference between big and little endian.  */
5557       vec = rtvec_alloc (w);
5558       for (i = 0; i < w; ++i)
5559         RTVEC_ELT (vec, i) = GEN_INT (i % u);
5560       tmp = gen_rtx_CONST_VECTOR (qimode, vec);
5561       sel_qi = expand_simple_binop (qimode, PLUS, sel, tmp,
5562                                     sel, 0, OPTAB_DIRECT);
5563       gcc_assert (sel_qi != NULL);
5564     }
5565
       /* Permute the byte-vector views of the inputs and, on success, view
          the result back in MODE.  */
5566   tmp = mode != qimode ? gen_reg_rtx (qimode) : target;
5567   tmp = expand_vec_perm_1 (icode, tmp, gen_lowpart (qimode, v0),
5568                            gen_lowpart (qimode, v1), sel_qi);
5569   if (tmp)
5570     tmp = gen_lowpart (mode, tmp);
5571   return tmp;
5572 }
5573
5574 /* Generate insns for a VEC_COND_EXPR with mask, given its TYPE and its
5575    three operands.  */
5576
5577 rtx
5578 expand_vec_cond_mask_expr (tree vec_cond_type, tree op0, tree op1, tree op2,
5579                            rtx target)
5580 {
5581   struct expand_operand ops[4];
5582   machine_mode mode = TYPE_MODE (vec_cond_type);
5583   machine_mode mask_mode = TYPE_MODE (TREE_TYPE (op0));
5584   enum insn_code icode = get_vcond_mask_icode (mode, mask_mode);
5585   rtx mask, rtx_op1, rtx_op2;
5586
5587   if (icode == CODE_FOR_nothing)
5588     return 0;
5589
5590   mask = expand_normal (op0);
5591   rtx_op1 = expand_normal (op1);
5592   rtx_op2 = expand_normal (op2);
5593
5594   mask = force_reg (mask_mode, mask);
5595   rtx_op1 = force_reg (GET_MODE (rtx_op1), rtx_op1);
5596
5597   create_output_operand (&ops[0], target, mode);
5598   create_input_operand (&ops[1], rtx_op1, mode);
5599   create_input_operand (&ops[2], rtx_op2, mode);
5600   create_input_operand (&ops[3], mask, mask_mode);
5601   expand_insn (icode, 4, ops);
5602
5603   return ops[0].value;
5604 }
5605
5606 /* Generate insns for a VEC_COND_EXPR, given its TYPE and its
5607    three operands.  */
5608
5609 rtx
5610 expand_vec_cond_expr (tree vec_cond_type, tree op0, tree op1, tree op2,
5611                       rtx target)
5612 {
5613   struct expand_operand ops[6];
5614   enum insn_code icode;
5615   rtx comparison, rtx_op1, rtx_op2;
5616   machine_mode mode = TYPE_MODE (vec_cond_type);
5617   machine_mode cmp_op_mode;
5618   bool unsignedp;
5619   tree op0a, op0b;
5620   enum tree_code tcode;
5621
5622   if (COMPARISON_CLASS_P (op0))
5623     {
5624       op0a = TREE_OPERAND (op0, 0);
5625       op0b = TREE_OPERAND (op0, 1);
5626       tcode = TREE_CODE (op0);
5627     }
5628   else
5629     {
5630       gcc_assert (VECTOR_BOOLEAN_TYPE_P (TREE_TYPE (op0)));
5631       if (get_vcond_mask_icode (mode, TYPE_MODE (TREE_TYPE (op0)))
5632           != CODE_FOR_nothing)
5633         return expand_vec_cond_mask_expr (vec_cond_type, op0, op1,
5634                                           op2, target);
5635       /* Fake op0 < 0.  */
5636       else
5637         {
5638           gcc_assert (GET_MODE_CLASS (TYPE_MODE (TREE_TYPE (op0)))
5639                       == MODE_VECTOR_INT);
5640           op0a = op0;
5641           op0b = build_zero_cst (TREE_TYPE (op0));
5642           tcode = LT_EXPR;
5643         }
5644     }
5645   cmp_op_mode = TYPE_MODE (TREE_TYPE (op0a));
5646   unsignedp = TYPE_UNSIGNED (TREE_TYPE (op0a));
5647
5648
5649   gcc_assert (GET_MODE_SIZE (mode) == GET_MODE_SIZE (cmp_op_mode)
5650               && GET_MODE_NUNITS (mode) == GET_MODE_NUNITS (cmp_op_mode));
5651
5652   icode = get_vcond_icode (mode, cmp_op_mode, unsignedp);
5653   if (icode == CODE_FOR_nothing)
5654     {
5655       if (tcode == EQ_EXPR || tcode == NE_EXPR)
5656         icode = get_vcond_eq_icode (mode, cmp_op_mode);
5657       if (icode == CODE_FOR_nothing)
5658         return 0;
5659     }
5660
5661   comparison = vector_compare_rtx (VOIDmode, tcode, op0a, op0b, unsignedp,
5662                                    icode, 4);
5663   rtx_op1 = expand_normal (op1);
5664   rtx_op2 = expand_normal (op2);
5665
5666   create_output_operand (&ops[0], target, mode);
5667   create_input_operand (&ops[1], rtx_op1, mode);
5668   create_input_operand (&ops[2], rtx_op2, mode);
5669   create_fixed_operand (&ops[3], comparison);
5670   create_fixed_operand (&ops[4], XEXP (comparison, 0));
5671   create_fixed_operand (&ops[5], XEXP (comparison, 1));
5672   expand_insn (icode, 6, ops);
5673   return ops[0].value;
5674 }
5675
5676 /* Generate insns for a vector comparison into a mask.  */
5677
5678 rtx
5679 expand_vec_cmp_expr (tree type, tree exp, rtx target)
5680 {
5681   struct expand_operand ops[4];
5682   enum insn_code icode;
5683   rtx comparison;
5684   machine_mode mask_mode = TYPE_MODE (type);
5685   machine_mode vmode;
5686   bool unsignedp;
5687   tree op0a, op0b;
5688   enum tree_code tcode;
5689
5690   op0a = TREE_OPERAND (exp, 0);
5691   op0b = TREE_OPERAND (exp, 1);
5692   tcode = TREE_CODE (exp);
5693
5694   unsignedp = TYPE_UNSIGNED (TREE_TYPE (op0a));
5695   vmode = TYPE_MODE (TREE_TYPE (op0a));
5696
5697   icode = get_vec_cmp_icode (vmode, mask_mode, unsignedp);
5698   if (icode == CODE_FOR_nothing)
5699     {
5700       if (tcode == EQ_EXPR || tcode == NE_EXPR)
5701         icode = get_vec_cmp_eq_icode (vmode, mask_mode);
5702       if (icode == CODE_FOR_nothing)
5703         return 0;
5704     }
5705
5706   comparison = vector_compare_rtx (mask_mode, tcode, op0a, op0b,
5707                                    unsignedp, icode, 2);
5708   create_output_operand (&ops[0], target, mask_mode);
5709   create_fixed_operand (&ops[1], comparison);
5710   create_fixed_operand (&ops[2], XEXP (comparison, 0));
5711   create_fixed_operand (&ops[3], XEXP (comparison, 1));
5712   expand_insn (icode, 4, ops);
5713   return ops[0].value;
5714 }
5715
5716 /* Expand a highpart multiply.  */
5717
5718 rtx
5719 expand_mult_highpart (machine_mode mode, rtx op0, rtx op1,
5720                       rtx target, bool uns_p)
5721 {
5722   struct expand_operand eops[3];
5723   enum insn_code icode;
5724   int method, i, nunits;
5725   machine_mode wmode;
5726   rtx m1, m2, perm;
5727   optab tab1, tab2;
5728   rtvec v;
5729
5730   method = can_mult_highpart_p (mode, uns_p);
5731   switch (method)
5732     {
5733     case 0:
5734       return NULL_RTX;
5735     case 1:
5736       tab1 = uns_p ? umul_highpart_optab : smul_highpart_optab;
5737       return expand_binop (mode, tab1, op0, op1, target, uns_p,
5738                            OPTAB_LIB_WIDEN);
5739     case 2:
5740       tab1 = uns_p ? vec_widen_umult_even_optab : vec_widen_smult_even_optab;
5741       tab2 = uns_p ? vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
5742       break;
5743     case 3:
5744       tab1 = uns_p ? vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
5745       tab2 = uns_p ? vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
5746       if (BYTES_BIG_ENDIAN)
5747         std::swap (tab1, tab2);
5748       break;
5749     default:
5750       gcc_unreachable ();
5751     }
5752
5753   icode = optab_handler (tab1, mode);
5754   nunits = GET_MODE_NUNITS (mode);
5755   wmode = insn_data[icode].operand[0].mode;
5756   gcc_checking_assert (2 * GET_MODE_NUNITS (wmode) == nunits);
5757   gcc_checking_assert (GET_MODE_SIZE (wmode) == GET_MODE_SIZE (mode));
5758
5759   create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
5760   create_input_operand (&eops[1], op0, mode);
5761   create_input_operand (&eops[2], op1, mode);
5762   expand_insn (icode, 3, eops);
5763   m1 = gen_lowpart (mode, eops[0].value);
5764
5765   create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
5766   create_input_operand (&eops[1], op0, mode);
5767   create_input_operand (&eops[2], op1, mode);
5768   expand_insn (optab_handler (tab2, mode), 3, eops);
5769   m2 = gen_lowpart (mode, eops[0].value);
5770
5771   v = rtvec_alloc (nunits);
5772   if (method == 2)
5773     {
5774       for (i = 0; i < nunits; ++i)
5775         RTVEC_ELT (v, i) = GEN_INT (!BYTES_BIG_ENDIAN + (i & ~1)
5776                                     + ((i & 1) ? nunits : 0));
5777     }
5778   else
5779     {
5780       for (i = 0; i < nunits; ++i)
5781         RTVEC_ELT (v, i) = GEN_INT (2 * i + (BYTES_BIG_ENDIAN ? 0 : 1));
5782     }
5783   perm = gen_rtx_CONST_VECTOR (mode, v);
5784
5785   return expand_vec_perm (mode, m1, m2, perm, target);
5786 }
5787 \f
5788 /* Helper function to find the MODE_CC set in a sync_compare_and_swap
5789    pattern.  */
5790
5791 static void
5792 find_cc_set (rtx x, const_rtx pat, void *data)
5793 {
5794   if (REG_P (x) && GET_MODE_CLASS (GET_MODE (x)) == MODE_CC
5795       && GET_CODE (pat) == SET)
5796     {
5797       rtx *p_cc_reg = (rtx *) data;
5798       gcc_assert (!*p_cc_reg);
5799       *p_cc_reg = x;
5800     }
5801 }
5802
5803 /* This is a helper function for the other atomic operations.  This function
5804    emits a loop that contains SEQ that iterates until a compare-and-swap
5805    operation at the end succeeds.  MEM is the memory to be modified.  SEQ is
5806    a set of instructions that takes a value from OLD_REG as an input and
5807    produces a value in NEW_REG as an output.  Before SEQ, OLD_REG will be
5808    set to the current contents of MEM.  After SEQ, a compare-and-swap will
5809    attempt to update MEM with NEW_REG.  The function returns true when the
5810    loop was generated successfully.  It returns false if the
        compare-and-swap could not be expanded; the insns emitted up to that
        point are not removed by this function.  SEQ may be null, in which
        case nothing is emitted between the copy into OLD_REG and the
        compare-and-swap.  */
5811
5812 static bool
5813 expand_compare_and_swap_loop (rtx mem, rtx old_reg, rtx new_reg, rtx seq)
5814 {
5815   machine_mode mode = GET_MODE (mem);
5816   rtx_code_label *label;
5817   rtx cmp_reg, success, oldval;
5818
5819   /* The loop we want to generate looks like
5820
5821         cmp_reg = mem;
5822       label:
5823         old_reg = cmp_reg;
5824         seq;
5825         (success, cmp_reg) = compare-and-swap(mem, old_reg, new_reg)
5826         if (!success)
5827           goto label;
5828
5829      Note that we only do the plain load from memory once.  Subsequent
5830      iterations use the value loaded by the compare-and-swap pattern.  */
5831
5832   label = gen_label_rtx ();
5833   cmp_reg = gen_reg_rtx (mode);
5834
5835   emit_move_insn (cmp_reg, mem);
5836   emit_label (label);
5837   emit_move_insn (old_reg, cmp_reg);
5838   if (seq)
5839     emit_insn (seq);
5840
       /* Ask for the old value to be delivered in CMP_REG; the expander may
          substitute different rtxes for SUCCESS and OLDVAL.  */
5841   success = NULL_RTX;
5842   oldval = cmp_reg;
5843   if (!expand_atomic_compare_and_swap (&success, &oldval, mem, old_reg,
5844                                        new_reg, false, MEMMODEL_SYNC_SEQ_CST,
5845                                        MEMMODEL_RELAXED))
5846     return false;
5847
       /* If the old value ended up elsewhere, copy it into CMP_REG so the
          next iteration picks it up.  */
5848   if (oldval != cmp_reg)
5849     emit_move_insn (cmp_reg, oldval);
5850
       /* Branch back to LABEL while SUCCESS compares equal to zero, i.e.
          while the compare-and-swap has not succeeded.  */
5851   /* Mark this jump predicted not taken.  */
5852   emit_cmp_and_jump_insns (success, const0_rtx, EQ, const0_rtx,
5853                            GET_MODE (success), 1, label,
5854                            profile_probability::guessed_never ());
5855   return true;
5856 }
5857
5858
5859 /* This function tries to emit an atomic_exchange intruction.  VAL is written
5860    to *MEM using memory model MODEL. The previous contents of *MEM are returned,
5861    using TARGET if possible.  */
5862
5863 static rtx
5864 maybe_emit_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
5865 {
5866   machine_mode mode = GET_MODE (mem);
5867   enum insn_code icode;
5868
5869   /* If the target supports the exchange directly, great.  */
5870   icode = direct_optab_handler (atomic_exchange_optab, mode);
5871   if (icode != CODE_FOR_nothing)
5872     {
5873       struct expand_operand ops[4];
5874
5875       create_output_operand (&ops[0], target, mode);
5876       create_fixed_operand (&ops[1], mem);
5877       create_input_operand (&ops[2], val, mode);
5878       create_integer_operand (&ops[3], model);
5879       if (maybe_expand_insn (icode, 4, ops))
5880         return ops[0].value;
5881     }
5882
5883   return NULL_RTX;
5884 }
5885
5886 /* This function tries to implement an atomic exchange operation using
5887    __sync_lock_test_and_set. VAL is written to *MEM using memory model MODEL.
5888    The previous contents of *MEM are returned, using TARGET if possible.
5889    Since this instructionn is an acquire barrier only, stronger memory
5890    models may require additional barriers to be emitted.  */
5891
5892 static rtx
5893 maybe_emit_sync_lock_test_and_set (rtx target, rtx mem, rtx val,
5894                                    enum memmodel model)
5895 {
5896   machine_mode mode = GET_MODE (mem);
5897   enum insn_code icode;
5898   rtx_insn *last_insn = get_last_insn ();
5899
5900   icode = optab_handler (sync_lock_test_and_set_optab, mode);
5901
5902   /* Legacy sync_lock_test_and_set is an acquire barrier.  If the pattern
5903      exists, and the memory model is stronger than acquire, add a release
5904      barrier before the instruction.  */
5905
5906   if (is_mm_seq_cst (model) || is_mm_release (model) || is_mm_acq_rel (model))
5907     expand_mem_thread_fence (model);
5908
5909   if (icode != CODE_FOR_nothing)
5910     {
5911       struct expand_operand ops[3];
5912       create_output_operand (&ops[0], target, mode);
5913       create_fixed_operand (&ops[1], mem);
5914       create_input_operand (&ops[2], val, mode);
5915       if (maybe_expand_insn (icode, 3, ops))
5916         return ops[0].value;
5917     }
5918
5919   /* If an external test-and-set libcall is provided, use that instead of
5920      any external compare-and-swap that we might get from the compare-and-
5921      swap-loop expansion later.  */
5922   if (!can_compare_and_swap_p (mode, false))
5923     {
5924       rtx libfunc = optab_libfunc (sync_lock_test_and_set_optab, mode);
5925       if (libfunc != NULL)
5926         {
5927           rtx addr;
5928
5929           addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
5930           return emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
5931                                           mode, 2, addr, ptr_mode,
5932                                           val, mode);
5933         }
5934     }
5935
5936   /* If the test_and_set can't be emitted, eliminate any barrier that might
5937      have been emitted.  */
5938   delete_insns_since (last_insn);
5939   return NULL_RTX;
5940 }
5941
5942 /* This function tries to implement an atomic exchange operation using a
5943    compare_and_swap loop. VAL is written to *MEM.  The previous contents of
5944    *MEM are returned, using TARGET if possible.  No memory model is required
5945    since a compare_and_swap loop is seq-cst.  */
5946
5947 static rtx
5948 maybe_emit_compare_and_swap_exchange_loop (rtx target, rtx mem, rtx val)
5949 {
5950   machine_mode mode = GET_MODE (mem);
5951
5952   if (can_compare_and_swap_p (mode, true))
5953     {
5954       if (!target || !register_operand (target, mode))
5955         target = gen_reg_rtx (mode);
5956       if (expand_compare_and_swap_loop (mem, target, val, NULL_RTX))
5957         return target;
5958     }
5959
5960   return NULL_RTX;
5961 }
5962
5963 /* This function tries to implement an atomic test-and-set operation
5964    using the atomic_test_and_set instruction pattern.  A boolean value
5965    is returned from the operation, using TARGET if possible.  */
5966
5967 static rtx
5968 maybe_emit_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
5969 {
5970   machine_mode pat_bool_mode;
5971   struct expand_operand ops[3];
5972
5973   if (!targetm.have_atomic_test_and_set ())
5974     return NULL_RTX;
5975
5976   /* While we always get QImode from __atomic_test_and_set, we get
5977      other memory modes from __sync_lock_test_and_set.  Note that we
5978      use no endian adjustment here.  This matches the 4.6 behavior
5979      in the Sparc backend.  */
5980   enum insn_code icode = targetm.code_for_atomic_test_and_set;
5981   gcc_checking_assert (insn_data[icode].operand[1].mode == QImode);
5982   if (GET_MODE (mem) != QImode)
5983     mem = adjust_address_nv (mem, QImode, 0);
5984
5985   pat_bool_mode = insn_data[icode].operand[0].mode;
5986   create_output_operand (&ops[0], target, pat_bool_mode);
5987   create_fixed_operand (&ops[1], mem);
5988   create_integer_operand (&ops[2], model);
5989
5990   if (maybe_expand_insn (icode, 3, ops))
5991     return ops[0].value;
5992   return NULL_RTX;
5993 }
5994
5995 /* This function expands the legacy _sync_lock test_and_set operation which is
5996    generally an atomic exchange.  Some limited targets only allow the
5997    constant 1 to be stored.  This is an ACQUIRE operation.
5998
5999    TARGET is an optional place to stick the return value.
6000    MEM is where VAL is stored.  */
6001
6002 rtx
6003 expand_sync_lock_test_and_set (rtx target, rtx mem, rtx val)
6004 {
6005   rtx ret;
6006
6007   /* Try an atomic_exchange first.  */
6008   ret = maybe_emit_atomic_exchange (target, mem, val, MEMMODEL_SYNC_ACQUIRE);
6009   if (ret)
6010     return ret;
6011
6012   ret = maybe_emit_sync_lock_test_and_set (target, mem, val,
6013                                            MEMMODEL_SYNC_ACQUIRE);
6014   if (ret)
6015     return ret;
6016
6017   ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
6018   if (ret)
6019     return ret;
6020
6021   /* If there are no other options, try atomic_test_and_set if the value
6022      being stored is 1.  */
6023   if (val == const1_rtx)
6024     ret = maybe_emit_atomic_test_and_set (target, mem, MEMMODEL_SYNC_ACQUIRE);
6025
6026   return ret;
6027 }
6028
6029 /* This function expands the atomic test_and_set operation:
6030    atomically store a boolean TRUE into MEM and return the previous value.
6031
6032    MEMMODEL is the memory model variant to use.
6033    TARGET is an optional place to stick the return value.  */
6034
6035 rtx
6036 expand_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
6037 {
6038   machine_mode mode = GET_MODE (mem);
6039   rtx ret, trueval, subtarget;
6040
6041   ret = maybe_emit_atomic_test_and_set (target, mem, model);
6042   if (ret)
6043     return ret;
6044
6045   /* Be binary compatible with non-default settings of trueval, and different
6046      cpu revisions.  E.g. one revision may have atomic-test-and-set, but
6047      another only has atomic-exchange.  */
6048   if (targetm.atomic_test_and_set_trueval == 1)
6049     {
6050       trueval = const1_rtx;
6051       subtarget = target ? target : gen_reg_rtx (mode);
6052     }
6053   else
6054     {
6055       trueval = gen_int_mode (targetm.atomic_test_and_set_trueval, mode);
6056       subtarget = gen_reg_rtx (mode);
6057     }
6058
6059   /* Try the atomic-exchange optab...  */
6060   ret = maybe_emit_atomic_exchange (subtarget, mem, trueval, model);
6061
6062   /* ... then an atomic-compare-and-swap loop ... */
6063   if (!ret)
6064     ret = maybe_emit_compare_and_swap_exchange_loop (subtarget, mem, trueval);
6065
6066   /* ... before trying the vaguely defined legacy lock_test_and_set. */
6067   if (!ret)
6068     ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, trueval, model);
6069
6070   /* Recall that the legacy lock_test_and_set optab was allowed to do magic
6071      things with the value 1.  Thus we try again without trueval.  */
6072   if (!ret && targetm.atomic_test_and_set_trueval != 1)
6073     ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, const1_rtx, model);
6074
6075   /* Failing all else, assume a single threaded environment and simply
6076      perform the operation.  */
6077   if (!ret)
6078     {
6079       /* If the result is ignored skip the move to target.  */
6080       if (subtarget != const0_rtx)
6081         emit_move_insn (subtarget, mem);
6082
6083       emit_move_insn (mem, trueval);
6084       ret = subtarget;
6085     }
6086
6087   /* Recall that have to return a boolean value; rectify if trueval
6088      is not exactly one.  */
6089   if (targetm.atomic_test_and_set_trueval != 1)
6090     ret = emit_store_flag_force (target, NE, ret, const0_rtx, mode, 0, 1);
6091
6092   return ret;
6093 }
6094
6095 /* This function expands the atomic exchange operation:
6096    atomically store VAL in MEM and return the previous value in MEM.
6097
6098    MEMMODEL is the memory model variant to use.
6099    TARGET is an optional place to stick the return value.  */
6100
6101 rtx
6102 expand_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
6103 {
6104   machine_mode mode = GET_MODE (mem);
6105   rtx ret;
6106
6107   /* If loads are not atomic for the required size and we are not called to
6108      provide a __sync builtin, do not do anything so that we stay consistent
6109      with atomic loads of the same size.  */
6110   if (!can_atomic_load_p (mode) && !is_mm_sync (model))
6111     return NULL_RTX;
6112
6113   ret = maybe_emit_atomic_exchange (target, mem, val, model);
6114
6115   /* Next try a compare-and-swap loop for the exchange.  */
6116   if (!ret)
6117     ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
6118
6119   return ret;
6120 }
6121
6122 /* This function expands the atomic compare exchange operation:
6123
6124    *PTARGET_BOOL is an optional place to store the boolean success/failure.
6125    *PTARGET_OVAL is an optional place to store the old value from memory.
6126    Both target parameters may be NULL or const0_rtx to indicate that we do
6127    not care about that return value.  Both target parameters are updated on
6128    success to the actual location of the corresponding result.
6129
6130    MEMMODEL is the memory model variant to use.
6131
6132    The return value of the function is true for success.  */
6133
6134 bool
6135 expand_atomic_compare_and_swap (rtx *ptarget_bool, rtx *ptarget_oval,
6136                                 rtx mem, rtx expected, rtx desired,
6137                                 bool is_weak, enum memmodel succ_model,
6138                                 enum memmodel fail_model)
6139 {
6140   machine_mode mode = GET_MODE (mem);
6141   struct expand_operand ops[8];
6142   enum insn_code icode;
6143   rtx target_oval, target_bool = NULL_RTX;
6144   rtx libfunc;
6145
6146   /* If loads are not atomic for the required size and we are not called to
6147      provide a __sync builtin, do not do anything so that we stay consistent
6148      with atomic loads of the same size.  */
6149   if (!can_atomic_load_p (mode) && !is_mm_sync (succ_model))
6150     return false;
6151
6152   /* Load expected into a register for the compare and swap.  */
6153   if (MEM_P (expected))
6154     expected = copy_to_reg (expected);
6155
6156   /* Make sure we always have some place to put the return oldval.
6157      Further, make sure that place is distinct from the input expected,
6158      just in case we need that path down below.  */
6159   if (ptarget_oval && *ptarget_oval == const0_rtx)
6160     ptarget_oval = NULL;
6161
6162   if (ptarget_oval == NULL
6163       || (target_oval = *ptarget_oval) == NULL
6164       || reg_overlap_mentioned_p (expected, target_oval))
6165     target_oval = gen_reg_rtx (mode);
6166
6167   icode = direct_optab_handler (atomic_compare_and_swap_optab, mode);
6168   if (icode != CODE_FOR_nothing)
6169     {
6170       machine_mode bool_mode = insn_data[icode].operand[0].mode;
6171
6172       if (ptarget_bool && *ptarget_bool == const0_rtx)
6173         ptarget_bool = NULL;
6174
6175       /* Make sure we always have a place for the bool operand.  */
6176       if (ptarget_bool == NULL
6177           || (target_bool = *ptarget_bool) == NULL
6178           || GET_MODE (target_bool) != bool_mode)
6179         target_bool = gen_reg_rtx (bool_mode);
6180
6181       /* Emit the compare_and_swap.  */
6182       create_output_operand (&ops[0], target_bool, bool_mode);
6183       create_output_operand (&ops[1], target_oval, mode);
6184       create_fixed_operand (&ops[2], mem);
6185       create_input_operand (&ops[3], expected, mode);
6186       create_input_operand (&ops[4], desired, mode);
6187       create_integer_operand (&ops[5], is_weak);
6188       create_integer_operand (&ops[6], succ_model);
6189       create_integer_operand (&ops[7], fail_model);
6190       if (maybe_expand_insn (icode, 8, ops))
6191         {
6192           /* Return success/failure.  */
6193           target_bool = ops[0].value;
6194           target_oval = ops[1].value;
6195           goto success;
6196         }
6197     }
6198
6199   /* Otherwise fall back to the original __sync_val_compare_and_swap
6200      which is always seq-cst.  */
6201   icode = optab_handler (sync_compare_and_swap_optab, mode);
6202   if (icode != CODE_FOR_nothing)
6203     {
6204       rtx cc_reg;
6205
6206       create_output_operand (&ops[0], target_oval, mode);
6207       create_fixed_operand (&ops[1], mem);
6208       create_input_operand (&ops[2], expected, mode);
6209       create_input_operand (&ops[3], desired, mode);
6210       if (!maybe_expand_insn (icode, 4, ops))
6211         return false;
6212
6213       target_oval = ops[0].value;
6214
6215       /* If the caller isn't interested in the boolean return value,
6216          skip the computation of it.  */
6217       if (ptarget_bool == NULL)
6218         goto success;
6219
6220       /* Otherwise, work out if the compare-and-swap succeeded.  */
6221       cc_reg = NULL_RTX;
6222       if (have_insn_for (COMPARE, CCmode))
6223         note_stores (PATTERN (get_last_insn ()), find_cc_set, &cc_reg);
6224       if (cc_reg)
6225         {
6226           target_bool = emit_store_flag_force (target_bool, EQ, cc_reg,
6227                                                const0_rtx, VOIDmode, 0, 1);
6228           goto success;
6229         }
6230       goto success_bool_from_val;
6231     }
6232
6233   /* Also check for library support for __sync_val_compare_and_swap.  */
6234   libfunc = optab_libfunc (sync_compare_and_swap_optab, mode);
6235   if (libfunc != NULL)
6236     {
6237       rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
6238       rtx target = emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
6239                                             mode, 3, addr, ptr_mode,
6240                                             expected, mode, desired, mode);
6241       emit_move_insn (target_oval, target);
6242
6243       /* Compute the boolean return value only if requested.  */
6244       if (ptarget_bool)
6245         goto success_bool_from_val;
6246       else
6247         goto success;
6248     }
6249
6250   /* Failure.  */
6251   return false;
6252
6253  success_bool_from_val:
6254    target_bool = emit_store_flag_force (target_bool, EQ, target_oval,
6255                                         expected, VOIDmode, 1, 1);
6256  success:
6257   /* Make sure that the oval output winds up where the caller asked.  */
6258   if (ptarget_oval)
6259     *ptarget_oval = target_oval;
6260   if (ptarget_bool)
6261     *ptarget_bool = target_bool;
6262   return true;
6263 }
6264
6265 /* Generate asm volatile("" : : : "memory") as the memory barrier.  */
6266
6267 static void
6268 expand_asm_memory_barrier (void)
6269 {
6270   rtx asm_op, clob;
6271
6272   asm_op = gen_rtx_ASM_OPERANDS (VOIDmode, "", "", 0,
6273                                  rtvec_alloc (0), rtvec_alloc (0),
6274                                  rtvec_alloc (0), UNKNOWN_LOCATION);
6275   MEM_VOLATILE_P (asm_op) = 1;
6276
6277   clob = gen_rtx_SCRATCH (VOIDmode);
6278   clob = gen_rtx_MEM (BLKmode, clob);
6279   clob = gen_rtx_CLOBBER (VOIDmode, clob);
6280
6281   emit_insn (gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, asm_op, clob)));
6282 }
6283
6284 /* This routine will either emit the mem_thread_fence pattern or issue a
6285    sync_synchronize to generate a fence for memory model MEMMODEL.  */
6286
6287 void
6288 expand_mem_thread_fence (enum memmodel model)
6289 {
6290   if (is_mm_relaxed (model))
6291     return;
6292   if (targetm.have_mem_thread_fence ())
6293     {
6294       emit_insn (targetm.gen_mem_thread_fence (GEN_INT (model)));
6295       expand_asm_memory_barrier ();
6296     }
6297   else if (targetm.have_memory_barrier ())
6298     emit_insn (targetm.gen_memory_barrier ());
6299   else if (synchronize_libfunc != NULL_RTX)
6300     emit_library_call (synchronize_libfunc, LCT_NORMAL, VOIDmode, 0);
6301   else
6302     expand_asm_memory_barrier ();
6303 }
6304
6305 /* This routine will either emit the mem_signal_fence pattern or issue a
6306    sync_synchronize to generate a fence for memory model MEMMODEL.  */
6307
6308 void
6309 expand_mem_signal_fence (enum memmodel model)
6310 {
6311   if (targetm.have_mem_signal_fence ())
6312     emit_insn (targetm.gen_mem_signal_fence (GEN_INT (model)));
6313   else if (!is_mm_relaxed (model))
6314     {
6315       /* By default targets are coherent between a thread and the signal
6316          handler running on the same thread.  Thus this really becomes a
6317          compiler barrier, in that stores must not be sunk past
6318          (or raised above) a given point.  */
6319       expand_asm_memory_barrier ();
6320     }
6321 }
6322
6323 /* This function expands the atomic load operation:
6324    return the atomically loaded value in MEM.
6325
6326    MEMMODEL is the memory model variant to use.
6327    TARGET is an option place to stick the return value.  */
6328
6329 rtx
6330 expand_atomic_load (rtx target, rtx mem, enum memmodel model)
6331 {
6332   machine_mode mode = GET_MODE (mem);
6333   enum insn_code icode;
6334
6335   /* If the target supports the load directly, great.  */
6336   icode = direct_optab_handler (atomic_load_optab, mode);
6337   if (icode != CODE_FOR_nothing)
6338     {
6339       struct expand_operand ops[3];
6340
6341       create_output_operand (&ops[0], target, mode);
6342       create_fixed_operand (&ops[1], mem);
6343       create_integer_operand (&ops[2], model);
6344       if (maybe_expand_insn (icode, 3, ops))
6345         return ops[0].value;
6346     }
6347
6348   /* If the size of the object is greater than word size on this target,
6349      then we assume that a load will not be atomic.  We could try to
6350      emulate a load with a compare-and-swap operation, but the store that
6351      doing this could result in would be incorrect if this is a volatile
6352      atomic load or targetting read-only-mapped memory.  */
6353   if (GET_MODE_PRECISION (mode) > BITS_PER_WORD)
6354     /* If there is no atomic load, leave the library call.  */
6355     return NULL_RTX;
6356
6357   /* Otherwise assume loads are atomic, and emit the proper barriers.  */
6358   if (!target || target == const0_rtx)
6359     target = gen_reg_rtx (mode);
6360
6361   /* For SEQ_CST, emit a barrier before the load.  */
6362   if (is_mm_seq_cst (model))
6363     expand_mem_thread_fence (model);
6364
6365   emit_move_insn (target, mem);
6366
6367   /* Emit the appropriate barrier after the load.  */
6368   expand_mem_thread_fence (model);
6369
6370   return target;
6371 }
6372
6373 /* This function expands the atomic store operation:
6374    Atomically store VAL in MEM.
6375    MEMMODEL is the memory model variant to use.
6376    USE_RELEASE is true if __sync_lock_release can be used as a fall back.
6377    function returns const0_rtx if a pattern was emitted.  */
6378
6379 rtx
6380 expand_atomic_store (rtx mem, rtx val, enum memmodel model, bool use_release)
6381 {
6382   machine_mode mode = GET_MODE (mem);
6383   enum insn_code icode;
6384   struct expand_operand ops[3];
6385
6386   /* If the target supports the store directly, great.  */
6387   icode = direct_optab_handler (atomic_store_optab, mode);
6388   if (icode != CODE_FOR_nothing)
6389     {
6390       create_fixed_operand (&ops[0], mem);
6391       create_input_operand (&ops[1], val, mode);
6392       create_integer_operand (&ops[2], model);
6393       if (maybe_expand_insn (icode, 3, ops))
6394         return const0_rtx;
6395     }
6396
6397   /* If using __sync_lock_release is a viable alternative, try it.
6398      Note that this will not be set to true if we are expanding a generic
6399      __atomic_store_n.  */
6400   if (use_release)
6401     {
6402       icode = direct_optab_handler (sync_lock_release_optab, mode);
6403       if (icode != CODE_FOR_nothing)
6404         {
6405           create_fixed_operand (&ops[0], mem);
6406           create_input_operand (&ops[1], const0_rtx, mode);
6407           if (maybe_expand_insn (icode, 2, ops))
6408             {
6409               /* lock_release is only a release barrier.  */
6410               if (is_mm_seq_cst (model))
6411                 expand_mem_thread_fence (model);
6412               return const0_rtx;
6413             }
6414         }
6415     }
6416
6417   /* If the size of the object is greater than word size on this target,
6418      a default store will not be atomic.  */
6419   if (GET_MODE_PRECISION (mode) > BITS_PER_WORD)
6420     {
6421       /* If loads are atomic or we are called to provide a __sync builtin,
6422          we can try a atomic_exchange and throw away the result.  Otherwise,
6423          don't do anything so that we do not create an inconsistency between
6424          loads and stores.  */
6425       if (can_atomic_load_p (mode) || is_mm_sync (model))
6426         {
6427           rtx target = maybe_emit_atomic_exchange (NULL_RTX, mem, val, model);
6428           if (!target)
6429             target = maybe_emit_compare_and_swap_exchange_loop (NULL_RTX, mem,
6430                                                                 val);
6431           if (target)
6432             return const0_rtx;
6433         }
6434         return NULL_RTX;
6435     }
6436
6437   /* Otherwise assume stores are atomic, and emit the proper barriers.  */
6438   expand_mem_thread_fence (model);
6439
6440   emit_move_insn (mem, val);
6441
6442   /* For SEQ_CST, also emit a barrier after the store.  */
6443   if (is_mm_seq_cst (model))
6444     expand_mem_thread_fence (model);
6445
6446   return const0_rtx;
6447 }
6448
6449
/* Structure containing the optabs and values required to process the
   various forms of the atomic_fetch_op and atomic_op_fetch builtins.
   It is filled in by get_atomic_op_for_code and read by maybe_emit_op.  */

struct atomic_op_functions
{
  /* atomic_fetch_OP optab: tried when a memory model is used and the
     value before the operation is wanted.  */
  direct_optab mem_fetch_before;
  /* atomic_OP_fetch optab: tried when a memory model is used and the
     value after the operation is wanted.  */
  direct_optab mem_fetch_after;
  /* atomic_OP optab: tried when a memory model is used and the result
     is unused.  */
  direct_optab mem_no_result;
  /* sync_old_OP optab: no memory model, value before the operation.  */
  optab fetch_before;
  /* sync_new_OP optab: no memory model, value after the operation.  */
  optab fetch_after;
  /* sync_OP optab: no memory model, result unused.  */
  direct_optab no_result;
  /* MINUS for PLUS, PLUS for MINUS, XOR for XOR; UNKNOWN for AND, IOR
     and NOT.  NOTE(review): presumably the code that undoes the
     operation, used to derive one of the before/after values from the
     other -- the consumer is not visible here, confirm.  */
  enum rtx_code reverse_code;
};
6463
6464
6465 /* Fill in structure pointed to by OP with the various optab entries for an
6466    operation of type CODE.  */
6467
6468 static void
6469 get_atomic_op_for_code (struct atomic_op_functions *op, enum rtx_code code)
6470 {
6471   gcc_assert (op!= NULL);
6472
6473   /* If SWITCHABLE_TARGET is defined, then subtargets can be switched
6474      in the source code during compilation, and the optab entries are not
6475      computable until runtime.  Fill in the values at runtime.  */
6476   switch (code)
6477     {
6478     case PLUS:
6479       op->mem_fetch_before = atomic_fetch_add_optab;
6480       op->mem_fetch_after = atomic_add_fetch_optab;
6481       op->mem_no_result = atomic_add_optab;
6482       op->fetch_before = sync_old_add_optab;
6483       op->fetch_after = sync_new_add_optab;
6484       op->no_result = sync_add_optab;
6485       op->reverse_code = MINUS;
6486       break;
6487     case MINUS:
6488       op->mem_fetch_before = atomic_fetch_sub_optab;
6489       op->mem_fetch_after = atomic_sub_fetch_optab;
6490       op->mem_no_result = atomic_sub_optab;
6491       op->fetch_before = sync_old_sub_optab;
6492       op->fetch_after = sync_new_sub_optab;
6493       op->no_result = sync_sub_optab;
6494       op->reverse_code = PLUS;
6495       break;
6496     case XOR:
6497       op->mem_fetch_before = atomic_fetch_xor_optab;
6498       op->mem_fetch_after = atomic_xor_fetch_optab;
6499       op->mem_no_result = atomic_xor_optab;
6500       op->fetch_before = sync_old_xor_optab;
6501       op->fetch_after = sync_new_xor_optab;
6502       op->no_result = sync_xor_optab;
6503       op->reverse_code = XOR;
6504       break;
6505     case AND:
6506       op->mem_fetch_before = atomic_fetch_and_optab;
6507       op->mem_fetch_after = atomic_and_fetch_optab;
6508       op->mem_no_result = atomic_and_optab;
6509       op->fetch_before = sync_old_and_optab;
6510       op->fetch_after = sync_new_and_optab;
6511       op->no_result = sync_and_optab;
6512       op->reverse_code = UNKNOWN;
6513       break;
6514     case IOR:
6515       op->mem_fetch_before = atomic_fetch_or_optab;
6516       op->mem_fetch_after = atomic_or_fetch_optab;
6517       op->mem_no_result = atomic_or_optab;
6518       op->fetch_before = sync_old_ior_optab;
6519       op->fetch_after = sync_new_ior_optab;
6520       op->no_result = sync_ior_optab;
6521       op->reverse_code = UNKNOWN;
6522       break;
6523     case NOT:
6524       op->mem_fetch_before = atomic_fetch_nand_optab;
6525       op->mem_fetch_after = atomic_nand_fetch_optab;
6526       op->mem_no_result = atomic_nand_optab;
6527       op->fetch_before = sync_old_nand_optab;
6528       op->fetch_after = sync_new_nand_optab;
6529       op->no_result = sync_nand_optab;
6530       op->reverse_code = UNKNOWN;
6531       break;
6532     default:
6533       gcc_unreachable ();
6534     }
6535 }
6536
6537 /* See if there is a more optimal way to implement the operation "*MEM CODE VAL"
6538    using memory order MODEL.  If AFTER is true the operation needs to return
6539    the value of *MEM after the operation, otherwise the previous value.
6540    TARGET is an optional place to place the result.  The result is unused if
6541    it is const0_rtx.
6542    Return the result if there is a better sequence, otherwise NULL_RTX.  */
6543
6544 static rtx
6545 maybe_optimize_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
6546                          enum memmodel model, bool after)
6547 {
6548   /* If the value is prefetched, or not used, it may be possible to replace
6549      the sequence with a native exchange operation.  */
6550   if (!after || target == const0_rtx)
6551     {
6552       /* fetch_and (&x, 0, m) can be replaced with exchange (&x, 0, m).  */
6553       if (code == AND && val == const0_rtx)
6554         {
6555           if (target == const0_rtx)
6556             target = gen_reg_rtx (GET_MODE (mem));
6557           return maybe_emit_atomic_exchange (target, mem, val, model);
6558         }
6559
6560       /* fetch_or (&x, -1, m) can be replaced with exchange (&x, -1, m).  */
6561       if (code == IOR && val == constm1_rtx)
6562         {
6563           if (target == const0_rtx)
6564             target = gen_reg_rtx (GET_MODE (mem));
6565           return maybe_emit_atomic_exchange (target, mem, val, model);
6566         }
6567     }
6568
6569   return NULL_RTX;
6570 }
6571
6572 /* Try to emit an instruction for a specific operation varaition.
6573    OPTAB contains the OP functions.
6574    TARGET is an optional place to return the result. const0_rtx means unused.
6575    MEM is the memory location to operate on.
6576    VAL is the value to use in the operation.
6577    USE_MEMMODEL is TRUE if the variation with a memory model should be tried.
6578    MODEL is the memory model, if used.
6579    AFTER is true if the returned result is the value after the operation.  */
6580
6581 static rtx
6582 maybe_emit_op (const struct atomic_op_functions *optab, rtx target, rtx mem,
6583                rtx val, bool use_memmodel, enum memmodel model, bool after)
6584 {
6585   machine_mode mode = GET_MODE (mem);
6586   struct expand_operand ops[4];
6587   enum insn_code icode;
6588   int op_counter = 0;   /* Index of the next OPS slot to fill.  */
6589   int num_ops;          /* Number of operands the chosen pattern takes.  */
6590
6591   /* No result is wanted: the operands are MEM, VAL and optionally MODEL.  */
6592   if (target == const0_rtx)
6593     {
6594       if (use_memmodel)
6595         {
6596           icode = direct_optab_handler (optab->mem_no_result, mode);
6597           create_integer_operand (&ops[2], model);
6598           num_ops = 3;
6599         }
6600       else
6601         {
6602           icode = direct_optab_handler (optab->no_result, mode);
6603           num_ops = 2;
6604         }
6605     }
6606   /* Otherwise operand 0 is the result; MEM, VAL and any MODEL follow.  */
6607   else
6608     {
6609       if (use_memmodel)
6610         {
6611           icode = direct_optab_handler (after ? optab->mem_fetch_after
6612                                         : optab->mem_fetch_before, mode);
6613           create_integer_operand (&ops[3], model);
6614           num_ops = 4;
6615         }
6616       else
6617         {
6618           icode = optab_handler (after ? optab->fetch_after
6619                                  : optab->fetch_before, mode);
6620           num_ops = 3;
6621         }
6622       create_output_operand (&ops[op_counter++], target, mode);
6623     }
6624   if (icode == CODE_FOR_nothing)
6625     return NULL_RTX;   /* No such pattern for MODE.  */
6626
6627   create_fixed_operand (&ops[op_counter++], mem);
6628   /* VAL may have been promoted to a wider mode.  Shrink it if so.  */
6629   create_convert_operand_to (&ops[op_counter++], val, mode, true);
6630
6631   if (maybe_expand_insn (icode, num_ops, ops))
6632     return (target == const0_rtx ? const0_rtx : ops[0].value);
6633   /* The pattern could not be generated for these operands.  */
6634   return NULL_RTX;
6635 }
6636
6637
6638 /* Expand an atomic fetch_OP or OP_fetch operation: atomically fetch MEM,
6639    perform the operation with VAL and store the result back to MEM.
6640    TARGET is an optional place to stick the return value; const0_rtx
6641    indicates the result is unused.
6642    CODE is the operation being performed (OP).
6643    MODEL is the memory model variant to use.
6644    AFTER is true to return the result of the operation (OP_fetch).
6645    AFTER is false to return the value before the operation (fetch_OP).
6646    Return the result rtx, or NULL_RTX if no direct pattern could be used.
6647    This function will *only* generate instructions if there is a direct
6648    optab.  No compare-and-swap loops or libcalls will be generated.  */
6649
6650 static rtx
6651 expand_atomic_fetch_op_no_fallback (rtx target, rtx mem, rtx val,
6652                                     enum rtx_code code, enum memmodel model,
6653                                     bool after)
6654 {
6655   machine_mode mode = GET_MODE (mem);
6656   struct atomic_op_functions optab;
6657   rtx result;
6658   bool unused_result = (target == const0_rtx);
6659
6660   get_atomic_op_for_code (&optab, code);
6661
6662   /* Check to see if there are any better instructions.  */
6663   result = maybe_optimize_fetch_op (target, mem, val, code, model, after);
6664   if (result)
6665     return result;
6666
6667   /* Check for the case where the result isn't used and try those patterns.  */
6668   if (unused_result)
6669     {
6670       /* Try the memory model variant first.  */
6671       result = maybe_emit_op (&optab, target, mem, val, true, model, true);
6672       if (result)
6673         return result;
6674
6675       /* Next try the old style without a memory model.  */
6676       result = maybe_emit_op (&optab, target, mem, val, false, model, true);
6677       if (result)
6678         return result;
6679
6680       /* There is no no-result pattern, so try patterns with a result.  */
6681       target = NULL_RTX;
6682     }
6683
6684   /* Try the __atomic version.  */
6685   result = maybe_emit_op (&optab, target, mem, val, true, model, after);
6686   if (result)
6687     return result;
6688
6689   /* Try the older __sync version.  */
6690   result = maybe_emit_op (&optab, target, mem, val, false, model, after);
6691   if (result)
6692     return result;
6693
6694   /* If the fetch value can be calculated from the other variation of fetch,
6695      try that operation.  Recovering fetch_before needs a reverse code.  */
6696   if (after || unused_result || optab.reverse_code != UNKNOWN)
6697     {
6698       /* Try the __atomic version, then the older __sync version.  */
6699       result = maybe_emit_op (&optab, target, mem, val, true, model, !after);
6700       if (!result)
6701         result = maybe_emit_op (&optab, target, mem, val, false, model, !after);
6702
6703       if (result)
6704         {
6705           /* If the result isn't used, no need to do compensation code.  */
6706           if (unused_result)
6707             return result;
6708
6709           /* Issue compensation code.  Fetch_after == fetch_before OP val.
6710              Fetch_before == fetch_after REVERSE_OP val.  */
6711           if (!after)
6712             code = optab.reverse_code;
6713           if (code == NOT)   /* Computed as ~(RESULT & VAL).  */
6714             {
6715               result = expand_simple_binop (mode, AND, result, val, NULL_RTX,
6716                                             true, OPTAB_LIB_WIDEN);
6717               result = expand_simple_unop (mode, NOT, result, target, true);
6718             }
6719           else
6720             result = expand_simple_binop (mode, code, result, val, target,
6721                                           true, OPTAB_LIB_WIDEN);
6722           return result;
6723         }
6724     }
6725
6726   /* No direct opcode can be generated.  */
6727   return NULL_RTX;
6728 }
6729
6730
6731
6732 /* Expand an atomic fetch_OP or OP_fetch operation: atomically fetch MEM,
6733    perform operation CODE with VAL and store the result back to MEM.
6734    TARGET is an optional place to stick the return value; const0_rtx
6735    indicates the result is unused.  MODEL is the memory model to use.
6736    AFTER is true to return the result of the operation (OP_fetch).
6737    AFTER is false to return the value before the operation (fetch_OP).
6738    Tried in order: direct patterns, the negated PLUS/MINUS form, __sync
6739    libcalls, a compare-and-swap loop.  Return NULL_RTX if all of them fail.  */
6740 rtx
6741 expand_atomic_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
6742                         enum memmodel model, bool after)
6743 {
6744   machine_mode mode = GET_MODE (mem);
6745   rtx result;
6746   bool unused_result = (target == const0_rtx);
6747
6748   /* If loads are not atomic for the required size and we are not called to
6749      provide a __sync builtin, do not do anything so that we stay consistent
6750      with atomic loads of the same size.  */
6751   if (!can_atomic_load_p (mode) && !is_mm_sync (model))
6752     return NULL_RTX;
6753
6754   result = expand_atomic_fetch_op_no_fallback (target, mem, val, code, model,
6755                                                after);
6756
6757   if (result)
6758     return result;
6759
6760   /* Add/sub can be implemented by doing the reverse operation with -(val).  */
6761   if (code == PLUS || code == MINUS)
6762     {
6763       rtx tmp;
6764       enum rtx_code reverse = (code == PLUS ? MINUS : PLUS);
6765       /* Expand into a pending sequence so a failed try can be dropped.  */
6766       start_sequence ();
6767       tmp = expand_simple_unop (mode, NEG, val, NULL_RTX, true);
6768       result = expand_atomic_fetch_op_no_fallback (target, mem, tmp, reverse,
6769                                                    model, after);
6770       if (result)
6771         {
6772           /* The reverse operation worked, so emit the insns and return.  */
6773           tmp = get_insns ();
6774           end_sequence ();
6775           emit_insn (tmp);
6776           return result;
6777         }
6778
6779       /* It did not work, so throw away the negation code and continue.  */
6780       end_sequence ();
6781     }
6782
6783   /* Try the __sync libcalls only if we can't do compare-and-swap inline.  */
6784   if (!can_compare_and_swap_p (mode, false))
6785     {
6786       rtx libfunc;
6787       bool fixup = false;   /* True when the other fetch variant is called.  */
6788       enum rtx_code orig_code = code;
6789       struct atomic_op_functions optab;
6790
6791       get_atomic_op_for_code (&optab, code);
6792       libfunc = optab_libfunc (after ? optab.fetch_after
6793                                : optab.fetch_before, mode);
6794       if (libfunc == NULL
6795           && (after || unused_result || optab.reverse_code != UNKNOWN))
6796         {
6797           fixup = true;
6798           if (!after)
6799             code = optab.reverse_code;
6800           libfunc = optab_libfunc (after ? optab.fetch_before
6801                                    : optab.fetch_after, mode);
6802         }
6803       if (libfunc != NULL)
6804         {
6805           rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
6806           result = emit_library_call_value (libfunc, NULL, LCT_NORMAL, mode,
6807                                             2, addr, ptr_mode, val, mode);
6808           /* NOTE(review): CODE == NOT is not special-cased here; confirm.  */
6809           if (!unused_result && fixup)
6810             result = expand_simple_binop (mode, code, result, val, target,
6811                                           true, OPTAB_LIB_WIDEN);
6812           return result;
6813         }
6814
6815       /* We need the original code for any further attempts.  */
6816       code = orig_code;
6817     }
6818
6819   /* If nothing else has succeeded, default to a compare and swap loop.  */
6820   if (can_compare_and_swap_p (mode, true))
6821     {
6822       rtx_insn *insn;
6823       rtx t0 = gen_reg_rtx (mode), t1;   /* Values before and after OP.  */
6824
6825       start_sequence ();
6826
6827       /* If the result is used, get a register for it.  */
6828       if (!unused_result)
6829         {
6830           if (!target || !register_operand (target, mode))
6831             target = gen_reg_rtx (mode);
6832           /* If fetch_before, copy the value now.  */
6833           if (!after)
6834             emit_move_insn (target, t0);
6835         }
6836       else
6837         target = const0_rtx;
6838       /* Compute the new value T1 from the old value T0.  */
6839       t1 = t0;
6840       if (code == NOT)   /* Computed as ~(T0 & VAL).  */
6841         {
6842           t1 = expand_simple_binop (mode, AND, t1, val, NULL_RTX,
6843                                     true, OPTAB_LIB_WIDEN);
6844           t1 = expand_simple_unop (mode, code, t1, NULL_RTX, true);
6845         }
6846       else
6847         t1 = expand_simple_binop (mode, code, t1, val, NULL_RTX, true,
6848                                   OPTAB_LIB_WIDEN);
6849
6850       /* For after, copy the value now.  */
6851       if (!unused_result && after)
6852         emit_move_insn (target, t1);
6853       insn = get_insns ();
6854       end_sequence ();
6855       /* NOTE(review): T1 is tested for NULL only after its use above.  */
6856       if (t1 != NULL && expand_compare_and_swap_loop (mem, t0, t1, insn))
6857         return target;
6858     }
6859
6860   return NULL_RTX;
6861 }
6862 \f
6863 /* Return true if OPERAND satisfies operand OPNO's predicate in ICODE.  */
6864
6865 bool
6866 insn_operand_matches (enum insn_code icode, unsigned int opno, rtx operand)
6867 {
6868   if (!insn_data[(int) icode].operand[opno].predicate)
6869     return true;   /* No predicate: anything matches.  */
6870   return (insn_data[(int) icode].operand[opno].predicate
6871           (operand, insn_data[(int) icode].operand[opno].mode));
6872 }
6873 \f
6874 /* Return true if TARGET can be the destination of a multiword operation
6875    that is carried out one word at a time, i.e. if every word_mode subreg
6876    of TARGET at a word-sized offset is valid.  */
6877
6878 bool
6879 valid_multiword_target_p (rtx target)
6880 {
6881   machine_mode mode = GET_MODE (target);
6882   int offset = 0;
6883
6884   while (offset < GET_MODE_SIZE (mode)
6885          && validate_subreg (word_mode, mode, target, offset))
6886     offset += UNITS_PER_WORD;
6887   /* The walk reaches the end only if no subreg was rejected.  */
6888   return offset >= GET_MODE_SIZE (mode);
6889 }
6890
6891 /* Like maybe_legitimize_operand, but do not change the code of the
6892    current rtx value.  Return true if OP matches operand OPNO of ICODE.  */
6893
6894 static bool
6895 maybe_legitimize_operand_same_code (enum insn_code icode, unsigned int opno,
6896                                     struct expand_operand *op)
6897 {
6898   /* See if the operand matches in its current form.  */
6899   if (insn_operand_matches (icode, opno, op->value))
6900     return true;
6901
6902   /* If the operand is a memory whose address has no side effects,
6903      try forcing the address into a non-virtual pseudo register.
6904      The check for side effects is important because copy_to_mode_reg
6905      cannot handle things like auto-modified addresses.  */
6906   if (insn_data[(int) icode].operand[opno].allows_mem && MEM_P (op->value))
6907     {
6908       rtx addr, mem;
6909
6910       mem = op->value;
6911       addr = XEXP (mem, 0);
6912       if (!(REG_P (addr) && REGNO (addr) > LAST_VIRTUAL_REGISTER)
6913           && !side_effects_p (addr))
6914         {
6915           rtx_insn *last;
6916           machine_mode mode;
6917
6918           last = get_last_insn ();   /* Rollback point.  */
6919           mode = get_address_mode (mem);
6920           mem = replace_equiv_address (mem, copy_to_mode_reg (mode, addr));
6921           if (insn_operand_matches (icode, opno, mem))
6922             {
6923               op->value = mem;
6924               return true;
6925             }
6926           delete_insns_since (last);   /* Undo the address copy.  */
6927         }
6928     }
6929
6930   return false;
6931 }
6932
6933 /* Try to make OP match operand OPNO of instruction ICODE, according to
6934    OP's type.  Return true on success, with the new value stored in OP.  */
6935
6936 static bool
6937 maybe_legitimize_operand (enum insn_code icode, unsigned int opno,
6938                           struct expand_operand *op)
6939 {
6940   machine_mode mode, imode;
6941   bool old_volatile_ok, result;
6942
6943   mode = op->mode;
6944   switch (op->type)
6945     {
6946     case EXPAND_FIXED:   /* No register fallback for fixed operands.  */
6947       old_volatile_ok = volatile_ok;
6948       volatile_ok = true;   /* Restored below.  */
6949       result = maybe_legitimize_operand_same_code (icode, opno, op);
6950       volatile_ok = old_volatile_ok;
6951       return result;
6952
6953     case EXPAND_OUTPUT:
6954       gcc_assert (mode != VOIDmode);
6955       if (op->value
6956           && op->value != const0_rtx
6957           && GET_MODE (op->value) == mode
6958           && maybe_legitimize_operand_same_code (icode, opno, op))
6959         return true;
6960       /* The suggested target is unusable; use a new pseudo instead.  */
6961       op->value = gen_reg_rtx (mode);
6962       op->target = 0;
6963       break;
6964
6965     case EXPAND_INPUT:
6966     input:   /* Also reached by goto from the cases below.  */
6967       gcc_assert (mode != VOIDmode);
6968       gcc_assert (GET_MODE (op->value) == VOIDmode
6969                   || GET_MODE (op->value) == mode);
6970       if (maybe_legitimize_operand_same_code (icode, opno, op))
6971         return true;
6972       /* Otherwise copy the value into a register of MODE.  */
6973       op->value = copy_to_mode_reg (mode, op->value);
6974       break;
6975
6976     case EXPAND_CONVERT_TO:
6977       gcc_assert (mode != VOIDmode);
6978       op->value = convert_to_mode (mode, op->value, op->unsigned_p);
6979       goto input;
6980
6981     case EXPAND_CONVERT_FROM:
6982       if (GET_MODE (op->value) != VOIDmode)
6983         mode = GET_MODE (op->value);
6984       else
6985         /* The caller must tell us what mode this value has.  */
6986         gcc_assert (mode != VOIDmode);
6987
6988       imode = insn_data[(int) icode].operand[opno].mode;
6989       if (imode != VOIDmode && imode != mode)
6990         {
6991           op->value = convert_modes (imode, mode, op->value, op->unsigned_p);
6992           mode = imode;
6993         }
6994       goto input;
6995
6996     case EXPAND_ADDRESS:
6997       op->value = convert_memory_address (as_a <scalar_int_mode> (mode),
6998                                           op->value);
6999       goto input;
7000
7001     case EXPAND_INTEGER:
7002       mode = insn_data[(int) icode].operand[opno].mode;
7003       if (mode != VOIDmode && const_int_operand (op->value, mode))
7004         goto input;
7005       break;   /* Otherwise just test the predicate.  */
7006     }
7007   return insn_operand_matches (icode, opno, op->value);
7008 }
7009
7010 /* Set up OP as an input operand holding VALUE, whose tree type is TYPE,
7011    allowing for whatever mode conversion the target pattern asks for.  */
7012
7013 void
7014 create_convert_operand_from_type (struct expand_operand *op,
7015                                   rtx value, tree type)
7016 {
7017   bool unsigned_p = TYPE_UNSIGNED (type);
7018
7019   create_convert_operand_from (op, value, TYPE_MODE (type), unsigned_p);
7020 }
7021
7022 /* Legitimize each of the NOPS operands starting at OPS against the
7023    corresponding operand of instruction ICODE, beginning with operand
7024    number OPNO.  On success return true with the adjusted values left in
7025    OPS.  On failure return false after discarding any code emitted.  */
7026
7027 bool
7028 maybe_legitimize_operands (enum insn_code icode, unsigned int opno,
7029                            unsigned int nops, struct expand_operand *ops)
7030 {
7031   rtx_insn *checkpoint = get_last_insn ();
7032   unsigned int done = 0;
7033
7034   while (done < nops
7035          && maybe_legitimize_operand (icode, opno + done, &ops[done]))
7036     done++;
7037   if (done == nops)
7038     return true;
7039   delete_insns_since (checkpoint);
7040   return false;
7041 }
7042
7043 /* Try to generate instruction ICODE, using operands [OPS, OPS + NOPS)
7044    as its operands; NOPS must be ICODE's generator argument count (1 to 9).
7045    Return the instruction pattern on success, and emit any necessary
7046    set-up code.  Return null and emit no code on failure.  */
7047
7048 rtx_insn *
7049 maybe_gen_insn (enum insn_code icode, unsigned int nops,
7050                 struct expand_operand *ops)
7051 {
7052   gcc_assert (nops == (unsigned int) insn_data[(int) icode].n_generator_args);
7053   if (!maybe_legitimize_operands (icode, 0, nops, ops))
7054     return NULL;   /* The operands could not be made to fit ICODE.  */
7055
7056   switch (nops)
7057     {
7058     case 1:
7059       return GEN_FCN (icode) (ops[0].value);
7060     case 2:
7061       return GEN_FCN (icode) (ops[0].value, ops[1].value);
7062     case 3:
7063       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value);
7064     case 4:
7065       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7066                               ops[3].value);
7067     case 5:
7068       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7069                               ops[3].value, ops[4].value);
7070     case 6:
7071       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7072                               ops[3].value, ops[4].value, ops[5].value);
7073     case 7:
7074       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7075                               ops[3].value, ops[4].value, ops[5].value,
7076                               ops[6].value);
7077     case 8:
7078       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7079                               ops[3].value, ops[4].value, ops[5].value,
7080                               ops[6].value, ops[7].value);
7081     case 9:
7082       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
7083                               ops[3].value, ops[4].value, ops[5].value,
7084                               ops[6].value, ops[7].value, ops[8].value);
7085     }
7086   gcc_unreachable ();   /* Only 1 to 9 operands are handled.  */
7087 }
7088
7089 /* Generate instruction ICODE from the NOPS operands starting at OPS and
7090    emit it.  Return true if it was emitted; on failure return false and
7091    leave no code behind.  */
7092
7093 bool
7094 maybe_expand_insn (enum insn_code icode, unsigned int nops,
7095                    struct expand_operand *ops)
7096 {
7097   rtx_insn *insn = maybe_gen_insn (icode, nops, ops);
7098
7099   if (insn == NULL)
7100     return false;
7101   emit_insn (insn);
7102   return true;
7103 }
7104
7105 /* Jump counterpart of maybe_expand_insn: generate ICODE from OPS and emit
7106    it with emit_jump_insn.  Return true if the jump was emitted.  */
7107
7108 bool
7109 maybe_expand_jump_insn (enum insn_code icode, unsigned int nops,
7110                         struct expand_operand *ops)
7111 {
7112   rtx_insn *jump = maybe_gen_insn (icode, nops, ops);
7113
7114   if (jump == NULL)
7115     return false;
7116   emit_jump_insn (jump);
7117   return true;
7118 }
7119
7120 /* Emit instruction ICODE, using operands [OPS, OPS + NOPS) as its
7121    operands.  Unlike maybe_expand_insn, this is not allowed to fail.  */
7122
7123 void
7124 expand_insn (enum insn_code icode, unsigned int nops,
7125              struct expand_operand *ops)
7126 {
7127   if (!maybe_expand_insn (icode, nops, ops))
7128     gcc_unreachable ();   /* Expansion is required to succeed.  */
7129 }
7130
7131 /* Like expand_insn, but for jumps; failure to emit is not expected.  */
7132
7133 void
7134 expand_jump_insn (enum insn_code icode, unsigned int nops,
7135                   struct expand_operand *ops)
7136 {
7137   if (!maybe_expand_jump_insn (icode, nops, ops))
7138     gcc_unreachable ();   /* Expansion is required to succeed.  */
7139 }