1 /* tc-i386.c -- Assemble code for the Intel 80386
2 Copyright (C) 1989-2020 Free Software Foundation, Inc.
3
4 This file is part of GAS, the GNU Assembler.
5
6 GAS is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
10
11 GAS is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GAS; see the file COPYING. If not, write to the Free
18 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
19 02110-1301, USA. */
20
21 /* Intel 80386 machine specific gas.
22 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
23 x86_64 support by Jan Hubicka (jh@suse.cz)
24 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
25 Bugs & suggestions are completely welcome. This is free software.
26 Please help us make it better. */
27
28 #include "as.h"
29 #include "safe-ctype.h"
30 #include "subsegs.h"
31 #include "dwarf2dbg.h"
32 #include "dw2gencfi.h"
33 #include "elf/x86-64.h"
34 #include "opcodes/i386-init.h"
35
36 #ifdef HAVE_LIMITS_H
37 #include <limits.h>
38 #else
39 #ifdef HAVE_SYS_PARAM_H
40 #include <sys/param.h>
41 #endif
42 #ifndef INT_MAX
43 #define INT_MAX (int) (((unsigned) (-1)) >> 1)
44 #endif
45 #endif
46
47 #ifndef INFER_ADDR_PREFIX
48 #define INFER_ADDR_PREFIX 1
49 #endif
50
51 #ifndef DEFAULT_ARCH
52 #define DEFAULT_ARCH "i386"
53 #endif
54
55 #ifndef INLINE
56 #if __GNUC__ >= 2
57 #define INLINE __inline__
58 #else
59 #define INLINE
60 #endif
61 #endif
62
63 /* Prefixes will be emitted in the order defined below.
64 WAIT_PREFIX must be the first prefix since FWAIT really is an
65 instruction, and so must come before any prefixes.
66 The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
67 REP_PREFIX/HLE_PREFIX, LOCK_PREFIX. */
68 #define WAIT_PREFIX 0
69 #define SEG_PREFIX 1
70 #define ADDR_PREFIX 2
71 #define DATA_PREFIX 3
72 #define REP_PREFIX 4
73 #define HLE_PREFIX REP_PREFIX
74 #define BND_PREFIX REP_PREFIX
75 #define LOCK_PREFIX 5
76 #define REX_PREFIX 6 /* must come last. */
77 #define MAX_PREFIXES 7 /* max prefixes per opcode */
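/* A minimal sketch, assuming an i386_insn-style prefix[] array indexed
   by the slots above: emitting the slots in ascending order is what
   produces the documented layout (FWAIT first, REX last).  The
   function name and OUT parameter are hypothetical, for illustration
   only.  */
#if 0
static void
emit_prefixes_in_slot_order (const unsigned char prefix[MAX_PREFIXES],
			     unsigned char *out)
{
  unsigned int slot;

  for (slot = WAIT_PREFIX; slot < MAX_PREFIXES; slot++)
    if (prefix[slot] != 0)
      *out++ = prefix[slot];	/* e.g. 0x9b (fwait) before 0x2e (%cs)  */
}
#endif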
78
79 /* we define the syntax here (modulo base,index,scale syntax) */
80 #define REGISTER_PREFIX '%'
81 #define IMMEDIATE_PREFIX '$'
82 #define ABSOLUTE_PREFIX '*'
83
84 /* these are the instruction mnemonic suffixes in AT&T syntax or
85 memory operand size in Intel syntax. */
86 #define WORD_MNEM_SUFFIX 'w'
87 #define BYTE_MNEM_SUFFIX 'b'
88 #define SHORT_MNEM_SUFFIX 's'
89 #define LONG_MNEM_SUFFIX 'l'
90 #define QWORD_MNEM_SUFFIX 'q'
91 /* Intel Syntax. Use a non-ASCII letter since it never appears
92 in instructions. */
93 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
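/* A hedged sketch (not the real process_suffix() logic) of the operand
   sizes these suffix letters imply; e.g. "movw" selects a 2-byte
   operand and "movq" an 8-byte one.  */
#if 0
static unsigned int
suffix_to_size (char suffix)
{
  switch (suffix)
    {
    case BYTE_MNEM_SUFFIX:	return 1;
    case WORD_MNEM_SUFFIX:	return 2;
    case LONG_MNEM_SUFFIX:	return 4;
    case QWORD_MNEM_SUFFIX:	return 8;
    default:			return 0;	/* none or context-dependent */
    }
}
#endif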
94
95 #define END_OF_INSN '\0'
96
97 /* This matches the C -> StaticRounding alias in the opcode table. */
98 #define commutative staticrounding
99
100 /*
101 'templates' is for grouping together 'template' structures for opcodes
102 of the same name. This is only used for storing the insns in the grand
103 ole hash table of insns.
104 The templates themselves start at START and range up to (but not including)
105 END.
106 */
107 typedef struct
108 {
109 const insn_template *start;
110 const insn_template *end;
111 }
112 templates;
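/* A hedged sketch of how a 'templates' group is consumed: all
   candidate templates for one mnemonic live in the half-open range
   [start, end), so matching is a linear scan (match_template() does
   the real work).  */
#if 0
static const insn_template *
scan_template_group (const templates *group)
{
  const insn_template *t;

  for (t = group->start; t < group->end; t++)
    if (/* T matches the parsed operands */ 1)
      return t;
  return NULL;
}
#endif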
113
114 /* 386 operand encoding bytes: see 386 book for details of this. */
115 typedef struct
116 {
117 unsigned int regmem; /* codes register or memory operand */
118 unsigned int reg; /* codes register operand (or extended opcode) */
119 unsigned int mode; /* how to interpret regmem & reg */
120 }
121 modrm_byte;
122
123 /* x86-64 extension prefix. */
124 typedef int rex_byte;
125
126 /* 386 opcode byte to code indirect addressing. */
127 typedef struct
128 {
129 unsigned base;
130 unsigned index;
131 unsigned scale;
132 }
133 sib_byte;
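/* The two structs above are packed into single bytes on output; a
   sketch of the standard x86 layouts (the real packing is done in
   output_insn(), these helpers are illustrative only):
     ModRM: mode:2 | reg:3 | regmem:3
     SIB:   scale:2 | index:3 | base:3  */
#if 0
static unsigned char
pack_modrm (const modrm_byte *m)
{
  return (m->mode << 6) | (m->reg << 3) | m->regmem;
}

static unsigned char
pack_sib (const sib_byte *s)
{
  return (s->scale << 6) | (s->index << 3) | s->base;
}
#endif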
134
135 /* x86 arch names, types and features */
136 typedef struct
137 {
138 const char *name; /* arch name */
139 unsigned int len; /* arch string length */
140 enum processor_type type; /* arch type */
141 i386_cpu_flags flags; /* cpu feature flags */
142 unsigned int skip; /* show_arch should skip this. */
143 }
144 arch_entry;
145
146 /* Used to turn off indicated flags. */
147 typedef struct
148 {
149 const char *name; /* arch name */
150 unsigned int len; /* arch string length */
151 i386_cpu_flags flags; /* cpu feature flags */
152 }
153 noarch_entry;
154
155 static void update_code_flag (int, int);
156 static void set_code_flag (int);
157 static void set_16bit_gcc_code_flag (int);
158 static void set_intel_syntax (int);
159 static void set_intel_mnemonic (int);
160 static void set_allow_index_reg (int);
161 static void set_check (int);
162 static void set_cpu_arch (int);
163 #ifdef TE_PE
164 static void pe_directive_secrel (int);
165 #endif
166 static void signed_cons (int);
167 static char *output_invalid (int c);
168 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
169 const char *);
170 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
171 const char *);
172 static int i386_att_operand (char *);
173 static int i386_intel_operand (char *, int);
174 static int i386_intel_simplify (expressionS *);
175 static int i386_intel_parse_name (const char *, expressionS *);
176 static const reg_entry *parse_register (char *, char **);
177 static char *parse_insn (char *, char *);
178 static char *parse_operands (char *, const char *);
179 static void swap_operands (void);
180 static void swap_2_operands (int, int);
181 static enum flag_code i386_addressing_mode (void);
182 static void optimize_imm (void);
183 static void optimize_disp (void);
184 static const insn_template *match_template (char);
185 static int check_string (void);
186 static int process_suffix (void);
187 static int check_byte_reg (void);
188 static int check_long_reg (void);
189 static int check_qword_reg (void);
190 static int check_word_reg (void);
191 static int finalize_imm (void);
192 static int process_operands (void);
193 static const seg_entry *build_modrm_byte (void);
194 static void output_insn (void);
195 static void output_imm (fragS *, offsetT);
196 static void output_disp (fragS *, offsetT);
197 #ifndef I386COFF
198 static void s_bss (int);
199 #endif
200 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
201 static void handle_large_common (int small ATTRIBUTE_UNUSED);
202
203 /* GNU_PROPERTY_X86_ISA_1_USED. */
204 static unsigned int x86_isa_1_used;
205 /* GNU_PROPERTY_X86_FEATURE_2_USED. */
206 static unsigned int x86_feature_2_used;
207 /* Generate x86 used ISA and feature properties. */
208 static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
209 #endif
210
211 static const char *default_arch = DEFAULT_ARCH;
212
213 /* parse_register() returns this when a register alias cannot be used. */
214 static const reg_entry bad_reg = { "<bad>", OPERAND_TYPE_NONE, 0, 0,
215 { Dw2Inval, Dw2Inval } };
216
217 /* This struct describes rounding control and SAE in the instruction. */
218 struct RC_Operation
219 {
220 enum rc_type
221 {
222 rne = 0,
223 rd,
224 ru,
225 rz,
226 saeonly
227 } type;
228 int operand;
229 };
230
231 static struct RC_Operation rc_op;
232
233 /* The struct describes masking, applied to OPERAND in the instruction.
234 MASK is a pointer to the corresponding mask register. ZEROING tells
235 whether merging or zeroing mask is used. */
236 struct Mask_Operation
237 {
238 const reg_entry *mask;
239 unsigned int zeroing;
240 /* The operand this operation is associated with. */
241 int operand;
242 };
243
244 static struct Mask_Operation mask_op;
245
246 /* The struct describes broadcasting, applied to OPERAND. TYPE is
247 the 1-to-N broadcast factor. */
248 struct Broadcast_Operation
249 {
250 /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}. */
251 int type;
252
253 /* Index of broadcasted operand. */
254 int operand;
255
256 /* Number of bytes to broadcast. */
257 int bytes;
258 };
259
260 static struct Broadcast_Operation broadcast_op;
261
262 /* VEX prefix. */
263 typedef struct
264 {
265 /* A VEX prefix is either 2 or 3 bytes long; an EVEX prefix is 4 bytes. */
266 unsigned char bytes[4];
267 unsigned int length;
268 /* Destination or source register specifier. */
269 const reg_entry *register_specifier;
270 } vex_prefix;
271
272 /* 'md_assemble ()' gathers together information and puts it into an
273 i386_insn. */
274
275 union i386_op
276 {
277 expressionS *disps;
278 expressionS *imms;
279 const reg_entry *regs;
280 };
281
282 enum i386_error
283 {
284 operand_size_mismatch,
285 operand_type_mismatch,
286 register_type_mismatch,
287 number_of_operands_mismatch,
288 invalid_instruction_suffix,
289 bad_imm4,
290 unsupported_with_intel_mnemonic,
291 unsupported_syntax,
292 unsupported,
293 invalid_sib_address,
294 invalid_vsib_address,
295 invalid_vector_register_set,
296 invalid_tmm_register_set,
297 unsupported_vector_index_register,
298 unsupported_broadcast,
299 broadcast_needed,
300 unsupported_masking,
301 mask_not_on_destination,
302 no_default_mask,
303 unsupported_rc_sae,
304 rc_sae_operand_not_last_imm,
305 invalid_register_operand,
306 };
307
308 struct _i386_insn
309 {
310 /* TM holds the template for the insn we're currently assembling. */
311 insn_template tm;
312
313 /* SUFFIX holds the instruction size suffix for byte, word, dword
314 or qword, if given. */
315 char suffix;
316
317 /* OPERANDS gives the number of given operands. */
318 unsigned int operands;
319
320 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
321 of given register, displacement, memory operands and immediate
322 operands. */
323 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
324
325 /* TYPES [i] is the type (see above #defines) which tells us how to
326 use OP[i] for the corresponding operand. */
327 i386_operand_type types[MAX_OPERANDS];
328
329 /* Displacement expression, immediate expression, or register for each
330 operand. */
331 union i386_op op[MAX_OPERANDS];
332
333 /* Flags for operands. */
334 unsigned int flags[MAX_OPERANDS];
335 #define Operand_PCrel 1
336 #define Operand_Mem 2
337
338 /* Relocation type for operand */
339 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
340
341 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
342 the base index byte below. */
343 const reg_entry *base_reg;
344 const reg_entry *index_reg;
345 unsigned int log2_scale_factor;
346
347 /* SEG gives the seg_entries of this insn. They are zero unless
348 explicit segment overrides are given. */
349 const seg_entry *seg[2];
350
351 /* Copied first memory operand string, for re-checking. */
352 char *memop1_string;
353
354 /* PREFIX holds all the given prefix opcodes (usually null).
355 PREFIXES is the number of prefix opcodes. */
356 unsigned int prefixes;
357 unsigned char prefix[MAX_PREFIXES];
358
359 /* Register is in low 3 bits of opcode. */
360 bfd_boolean short_form;
361
362 /* The operand to a branch insn indicates an absolute branch. */
363 bfd_boolean jumpabsolute;
364
365 /* Extended states. */
366 enum
367 {
368 /* Use MMX state. */
369 xstate_mmx = 1 << 0,
370 /* Use XMM state. */
371 xstate_xmm = 1 << 1,
372 /* Use YMM state. */
373 xstate_ymm = 1 << 2 | xstate_xmm,
374 /* Use ZMM state. */
375 xstate_zmm = 1 << 3 | xstate_ymm,
376 /* Use TMM state. */
377 xstate_tmm = 1 << 4
378 } xstate;
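  /* Since each vector state includes the smaller ones, the values work
     out to mmx = 1, xmm = 2, ymm = 6, zmm = 14 and tmm = 16, so a test
     like (xstate & xstate_xmm) catches XMM, YMM and ZMM uses alike.  */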
379
380 /* Has GOTPC or TLS relocation. */
381 bfd_boolean has_gotpc_tls_reloc;
382
383 /* RM and SIB are the modrm byte and the sib byte where the
384 addressing modes of this insn are encoded. */
385 modrm_byte rm;
386 rex_byte rex;
387 rex_byte vrex;
388 sib_byte sib;
389 vex_prefix vex;
390
391 /* Masking attributes. */
392 struct Mask_Operation *mask;
393
394 /* Rounding control and SAE attributes. */
395 struct RC_Operation *rounding;
396
397 /* Broadcasting attributes. */
398 struct Broadcast_Operation *broadcast;
399
400 /* Compressed disp8*N attribute. */
401 unsigned int memshift;
402
403 /* Prefer load or store in encoding. */
404 enum
405 {
406 dir_encoding_default = 0,
407 dir_encoding_load,
408 dir_encoding_store,
409 dir_encoding_swap
410 } dir_encoding;
411
412 /* Prefer 8bit, 16bit, 32bit displacement in encoding. */
413 enum
414 {
415 disp_encoding_default = 0,
416 disp_encoding_8bit,
417 disp_encoding_16bit,
418 disp_encoding_32bit
419 } disp_encoding;
420
421 /* Prefer the REX byte in encoding. */
422 bfd_boolean rex_encoding;
423
424 /* Disable instruction size optimization. */
425 bfd_boolean no_optimize;
426
427 /* How to encode vector instructions. */
428 enum
429 {
430 vex_encoding_default = 0,
431 vex_encoding_vex,
432 vex_encoding_vex3,
433 vex_encoding_evex,
434 vex_encoding_error
435 } vec_encoding;
436
437 /* REP prefix. */
438 const char *rep_prefix;
439
440 /* HLE prefix. */
441 const char *hle_prefix;
442
443 /* Have BND prefix. */
444 const char *bnd_prefix;
445
446 /* Have NOTRACK prefix. */
447 const char *notrack_prefix;
448
449 /* Error message. */
450 enum i386_error error;
451 };
452
453 typedef struct _i386_insn i386_insn;
454
455 /* Link each RC type with its corresponding string, which is looked
456 for in the asm source. */
457 struct RC_name
458 {
459 enum rc_type type;
460 const char *name;
461 unsigned int len;
462 };
463
464 static const struct RC_name RC_NamesTable[] =
465 {
466 { rne, STRING_COMMA_LEN ("rn-sae") },
467 { rd, STRING_COMMA_LEN ("rd-sae") },
468 { ru, STRING_COMMA_LEN ("ru-sae") },
469 { rz, STRING_COMMA_LEN ("rz-sae") },
470 { saeonly, STRING_COMMA_LEN ("sae") },
471 };
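/* For illustration (a hedged example of AT&T source syntax), these
   strings appear in EVEX rounding-control operands such as

	vaddpd {rz-sae}, %zmm0, %zmm1, %zmm2
	vcvttss2si {sae}, %xmm1, %eax

   and parsing one fills rc_op with the matching rc_type.  */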
472
473 /* List of chars besides those in app.c:symbol_chars that can start an
474 operand. Used to prevent the scrubber eating vital white-space. */
475 const char extra_symbol_chars[] = "*%-([{}"
476 #ifdef LEX_AT
477 "@"
478 #endif
479 #ifdef LEX_QM
480 "?"
481 #endif
482 ;
483
484 #if ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
485 && !defined (TE_GNU) \
486 && !defined (TE_LINUX) \
487 && !defined (TE_FreeBSD) \
488 && !defined (TE_DragonFly) \
489 && !defined (TE_NetBSD))
490 /* This array holds the chars that always start a comment. If the
491 pre-processor is disabled, these aren't very useful. The option
492 --divide will remove '/' from this list. */
493 const char *i386_comment_chars = "#/";
494 #define SVR4_COMMENT_CHARS 1
495 #define PREFIX_SEPARATOR '\\'
496
497 #else
498 const char *i386_comment_chars = "#";
499 #define PREFIX_SEPARATOR '/'
500 #endif
501
502 /* This array holds the chars that only start a comment at the beginning of
503 a line. If the line seems to have the form '# 123 filename'
504 .line and .file directives will appear in the pre-processed output.
505 Note that input_file.c hand checks for '#' at the beginning of the
506 first line of the input file. This is because the compiler outputs
507 #NO_APP at the beginning of its output.
508 Also note that comments started like this one will always work if
509 '/' isn't otherwise defined. */
510 const char line_comment_chars[] = "#/";
511
512 const char line_separator_chars[] = ";";
513
514 /* Chars that can be used to separate mant from exp in floating point
515 nums. */
516 const char EXP_CHARS[] = "eE";
517
518 /* Chars that mean this number is a floating point constant
519 As in 0f12.456
520 or 0d1.2345e12. */
521 const char FLT_CHARS[] = "fFdDxX";
522
523 /* Tables for lexical analysis. */
524 static char mnemonic_chars[256];
525 static char register_chars[256];
526 static char operand_chars[256];
527 static char identifier_chars[256];
528 static char digit_chars[256];
529
530 /* Lexical macros. */
531 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
532 #define is_operand_char(x) (operand_chars[(unsigned char) x])
533 #define is_register_char(x) (register_chars[(unsigned char) x])
534 #define is_space_char(x) ((x) == ' ')
535 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
536 #define is_digit_char(x) (digit_chars[(unsigned char) x])
537
538 /* All non-digit non-letter characters that may occur in an operand. */
539 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
540
541 /* md_assemble() always leaves the strings it's passed unaltered. To
542 effect this we maintain a stack of saved characters that we've smashed
543 with '\0's (indicating end of strings for various sub-fields of the
544 assembler instruction). */
545 static char save_stack[32];
546 static char *save_stack_p;
547 #define END_STRING_AND_SAVE(s) \
548 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
549 #define RESTORE_END_STRING(s) \
550 do { *(s) = *--save_stack_p; } while (0)
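/* Typical usage pattern, as a sketch with hypothetical variable names:
   temporarily NUL-terminate a sub-field of the instruction string,
   parse it, then restore the smashed character.  */
#if 0
  char *token_end = strchr (operand_string, ',');

  END_STRING_AND_SAVE (token_end);	/* *token_end = '\0', old char pushed */
  /* ... operand_string can now be parsed as a C string ...  */
  RESTORE_END_STRING (token_end);	/* pop the saved char back */
#endif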
551
552 /* The instruction we're assembling. */
553 static i386_insn i;
554
555 /* Possible templates for current insn. */
556 static const templates *current_templates;
557
558 /* Per instruction expressionS buffers: max displacements & immediates. */
559 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
560 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
561
562 /* Current operand we are working on. */
563 static int this_operand = -1;
564
565 /* We support three code modes (plus the .code16gcc variant of 16-bit
566 mode). The FLAG_CODE variable distinguishes these. */
567
568 enum flag_code {
569 CODE_32BIT,
570 CODE_16BIT,
571 CODE_64BIT };
572
573 static enum flag_code flag_code;
574 static unsigned int object_64bit;
575 static unsigned int disallow_64bit_reloc;
576 static int use_rela_relocations = 0;
577 /* __tls_get_addr/___tls_get_addr symbol for TLS. */
578 static const char *tls_get_addr;
579
580 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
581 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
582 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
583
584 /* The ELF ABI to use. */
585 enum x86_elf_abi
586 {
587 I386_ABI,
588 X86_64_ABI,
589 X86_64_X32_ABI
590 };
591
592 static enum x86_elf_abi x86_elf_abi = I386_ABI;
593 #endif
594
595 #if defined (TE_PE) || defined (TE_PEP)
596 /* Use big object file format. */
597 static int use_big_obj = 0;
598 #endif
599
600 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
601 /* 1 if generating code for a shared library. */
602 static int shared = 0;
603 #endif
604
605 /* 1 for intel syntax,
606 0 if att syntax. */
607 static int intel_syntax = 0;
608
609 static enum x86_64_isa
610 {
611 amd64 = 1, /* AMD64 ISA. */
612 intel64 /* Intel64 ISA. */
613 } isa64;
614
615 /* 1 for intel mnemonic,
616 0 if att mnemonic. */
617 static int intel_mnemonic = !SYSV386_COMPAT;
618
619 /* 1 if pseudo registers are permitted. */
620 static int allow_pseudo_reg = 0;
621
622 /* 1 if register prefix % not required. */
623 static int allow_naked_reg = 0;
624
625 /* 1 if the assembler should add BND prefix for all control-transferring
626 instructions supporting it, even if this prefix wasn't specified
627 explicitly. */
628 static int add_bnd_prefix = 0;
629
630 /* 1 if pseudo index register, eiz/riz, is allowed. */
631 static int allow_index_reg = 0;
632
633 /* 1 if the assembler should ignore LOCK prefix, even if it was
634 specified explicitly. */
635 static int omit_lock_prefix = 0;
636
637 /* 1 if the assembler should encode lfence, mfence, and sfence as
638 "lock addl $0, (%{re}sp)". */
639 static int avoid_fence = 0;
640
641 /* 1 if lfence should be inserted after every load. */
642 static int lfence_after_load = 0;
643
644 /* Non-zero if lfence should be inserted before indirect branch. */
645 static enum lfence_before_indirect_branch_kind
646 {
647 lfence_branch_none = 0,
648 lfence_branch_register,
649 lfence_branch_memory,
650 lfence_branch_all
651 }
652 lfence_before_indirect_branch;
653
654 /* Non-zero if lfence should be inserted before ret. */
655 static enum lfence_before_ret_kind
656 {
657 lfence_before_ret_none = 0,
658 lfence_before_ret_not,
659 lfence_before_ret_or,
660 lfence_before_ret_shl
661 }
662 lfence_before_ret;
663
664 /* Records whether the previous "instruction" was really a directive
   (e.g. .byte) or a prefix, and where it occurred. */
665 static struct
666 {
667 segT seg;
668 const char *file;
669 const char *name;
670 unsigned int line;
671 enum last_insn_kind
672 {
673 last_insn_other = 0,
674 last_insn_directive,
675 last_insn_prefix
676 } kind;
677 } last_insn;
678
679 /* 1 if the assembler should generate relax relocations. */
680
681 static int generate_relax_relocations
682 = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
683
684 static enum check_kind
685 {
686 check_none = 0,
687 check_warning,
688 check_error
689 }
690 sse_check, operand_check = check_warning;
691
692 /* Non-zero if branches should be aligned within power of 2 boundary. */
693 static int align_branch_power = 0;
694
695 /* Types of branches to align. */
696 enum align_branch_kind
697 {
698 align_branch_none = 0,
699 align_branch_jcc = 1,
700 align_branch_fused = 2,
701 align_branch_jmp = 3,
702 align_branch_call = 4,
703 align_branch_indirect = 5,
704 align_branch_ret = 6
705 };
706
707 /* Type bits of branches to align. */
708 enum align_branch_bit
709 {
710 align_branch_jcc_bit = 1 << align_branch_jcc,
711 align_branch_fused_bit = 1 << align_branch_fused,
712 align_branch_jmp_bit = 1 << align_branch_jmp,
713 align_branch_call_bit = 1 << align_branch_call,
714 align_branch_indirect_bit = 1 << align_branch_indirect,
715 align_branch_ret_bit = 1 << align_branch_ret
716 };
717
718 static unsigned int align_branch = (align_branch_jcc_bit
719 | align_branch_fused_bit
720 | align_branch_jmp_bit);
721
722 /* Types of conditional jump used by macro-fusion. */
723 enum mf_jcc_kind
724 {
725 mf_jcc_jo = 0, /* base opcode 0x70 */
726 mf_jcc_jc, /* base opcode 0x72 */
727 mf_jcc_je, /* base opcode 0x74 */
728 mf_jcc_jna, /* base opcode 0x76 */
729 mf_jcc_js, /* base opcode 0x78 */
730 mf_jcc_jp, /* base opcode 0x7a */
731 mf_jcc_jl, /* base opcode 0x7c */
732 mf_jcc_jle, /* base opcode 0x7e */
733 };
734
735 /* Types of compare flag-modifying instructions used by macro-fusion. */
736 enum mf_cmp_kind
737 {
738 mf_cmp_test_and, /* test/cmp */
739 mf_cmp_alu_cmp, /* add/sub/cmp */
740 mf_cmp_incdec /* inc/dec */
741 };
742
743 /* The maximum padding size for fused jcc. A CMP-like instruction
744 can be 9 bytes and a jcc can be 6 bytes. Leave room for prefixes
745 just in case. */
746 #define MAX_FUSED_JCC_PADDING_SIZE 20
747
748 /* The maximum number of prefixes added for an instruction. */
749 static unsigned int align_branch_prefix_size = 5;
750
751 /* Optimization:
752 1. Clear the REX_W bit with register operand if possible.
753 2. Above plus use 128bit vector instruction to clear the full vector
754 register.
755 */
756 static int optimize = 0;
757
758 /* Optimization:
759 1. Clear the REX_W bit with register operand if possible.
760 2. Above plus use 128bit vector instruction to clear the full vector
761 register.
762 3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
763 "testb $imm7,%r8".
764 */
765 static int optimize_for_space = 0;
766
767 /* Register prefix used for error message. */
768 static const char *register_prefix = "%";
769
770 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
771 leave, push, and pop instructions so that gcc has the same stack
772 frame as in 32 bit mode. */
773 static char stackop_size = '\0';
774
775 /* Non-zero to optimize code alignment. */
776 int optimize_align_code = 1;
777
778 /* Non-zero to quieten some warnings. */
779 static int quiet_warnings = 0;
780
781 /* CPU name. */
782 static const char *cpu_arch_name = NULL;
783 static char *cpu_sub_arch_name = NULL;
784
785 /* CPU feature flags. */
786 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
787
788 /* If we have selected a cpu we are generating instructions for. */
789 static int cpu_arch_tune_set = 0;
790
791 /* Cpu we are generating instructions for. */
792 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
793
794 /* CPU feature flags of cpu we are generating instructions for. */
795 static i386_cpu_flags cpu_arch_tune_flags;
796
797 /* CPU instruction set architecture used. */
798 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
799
800 /* CPU feature flags of instruction set architecture used. */
801 i386_cpu_flags cpu_arch_isa_flags;
802
803 /* If set, conditional jumps are not automatically promoted to handle
804 offsets larger than a byte. */
805 static unsigned int no_cond_jump_promotion = 0;
806
807 /* Encode SSE instructions with VEX prefix. */
808 static unsigned int sse2avx;
809
810 /* Encode scalar AVX instructions with specific vector length. */
811 static enum
812 {
813 vex128 = 0,
814 vex256
815 } avxscalar;
816
817 /* Encode VEX WIG instructions with specific vex.w. */
818 static enum
819 {
820 vexw0 = 0,
821 vexw1
822 } vexwig;
823
824 /* Encode scalar EVEX LIG instructions with specific vector length. */
825 static enum
826 {
827 evexl128 = 0,
828 evexl256,
829 evexl512
830 } evexlig;
831
832 /* Encode EVEX WIG instructions with specific evex.w. */
833 static enum
834 {
835 evexw0 = 0,
836 evexw1
837 } evexwig;
838
839 /* Value to encode in EVEX RC bits, for SAE-only instructions. */
840 static enum rc_type evexrcig = rne;
841
842 /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
843 static symbolS *GOT_symbol;
844
845 /* The dwarf2 return column, adjusted for 32 or 64 bit. */
846 unsigned int x86_dwarf2_return_column;
847
848 /* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
849 int x86_cie_data_alignment;
850
851 /* Interface to relax_segment.
852 There are 3 major relax states for 386 jump insns because the
853 different types of jumps add different sizes to frags when we're
854 figuring out what sort of jump to choose to reach a given label.
855
856 BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
857 branches which are handled by md_estimate_size_before_relax() and
858 i386_generic_table_relax_frag(). */
859
860 /* Types. */
861 #define UNCOND_JUMP 0
862 #define COND_JUMP 1
863 #define COND_JUMP86 2
864 #define BRANCH_PADDING 3
865 #define BRANCH_PREFIX 4
866 #define FUSED_JCC_PADDING 5
867
868 /* Sizes. */
869 #define CODE16 1
870 #define SMALL 0
871 #define SMALL16 (SMALL | CODE16)
872 #define BIG 2
873 #define BIG16 (BIG | CODE16)
874
875 #ifndef INLINE
876 #ifdef __GNUC__
877 #define INLINE __inline__
878 #else
879 #define INLINE
880 #endif
881 #endif
882
883 #define ENCODE_RELAX_STATE(type, size) \
884 ((relax_substateT) (((type) << 2) | (size)))
885 #define TYPE_FROM_RELAX_STATE(s) \
886 ((s) >> 2)
887 #define DISP_SIZE_FROM_RELAX_STATE(s) \
888 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
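/* Worked example: a conditional jump needing a 32-bit displacement is
   ENCODE_RELAX_STATE (COND_JUMP, BIG) == (1 << 2) | 2 == 6; decoding
   gives TYPE_FROM_RELAX_STATE (6) == COND_JUMP and
   DISP_SIZE_FROM_RELAX_STATE (6) == 4, and 6 also indexes the
   matching md_relax_table[] entry below.  */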
889
890 /* This table is used by relax_frag to promote short jumps to long
891 ones where necessary. SMALL (short) jumps may be promoted to BIG
892 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
893 don't allow a short jump in a 32 bit code segment to be promoted to
894 a 16 bit offset jump because it's slower (requires data size
895 prefix), and doesn't work, unless the destination is in the bottom
896 64k of the code segment (The top 16 bits of eip are zeroed). */
897
898 const relax_typeS md_relax_table[] =
899 {
900 /* The fields are:
901 1) most positive reach of this state,
902 2) most negative reach of this state,
903 3) how many bytes this mode will have in the variable part of the frag
904 4) which index into the table to try if we can't fit into this one. */
905
906 /* UNCOND_JUMP states. */
907 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
908 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
909 /* dword jmp adds 4 bytes to frag:
910 0 extra opcode bytes, 4 displacement bytes. */
911 {0, 0, 4, 0},
912 /* word jmp adds 2 bytes to frag:
913 0 extra opcode bytes, 2 displacement bytes. */
914 {0, 0, 2, 0},
915
916 /* COND_JUMP states. */
917 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
918 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
919 /* dword conditionals add 5 bytes to frag:
920 1 extra opcode byte, 4 displacement bytes. */
921 {0, 0, 5, 0},
922 /* word conditionals add 3 bytes to frag:
923 1 extra opcode byte, 2 displacement bytes. */
924 {0, 0, 3, 0},
925
926 /* COND_JUMP86 states. */
927 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
928 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
929 /* dword conditionals add 5 bytes to frag:
930 1 extra opcode byte, 4 displacement bytes. */
931 {0, 0, 5, 0},
932 /* word conditionals add 4 bytes to frag:
933 1 displacement byte and a 3 byte long branch insn. */
934 {0, 0, 4, 0}
935 };
936
937 static const arch_entry cpu_arch[] =
938 {
939 /* Do not replace the first two entries - i386_target_format()
940 relies on them being there in this order. */
941 { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
942 CPU_GENERIC32_FLAGS, 0 },
943 { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
944 CPU_GENERIC64_FLAGS, 0 },
945 { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
946 CPU_NONE_FLAGS, 0 },
947 { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
948 CPU_I186_FLAGS, 0 },
949 { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
950 CPU_I286_FLAGS, 0 },
951 { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
952 CPU_I386_FLAGS, 0 },
953 { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
954 CPU_I486_FLAGS, 0 },
955 { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
956 CPU_I586_FLAGS, 0 },
957 { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
958 CPU_I686_FLAGS, 0 },
959 { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
960 CPU_I586_FLAGS, 0 },
961 { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
962 CPU_PENTIUMPRO_FLAGS, 0 },
963 { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
964 CPU_P2_FLAGS, 0 },
965 { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
966 CPU_P3_FLAGS, 0 },
967 { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
968 CPU_P4_FLAGS, 0 },
969 { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
970 CPU_CORE_FLAGS, 0 },
971 { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
972 CPU_NOCONA_FLAGS, 0 },
973 { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
974 CPU_CORE_FLAGS, 1 },
975 { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
976 CPU_CORE_FLAGS, 0 },
977 { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
978 CPU_CORE2_FLAGS, 1 },
979 { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
980 CPU_CORE2_FLAGS, 0 },
981 { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
982 CPU_COREI7_FLAGS, 0 },
983 { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
984 CPU_L1OM_FLAGS, 0 },
985 { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
986 CPU_K1OM_FLAGS, 0 },
987 { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
988 CPU_IAMCU_FLAGS, 0 },
989 { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
990 CPU_K6_FLAGS, 0 },
991 { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
992 CPU_K6_2_FLAGS, 0 },
993 { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
994 CPU_ATHLON_FLAGS, 0 },
995 { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
996 CPU_K8_FLAGS, 1 },
997 { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
998 CPU_K8_FLAGS, 0 },
999 { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
1000 CPU_K8_FLAGS, 0 },
1001 { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
1002 CPU_AMDFAM10_FLAGS, 0 },
1003 { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
1004 CPU_BDVER1_FLAGS, 0 },
1005 { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
1006 CPU_BDVER2_FLAGS, 0 },
1007 { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
1008 CPU_BDVER3_FLAGS, 0 },
1009 { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
1010 CPU_BDVER4_FLAGS, 0 },
1011 { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
1012 CPU_ZNVER1_FLAGS, 0 },
1013 { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
1014 CPU_ZNVER2_FLAGS, 0 },
1015 { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
1016 CPU_BTVER1_FLAGS, 0 },
1017 { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
1018 CPU_BTVER2_FLAGS, 0 },
1019 { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
1020 CPU_8087_FLAGS, 0 },
1021 { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
1022 CPU_287_FLAGS, 0 },
1023 { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
1024 CPU_387_FLAGS, 0 },
1025 { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
1026 CPU_687_FLAGS, 0 },
1027 { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
1028 CPU_CMOV_FLAGS, 0 },
1029 { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
1030 CPU_FXSR_FLAGS, 0 },
1031 { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
1032 CPU_MMX_FLAGS, 0 },
1033 { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
1034 CPU_SSE_FLAGS, 0 },
1035 { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
1036 CPU_SSE2_FLAGS, 0 },
1037 { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
1038 CPU_SSE3_FLAGS, 0 },
1039 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1040 CPU_SSE4A_FLAGS, 0 },
1041 { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
1042 CPU_SSSE3_FLAGS, 0 },
1043 { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
1044 CPU_SSE4_1_FLAGS, 0 },
1045 { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
1046 CPU_SSE4_2_FLAGS, 0 },
1047 { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
1048 CPU_SSE4_2_FLAGS, 0 },
1049 { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
1050 CPU_AVX_FLAGS, 0 },
1051 { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
1052 CPU_AVX2_FLAGS, 0 },
1053 { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
1054 CPU_AVX512F_FLAGS, 0 },
1055 { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
1056 CPU_AVX512CD_FLAGS, 0 },
1057 { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
1058 CPU_AVX512ER_FLAGS, 0 },
1059 { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
1060 CPU_AVX512PF_FLAGS, 0 },
1061 { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
1062 CPU_AVX512DQ_FLAGS, 0 },
1063 { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
1064 CPU_AVX512BW_FLAGS, 0 },
1065 { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
1066 CPU_AVX512VL_FLAGS, 0 },
1067 { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
1068 CPU_VMX_FLAGS, 0 },
1069 { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
1070 CPU_VMFUNC_FLAGS, 0 },
1071 { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
1072 CPU_SMX_FLAGS, 0 },
1073 { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
1074 CPU_XSAVE_FLAGS, 0 },
1075 { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
1076 CPU_XSAVEOPT_FLAGS, 0 },
1077 { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
1078 CPU_XSAVEC_FLAGS, 0 },
1079 { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
1080 CPU_XSAVES_FLAGS, 0 },
1081 { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
1082 CPU_AES_FLAGS, 0 },
1083 { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
1084 CPU_PCLMUL_FLAGS, 0 },
1085 { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
1086 CPU_PCLMUL_FLAGS, 1 },
1087 { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
1088 CPU_FSGSBASE_FLAGS, 0 },
1089 { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
1090 CPU_RDRND_FLAGS, 0 },
1091 { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
1092 CPU_F16C_FLAGS, 0 },
1093 { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
1094 CPU_BMI2_FLAGS, 0 },
1095 { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
1096 CPU_FMA_FLAGS, 0 },
1097 { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
1098 CPU_FMA4_FLAGS, 0 },
1099 { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
1100 CPU_XOP_FLAGS, 0 },
1101 { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
1102 CPU_LWP_FLAGS, 0 },
1103 { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
1104 CPU_MOVBE_FLAGS, 0 },
1105 { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
1106 CPU_CX16_FLAGS, 0 },
1107 { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
1108 CPU_EPT_FLAGS, 0 },
1109 { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
1110 CPU_LZCNT_FLAGS, 0 },
1111 { STRING_COMMA_LEN (".popcnt"), PROCESSOR_UNKNOWN,
1112 CPU_POPCNT_FLAGS, 0 },
1113 { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
1114 CPU_HLE_FLAGS, 0 },
1115 { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
1116 CPU_RTM_FLAGS, 0 },
1117 { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
1118 CPU_INVPCID_FLAGS, 0 },
1119 { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
1120 CPU_CLFLUSH_FLAGS, 0 },
1121 { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
1122 CPU_NOP_FLAGS, 0 },
1123 { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
1124 CPU_SYSCALL_FLAGS, 0 },
1125 { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
1126 CPU_RDTSCP_FLAGS, 0 },
1127 { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
1128 CPU_3DNOW_FLAGS, 0 },
1129 { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
1130 CPU_3DNOWA_FLAGS, 0 },
1131 { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
1132 CPU_PADLOCK_FLAGS, 0 },
1133 { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
1134 CPU_SVME_FLAGS, 1 },
1135 { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
1136 CPU_SVME_FLAGS, 0 },
1137 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1138 CPU_SSE4A_FLAGS, 0 },
1139 { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
1140 CPU_ABM_FLAGS, 0 },
1141 { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
1142 CPU_BMI_FLAGS, 0 },
1143 { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
1144 CPU_TBM_FLAGS, 0 },
1145 { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
1146 CPU_ADX_FLAGS, 0 },
1147 { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
1148 CPU_RDSEED_FLAGS, 0 },
1149 { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
1150 CPU_PRFCHW_FLAGS, 0 },
1151 { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
1152 CPU_SMAP_FLAGS, 0 },
1153 { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
1154 CPU_MPX_FLAGS, 0 },
1155 { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
1156 CPU_SHA_FLAGS, 0 },
1157 { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
1158 CPU_CLFLUSHOPT_FLAGS, 0 },
1159 { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
1160 CPU_PREFETCHWT1_FLAGS, 0 },
1161 { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
1162 CPU_SE1_FLAGS, 0 },
1163 { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
1164 CPU_CLWB_FLAGS, 0 },
1165 { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
1166 CPU_AVX512IFMA_FLAGS, 0 },
1167 { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
1168 CPU_AVX512VBMI_FLAGS, 0 },
1169 { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1170 CPU_AVX512_4FMAPS_FLAGS, 0 },
1171 { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1172 CPU_AVX512_4VNNIW_FLAGS, 0 },
1173 { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1174 CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
1175 { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1176 CPU_AVX512_VBMI2_FLAGS, 0 },
1177 { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1178 CPU_AVX512_VNNI_FLAGS, 0 },
1179 { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1180 CPU_AVX512_BITALG_FLAGS, 0 },
1181 { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
1182 CPU_CLZERO_FLAGS, 0 },
1183 { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
1184 CPU_MWAITX_FLAGS, 0 },
1185 { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
1186 CPU_OSPKE_FLAGS, 0 },
1187 { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
1188 CPU_RDPID_FLAGS, 0 },
1189 { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1190 CPU_PTWRITE_FLAGS, 0 },
1191 { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1192 CPU_IBT_FLAGS, 0 },
1193 { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1194 CPU_SHSTK_FLAGS, 0 },
1195 { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1196 CPU_GFNI_FLAGS, 0 },
1197 { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1198 CPU_VAES_FLAGS, 0 },
1199 { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1200 CPU_VPCLMULQDQ_FLAGS, 0 },
1201 { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1202 CPU_WBNOINVD_FLAGS, 0 },
1203 { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1204 CPU_PCONFIG_FLAGS, 0 },
1205 { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1206 CPU_WAITPKG_FLAGS, 0 },
1207 { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1208 CPU_CLDEMOTE_FLAGS, 0 },
1209 { STRING_COMMA_LEN (".amx_int8"), PROCESSOR_UNKNOWN,
1210 CPU_AMX_INT8_FLAGS, 0 },
1211 { STRING_COMMA_LEN (".amx_bf16"), PROCESSOR_UNKNOWN,
1212 CPU_AMX_BF16_FLAGS, 0 },
1213 { STRING_COMMA_LEN (".amx_tile"), PROCESSOR_UNKNOWN,
1214 CPU_AMX_TILE_FLAGS, 0 },
1215 { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1216 CPU_MOVDIRI_FLAGS, 0 },
1217 { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1218 CPU_MOVDIR64B_FLAGS, 0 },
1219 { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1220 CPU_AVX512_BF16_FLAGS, 0 },
1221 { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
1222 CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
1223 { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
1224 CPU_ENQCMD_FLAGS, 0 },
1225 { STRING_COMMA_LEN (".serialize"), PROCESSOR_UNKNOWN,
1226 CPU_SERIALIZE_FLAGS, 0 },
1227 { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
1228 CPU_RDPRU_FLAGS, 0 },
1229 { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
1230 CPU_MCOMMIT_FLAGS, 0 },
1231 { STRING_COMMA_LEN (".sev_es"), PROCESSOR_UNKNOWN,
1232 CPU_SEV_ES_FLAGS, 0 },
1233 { STRING_COMMA_LEN (".tsxldtrk"), PROCESSOR_UNKNOWN,
1234 CPU_TSXLDTRK_FLAGS, 0 },
1235 };
1236
1237 static const noarch_entry cpu_noarch[] =
1238 {
1239 { STRING_COMMA_LEN ("no87"), CPU_ANY_X87_FLAGS },
1240 { STRING_COMMA_LEN ("no287"), CPU_ANY_287_FLAGS },
1241 { STRING_COMMA_LEN ("no387"), CPU_ANY_387_FLAGS },
1242 { STRING_COMMA_LEN ("no687"), CPU_ANY_687_FLAGS },
1243 { STRING_COMMA_LEN ("nocmov"), CPU_ANY_CMOV_FLAGS },
1244 { STRING_COMMA_LEN ("nofxsr"), CPU_ANY_FXSR_FLAGS },
1245 { STRING_COMMA_LEN ("nommx"), CPU_ANY_MMX_FLAGS },
1246 { STRING_COMMA_LEN ("nosse"), CPU_ANY_SSE_FLAGS },
1247 { STRING_COMMA_LEN ("nosse2"), CPU_ANY_SSE2_FLAGS },
1248 { STRING_COMMA_LEN ("nosse3"), CPU_ANY_SSE3_FLAGS },
1249 { STRING_COMMA_LEN ("nosse4a"), CPU_ANY_SSE4A_FLAGS },
1250 { STRING_COMMA_LEN ("nossse3"), CPU_ANY_SSSE3_FLAGS },
1251 { STRING_COMMA_LEN ("nosse4.1"), CPU_ANY_SSE4_1_FLAGS },
1252 { STRING_COMMA_LEN ("nosse4.2"), CPU_ANY_SSE4_2_FLAGS },
1253 { STRING_COMMA_LEN ("nosse4"), CPU_ANY_SSE4_1_FLAGS },
1254 { STRING_COMMA_LEN ("noavx"), CPU_ANY_AVX_FLAGS },
1255 { STRING_COMMA_LEN ("noavx2"), CPU_ANY_AVX2_FLAGS },
1256 { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1257 { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1258 { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1259 { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1260 { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1261 { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1262 { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1263 { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1264 { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
1265 { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
1266 { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
1267 { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
1268 { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
1269 { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
1270 { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
1271 { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1272 { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
1273 { STRING_COMMA_LEN ("noamx_int8"), CPU_ANY_AMX_INT8_FLAGS },
1274 { STRING_COMMA_LEN ("noamx_bf16"), CPU_ANY_AMX_BF16_FLAGS },
1275 { STRING_COMMA_LEN ("noamx_tile"), CPU_ANY_AMX_TILE_FLAGS },
1276 { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1277 { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
1278 { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
1279 { STRING_COMMA_LEN ("noavx512_vp2intersect"),
1280 CPU_ANY_AVX512_VP2INTERSECT_FLAGS },
1281 { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
1282 { STRING_COMMA_LEN ("noserialize"), CPU_ANY_SERIALIZE_FLAGS },
1283 { STRING_COMMA_LEN ("notsxldtrk"), CPU_ANY_TSXLDTRK_FLAGS },
1284 };
1285
1286 #ifdef I386COFF
1287 /* Like s_lcomm_internal in gas/read.c but the alignment string
1288 is allowed to be optional. */
1289
1290 static symbolS *
1291 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1292 {
1293 addressT align = 0;
1294
1295 SKIP_WHITESPACE ();
1296
1297 if (needs_align
1298 && *input_line_pointer == ',')
1299 {
1300 align = parse_align (needs_align - 1);
1301
1302 if (align == (addressT) -1)
1303 return NULL;
1304 }
1305 else
1306 {
1307 if (size >= 8)
1308 align = 3;
1309 else if (size >= 4)
1310 align = 2;
1311 else if (size >= 2)
1312 align = 1;
1313 else
1314 align = 0;
1315 }
1316
1317 bss_alloc (symbolP, size, align);
1318 return symbolP;
1319 }
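/* For example, with no explicit alignment a 6-byte .lcomm gets
   align == 2 (i.e. 4-byte alignment), since 6 >= 4 but 6 < 8.  */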
1320
1321 static void
1322 pe_lcomm (int needs_align)
1323 {
1324 s_comm_internal (needs_align * 2, pe_lcomm_internal);
1325 }
1326 #endif
1327
1328 const pseudo_typeS md_pseudo_table[] =
1329 {
1330 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1331 {"align", s_align_bytes, 0},
1332 #else
1333 {"align", s_align_ptwo, 0},
1334 #endif
1335 {"arch", set_cpu_arch, 0},
1336 #ifndef I386COFF
1337 {"bss", s_bss, 0},
1338 #else
1339 {"lcomm", pe_lcomm, 1},
1340 #endif
1341 {"ffloat", float_cons, 'f'},
1342 {"dfloat", float_cons, 'd'},
1343 {"tfloat", float_cons, 'x'},
1344 {"value", cons, 2},
1345 {"slong", signed_cons, 4},
1346 {"noopt", s_ignore, 0},
1347 {"optim", s_ignore, 0},
1348 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1349 {"code16", set_code_flag, CODE_16BIT},
1350 {"code32", set_code_flag, CODE_32BIT},
1351 #ifdef BFD64
1352 {"code64", set_code_flag, CODE_64BIT},
1353 #endif
1354 {"intel_syntax", set_intel_syntax, 1},
1355 {"att_syntax", set_intel_syntax, 0},
1356 {"intel_mnemonic", set_intel_mnemonic, 1},
1357 {"att_mnemonic", set_intel_mnemonic, 0},
1358 {"allow_index_reg", set_allow_index_reg, 1},
1359 {"disallow_index_reg", set_allow_index_reg, 0},
1360 {"sse_check", set_check, 0},
1361 {"operand_check", set_check, 1},
1362 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1363 {"largecomm", handle_large_common, 0},
1364 #else
1365 {"file", dwarf2_directive_file, 0},
1366 {"loc", dwarf2_directive_loc, 0},
1367 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1368 #endif
1369 #ifdef TE_PE
1370 {"secrel32", pe_directive_secrel, 0},
1371 #endif
1372 {0, 0, 0}
1373 };
1374
1375 /* For interface with expression (). */
1376 extern char *input_line_pointer;
1377
1378 /* Hash table for instruction mnemonic lookup. */
1379 static htab_t op_hash;
1380
1381 /* Hash table for register lookup. */
1382 static htab_t reg_hash;
1383 \f
1384 /* Various efficient no-op patterns for aligning code labels.
1385 Note: Don't try to assemble the instructions in the comments.
1386 0L and 0w are not legal. */
1387 static const unsigned char f32_1[] =
1388 {0x90}; /* nop */
1389 static const unsigned char f32_2[] =
1390 {0x66,0x90}; /* xchg %ax,%ax */
1391 static const unsigned char f32_3[] =
1392 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
1393 static const unsigned char f32_4[] =
1394 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
1395 static const unsigned char f32_6[] =
1396 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
1397 static const unsigned char f32_7[] =
1398 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1399 static const unsigned char f16_3[] =
1400 {0x8d,0x74,0x00}; /* lea 0(%si),%si */
1401 static const unsigned char f16_4[] =
1402 {0x8d,0xb4,0x00,0x00}; /* lea 0W(%si),%si */
1403 static const unsigned char jump_disp8[] =
1404 {0xeb}; /* jmp disp8 */
1405 static const unsigned char jump32_disp32[] =
1406 {0xe9}; /* jmp disp32 */
1407 static const unsigned char jump16_disp32[] =
1408 {0x66,0xe9}; /* jmp disp32 */
1409 /* 32-bit NOP patterns. */
1410 static const unsigned char *const f32_patt[] = {
1411 f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
1412 };
1413 /* 16-bit NOP patterns. */
1414 static const unsigned char *const f16_patt[] = {
1415 f32_1, f32_2, f16_3, f16_4
1416 };
1417 /* nopl (%[re]ax) */
1418 static const unsigned char alt_3[] =
1419 {0x0f,0x1f,0x00};
1420 /* nopl 0(%[re]ax) */
1421 static const unsigned char alt_4[] =
1422 {0x0f,0x1f,0x40,0x00};
1423 /* nopl 0(%[re]ax,%[re]ax,1) */
1424 static const unsigned char alt_5[] =
1425 {0x0f,0x1f,0x44,0x00,0x00};
1426 /* nopw 0(%[re]ax,%[re]ax,1) */
1427 static const unsigned char alt_6[] =
1428 {0x66,0x0f,0x1f,0x44,0x00,0x00};
1429 /* nopl 0L(%[re]ax) */
1430 static const unsigned char alt_7[] =
1431 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1432 /* nopl 0L(%[re]ax,%[re]ax,1) */
1433 static const unsigned char alt_8[] =
1434 {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1435 /* nopw 0L(%[re]ax,%[re]ax,1) */
1436 static const unsigned char alt_9[] =
1437 {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1438 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1439 static const unsigned char alt_10[] =
1440 {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1441 /* data16 nopw %cs:0L(%eax,%eax,1) */
1442 static const unsigned char alt_11[] =
1443 {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1444 /* 32-bit and 64-bit NOP patterns. */
1445 static const unsigned char *const alt_patt[] = {
1446 f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1447 alt_9, alt_10, alt_11
1448 };
1449
1450 /* Generate COUNT bytes of NOPs at WHERE from PATT, with
1451 MAX_SINGLE_NOP_SIZE the maximum size of a single NOP instruction. */
1452
1453 static void
1454 i386_output_nops (char *where, const unsigned char *const *patt,
1455 int count, int max_single_nop_size)
1456
1457 {
1458 /* Place the longer NOP first. */
1459 int last;
1460 int offset;
1461 const unsigned char *nops;
1462
1463 if (max_single_nop_size < 1)
1464 {
1465 as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1466 max_single_nop_size);
1467 return;
1468 }
1469
1470 nops = patt[max_single_nop_size - 1];
1471
1472 /* Use the smaller one if the requested one isn't available. */
1473 if (nops == NULL)
1474 {
1475 max_single_nop_size--;
1476 nops = patt[max_single_nop_size - 1];
1477 }
1478
1479 last = count % max_single_nop_size;
1480
1481 count -= last;
1482 for (offset = 0; offset < count; offset += max_single_nop_size)
1483 memcpy (where + offset, nops, max_single_nop_size);
1484
1485 if (last)
1486 {
1487 nops = patt[last - 1];
1488 if (nops == NULL)
1489 {
1490 /* Use the smaller one plus one-byte NOP if the needed one
1491 isn't available. */
1492 last--;
1493 nops = patt[last - 1];
1494 memcpy (where + offset, nops, last);
1495 where[offset + last] = *patt[0];
1496 }
1497 else
1498 memcpy (where + offset, nops, last);
1499 }
1500 }
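/* A worked example under the patterns above: i386_output_nops (where,
   alt_patt, 10, 7) splits the 10 bytes as 10 % 7 == 3, emitting one
   7-byte NOP (alt_7) followed by one 3-byte NOP (alt_3).  */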
1501
1502 static INLINE int
1503 fits_in_imm7 (offsetT num)
1504 {
1505 return (num & 0x7f) == num;
1506 }
1507
1508 static INLINE int
1509 fits_in_imm31 (offsetT num)
1510 {
1511 return (num & 0x7fffffff) == num;
1512 }
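/* Both are unsigned-range checks: fits_in_imm7 (127) is true, while
   fits_in_imm7 (128) and fits_in_imm7 (-1) are false because masking
   changes their value.  Likewise fits_in_imm31 accepts only
   [0, 0x7fffffff].  */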
1513
1514 /* Generate COUNT bytes of NOPs at WHERE, with LIMIT the maximum
1515 size of a single NOP instruction. */
1516
1517 void
1518 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1519 {
1520 const unsigned char *const *patt = NULL;
1521 int max_single_nop_size;
1522 /* Maximum number of NOPs before switching to jump over NOPs. */
1523 int max_number_of_nops;
1524
1525 switch (fragP->fr_type)
1526 {
1527 case rs_fill_nop:
1528 case rs_align_code:
1529 break;
1530 case rs_machine_dependent:
1531 /* Allow NOP padding for jumps and calls. */
1532 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
1533 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
1534 break;
1535 /* Fall through. */
1536 default:
1537 return;
1538 }
1539
1540 /* We need to decide which NOP sequence to use for 32bit and
1541 64bit. When -mtune= is used:
1542
1543 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1544 PROCESSOR_GENERIC32, f32_patt will be used.
1545 2. For the rest, alt_patt will be used.
1546
1547 When -mtune= isn't used, alt_patt will be used if
1548 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
1549 be used.
1550
1551 When -march= or .arch is used, we can't use anything beyond
1552 cpu_arch_isa_flags. */
1553
1554 if (flag_code == CODE_16BIT)
1555 {
1556 patt = f16_patt;
1557 max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1558 /* Limit number of NOPs to 2 in 16-bit mode. */
1559 max_number_of_nops = 2;
1560 }
1561 else
1562 {
1563 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1564 {
1565 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1566 switch (cpu_arch_tune)
1567 {
1568 case PROCESSOR_UNKNOWN:
1569 /* We use cpu_arch_isa_flags to check if we SHOULD
1570 optimize with nops. */
1571 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1572 patt = alt_patt;
1573 else
1574 patt = f32_patt;
1575 break;
1576 case PROCESSOR_PENTIUM4:
1577 case PROCESSOR_NOCONA:
1578 case PROCESSOR_CORE:
1579 case PROCESSOR_CORE2:
1580 case PROCESSOR_COREI7:
1581 case PROCESSOR_L1OM:
1582 case PROCESSOR_K1OM:
1583 case PROCESSOR_GENERIC64:
1584 case PROCESSOR_K6:
1585 case PROCESSOR_ATHLON:
1586 case PROCESSOR_K8:
1587 case PROCESSOR_AMDFAM10:
1588 case PROCESSOR_BD:
1589 case PROCESSOR_ZNVER:
1590 case PROCESSOR_BT:
1591 patt = alt_patt;
1592 break;
1593 case PROCESSOR_I386:
1594 case PROCESSOR_I486:
1595 case PROCESSOR_PENTIUM:
1596 case PROCESSOR_PENTIUMPRO:
1597 case PROCESSOR_IAMCU:
1598 case PROCESSOR_GENERIC32:
1599 patt = f32_patt;
1600 break;
1601 }
1602 }
1603 else
1604 {
1605 switch (fragP->tc_frag_data.tune)
1606 {
1607 case PROCESSOR_UNKNOWN:
1608 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1609 PROCESSOR_UNKNOWN. */
1610 abort ();
1611 break;
1612
1613 case PROCESSOR_I386:
1614 case PROCESSOR_I486:
1615 case PROCESSOR_PENTIUM:
1616 case PROCESSOR_IAMCU:
1617 case PROCESSOR_K6:
1618 case PROCESSOR_ATHLON:
1619 case PROCESSOR_K8:
1620 case PROCESSOR_AMDFAM10:
1621 case PROCESSOR_BD:
1622 case PROCESSOR_ZNVER:
1623 case PROCESSOR_BT:
1624 case PROCESSOR_GENERIC32:
1625 /* We use cpu_arch_isa_flags to check if we CAN optimize
1626 with nops. */
1627 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1628 patt = alt_patt;
1629 else
1630 patt = f32_patt;
1631 break;
1632 case PROCESSOR_PENTIUMPRO:
1633 case PROCESSOR_PENTIUM4:
1634 case PROCESSOR_NOCONA:
1635 case PROCESSOR_CORE:
1636 case PROCESSOR_CORE2:
1637 case PROCESSOR_COREI7:
1638 case PROCESSOR_L1OM:
1639 case PROCESSOR_K1OM:
1640 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1641 patt = alt_patt;
1642 else
1643 patt = f32_patt;
1644 break;
1645 case PROCESSOR_GENERIC64:
1646 patt = alt_patt;
1647 break;
1648 }
1649 }
1650
1651 if (patt == f32_patt)
1652 {
1653 max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1654 /* Limit number of NOPs to 2 for older processors. */
1655 max_number_of_nops = 2;
1656 }
1657 else
1658 {
1659 max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1660 /* Limit number of NOPs to 7 for newer processors. */
1661 max_number_of_nops = 7;
1662 }
1663 }
1664
1665 if (limit == 0)
1666 limit = max_single_nop_size;
1667
1668 if (fragP->fr_type == rs_fill_nop)
1669 {
1670 /* Output NOPs for .nop directive. */
1671 if (limit > max_single_nop_size)
1672 {
1673 as_bad_where (fragP->fr_file, fragP->fr_line,
1674 _("invalid single nop size: %d "
1675 "(expect within [0, %d])"),
1676 limit, max_single_nop_size);
1677 return;
1678 }
1679 }
1680 else if (fragP->fr_type != rs_machine_dependent)
1681 fragP->fr_var = count;
1682
1683 if ((count / max_single_nop_size) > max_number_of_nops)
1684 {
1685 /* Generate jump over NOPs. */
1686 offsetT disp = count - 2;
1687 if (fits_in_imm7 (disp))
1688 {
1689 /* Use "jmp disp8" if possible. */
1690 count = disp;
1691 where[0] = jump_disp8[0];
1692 where[1] = count;
1693 where += 2;
1694 }
1695 else
1696 {
1697 unsigned int size_of_jump;
1698
1699 if (flag_code == CODE_16BIT)
1700 {
1701 where[0] = jump16_disp32[0];
1702 where[1] = jump16_disp32[1];
1703 size_of_jump = 2;
1704 }
1705 else
1706 {
1707 where[0] = jump32_disp32[0];
1708 size_of_jump = 1;
1709 }
1710
1711 count -= size_of_jump + 4;
1712 if (!fits_in_imm31 (count))
1713 {
1714 as_bad_where (fragP->fr_file, fragP->fr_line,
1715 _("jump over nop padding out of range"));
1716 return;
1717 }
1718
1719 md_number_to_chars (where + size_of_jump, count, 4);
1720 where += size_of_jump + 4;
1721 }
1722 }
1723
1724 /* Generate multiple NOPs. */
1725 i386_output_nops (where, patt, count, limit);
1726 }
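/* A worked example, assuming alt_patt with limit == 11 and count == 90:
   90 / 11 > 7 triggers the jump over the padding; disp == 88 fits in
   imm7, so the 2-byte "jmp disp8" (0xeb 0x58) is emitted and the
   remaining 88 bytes are filled by i386_output_nops().  */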
1727
1728 static INLINE int
1729 operand_type_all_zero (const union i386_operand_type *x)
1730 {
1731 switch (ARRAY_SIZE(x->array))
1732 {
1733 case 3:
1734 if (x->array[2])
1735 return 0;
1736 /* Fall through. */
1737 case 2:
1738 if (x->array[1])
1739 return 0;
1740 /* Fall through. */
1741 case 1:
1742 return !x->array[0];
1743 default:
1744 abort ();
1745 }
1746 }
1747
1748 static INLINE void
1749 operand_type_set (union i386_operand_type *x, unsigned int v)
1750 {
1751 switch (ARRAY_SIZE(x->array))
1752 {
1753 case 3:
1754 x->array[2] = v;
1755 /* Fall through. */
1756 case 2:
1757 x->array[1] = v;
1758 /* Fall through. */
1759 case 1:
1760 x->array[0] = v;
1762 break;
1763 default:
1764 abort ();
1765 }
1766
1767 x->bitfield.class = ClassNone;
1768 x->bitfield.instance = InstanceNone;
1769 }
1770
1771 static INLINE int
1772 operand_type_equal (const union i386_operand_type *x,
1773 const union i386_operand_type *y)
1774 {
1775 switch (ARRAY_SIZE(x->array))
1776 {
1777 case 3:
1778 if (x->array[2] != y->array[2])
1779 return 0;
1780 /* Fall through. */
1781 case 2:
1782 if (x->array[1] != y->array[1])
1783 return 0;
1784 /* Fall through. */
1785 case 1:
1786 return x->array[0] == y->array[0];
1788 default:
1789 abort ();
1790 }
1791 }
1792
1793 static INLINE int
1794 cpu_flags_all_zero (const union i386_cpu_flags *x)
1795 {
1796 switch (ARRAY_SIZE(x->array))
1797 {
1798 case 4:
1799 if (x->array[3])
1800 return 0;
1801 /* Fall through. */
1802 case 3:
1803 if (x->array[2])
1804 return 0;
1805 /* Fall through. */
1806 case 2:
1807 if (x->array[1])
1808 return 0;
1809 /* Fall through. */
1810 case 1:
1811 return !x->array[0];
1812 default:
1813 abort ();
1814 }
1815 }
1816
1817 static INLINE int
1818 cpu_flags_equal (const union i386_cpu_flags *x,
1819 const union i386_cpu_flags *y)
1820 {
1821 switch (ARRAY_SIZE(x->array))
1822 {
1823 case 4:
1824 if (x->array[3] != y->array[3])
1825 return 0;
1826 /* Fall through. */
1827 case 3:
1828 if (x->array[2] != y->array[2])
1829 return 0;
1830 /* Fall through. */
1831 case 2:
1832 if (x->array[1] != y->array[1])
1833 return 0;
1834 /* Fall through. */
1835 case 1:
1836 return x->array[0] == y->array[0];
1838 default:
1839 abort ();
1840 }
1841 }
1842
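/* Return 1 if the CPU flags F are compatible with the current code
size: templates marked CpuNo64 are rejected in 64-bit mode, and
templates marked Cpu64 are rejected outside of it. */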
1843 static INLINE int
1844 cpu_flags_check_cpu64 (i386_cpu_flags f)
1845 {
1846 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1847 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1848 }
1849
1850 static INLINE i386_cpu_flags
1851 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1852 {
1853 switch (ARRAY_SIZE (x.array))
1854 {
1855 case 4:
1856 x.array [3] &= y.array [3];
1857 /* Fall through. */
1858 case 3:
1859 x.array [2] &= y.array [2];
1860 /* Fall through. */
1861 case 2:
1862 x.array [1] &= y.array [1];
1863 /* Fall through. */
1864 case 1:
1865 x.array [0] &= y.array [0];
1866 break;
1867 default:
1868 abort ();
1869 }
1870 return x;
1871 }
1872
1873 static INLINE i386_cpu_flags
1874 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1875 {
1876 switch (ARRAY_SIZE (x.array))
1877 {
1878 case 4:
1879 x.array [3] |= y.array [3];
1880 /* Fall through. */
1881 case 3:
1882 x.array [2] |= y.array [2];
1883 /* Fall through. */
1884 case 2:
1885 x.array [1] |= y.array [1];
1886 /* Fall through. */
1887 case 1:
1888 x.array [0] |= y.array [0];
1889 break;
1890 default:
1891 abort ();
1892 }
1893 return x;
1894 }
1895
1896 static INLINE i386_cpu_flags
1897 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1898 {
1899 switch (ARRAY_SIZE (x.array))
1900 {
1901 case 4:
1902 x.array [3] &= ~y.array [3];
1903 /* Fall through. */
1904 case 3:
1905 x.array [2] &= ~y.array [2];
1906 /* Fall through. */
1907 case 2:
1908 x.array [1] &= ~y.array [1];
1909 /* Fall through. */
1910 case 1:
1911 x.array [0] &= ~y.array [0];
1912 break;
1913 default:
1914 abort ();
1915 }
1916 return x;
1917 }
1918
1919 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
1920
1921 #define CPU_FLAGS_ARCH_MATCH 0x1
1922 #define CPU_FLAGS_64BIT_MATCH 0x2
1923
1924 #define CPU_FLAGS_PERFECT_MATCH \
1925 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1926
1927 /* Return CPU flags match bits. */
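/* CPU_FLAGS_64BIT_MATCH means the template is usable with the current
code size (see cpu_flags_check_cpu64); CPU_FLAGS_ARCH_MATCH means
the enabled ISA extensions satisfy the template's CPU requirements.
A perfect match sets both bits. */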
1928
1929 static int
1930 cpu_flags_match (const insn_template *t)
1931 {
1932 i386_cpu_flags x = t->cpu_flags;
1933 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1934
1935 x.bitfield.cpu64 = 0;
1936 x.bitfield.cpuno64 = 0;
1937
1938 if (cpu_flags_all_zero (&x))
1939 {
1940 /* This instruction is available on all archs. */
1941 match |= CPU_FLAGS_ARCH_MATCH;
1942 }
1943 else
1944 {
1945 /* This instruction is available only on some archs. */
1946 i386_cpu_flags cpu = cpu_arch_flags;
1947
1948 /* AVX512VL is not a standalone feature; match it and then strip it. */
1949 if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1950 return match;
1951 x.bitfield.cpuavx512vl = 0;
1952
1953 cpu = cpu_flags_and (x, cpu);
1954 if (!cpu_flags_all_zero (&cpu))
1955 {
1956 if (x.bitfield.cpuavx)
1957 {
1958 /* We need to check a few extra flags with AVX. */
1959 if (cpu.bitfield.cpuavx
1960 && (!t->opcode_modifier.sse2avx
1961 || (sse2avx && !i.prefix[DATA_PREFIX]))
1962 && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1963 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1964 && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1965 match |= CPU_FLAGS_ARCH_MATCH;
1966 }
1967 else if (x.bitfield.cpuavx512f)
1968 {
1969 /* We need to check a few extra flags with AVX512F. */
1970 if (cpu.bitfield.cpuavx512f
1971 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1972 && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1973 && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1974 match |= CPU_FLAGS_ARCH_MATCH;
1975 }
1976 else
1977 match |= CPU_FLAGS_ARCH_MATCH;
1978 }
1979 }
1980 return match;
1981 }
1982
1983 static INLINE i386_operand_type
1984 operand_type_and (i386_operand_type x, i386_operand_type y)
1985 {
1986 if (x.bitfield.class != y.bitfield.class)
1987 x.bitfield.class = ClassNone;
1988 if (x.bitfield.instance != y.bitfield.instance)
1989 x.bitfield.instance = InstanceNone;
1990
1991 switch (ARRAY_SIZE (x.array))
1992 {
1993 case 3:
1994 x.array [2] &= y.array [2];
1995 /* Fall through. */
1996 case 2:
1997 x.array [1] &= y.array [1];
1998 /* Fall through. */
1999 case 1:
2000 x.array [0] &= y.array [0];
2001 break;
2002 default:
2003 abort ();
2004 }
2005 return x;
2006 }
2007
2008 static INLINE i386_operand_type
2009 operand_type_and_not (i386_operand_type x, i386_operand_type y)
2010 {
2011 gas_assert (y.bitfield.class == ClassNone);
2012 gas_assert (y.bitfield.instance == InstanceNone);
2013
2014 switch (ARRAY_SIZE (x.array))
2015 {
2016 case 3:
2017 x.array [2] &= ~y.array [2];
2018 /* Fall through. */
2019 case 2:
2020 x.array [1] &= ~y.array [1];
2021 /* Fall through. */
2022 case 1:
2023 x.array [0] &= ~y.array [0];
2024 break;
2025 default:
2026 abort ();
2027 }
2028 return x;
2029 }
2030
2031 static INLINE i386_operand_type
2032 operand_type_or (i386_operand_type x, i386_operand_type y)
2033 {
2034 gas_assert (x.bitfield.class == ClassNone ||
2035 y.bitfield.class == ClassNone ||
2036 x.bitfield.class == y.bitfield.class);
2037 gas_assert (x.bitfield.instance == InstanceNone ||
2038 y.bitfield.instance == InstanceNone ||
2039 x.bitfield.instance == y.bitfield.instance);
2040
2041 switch (ARRAY_SIZE (x.array))
2042 {
2043 case 3:
2044 x.array [2] |= y.array [2];
2045 /* Fall through. */
2046 case 2:
2047 x.array [1] |= y.array [1];
2048 /* Fall through. */
2049 case 1:
2050 x.array [0] |= y.array [0];
2051 break;
2052 default:
2053 abort ();
2054 }
2055 return x;
2056 }
2057
2058 static INLINE i386_operand_type
2059 operand_type_xor (i386_operand_type x, i386_operand_type y)
2060 {
2061 gas_assert (y.bitfield.class == ClassNone);
2062 gas_assert (y.bitfield.instance == InstanceNone);
2063
2064 switch (ARRAY_SIZE (x.array))
2065 {
2066 case 3:
2067 x.array [2] ^= y.array [2];
2068 /* Fall through. */
2069 case 2:
2070 x.array [1] ^= y.array [1];
2071 /* Fall through. */
2072 case 1:
2073 x.array [0] ^= y.array [0];
2074 break;
2075 default:
2076 abort ();
2077 }
2078 return x;
2079 }
2080
2081 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
2082 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
2083 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
2084 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
2085 static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
2086 static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
2087 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
2088 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
2089 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
2090 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
2091 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
2092 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
2093 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
2094 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
2095 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
2096 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
2097 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
2098
2099 enum operand_type
2100 {
2101 reg,
2102 imm,
2103 disp,
2104 anymem
2105 };
2106
2107 static INLINE int
2108 operand_type_check (i386_operand_type t, enum operand_type c)
2109 {
2110 switch (c)
2111 {
2112 case reg:
2113 return t.bitfield.class == Reg;
2114
2115 case imm:
2116 return (t.bitfield.imm8
2117 || t.bitfield.imm8s
2118 || t.bitfield.imm16
2119 || t.bitfield.imm32
2120 || t.bitfield.imm32s
2121 || t.bitfield.imm64);
2122
2123 case disp:
2124 return (t.bitfield.disp8
2125 || t.bitfield.disp16
2126 || t.bitfield.disp32
2127 || t.bitfield.disp32s
2128 || t.bitfield.disp64);
2129
2130 case anymem:
2131 return (t.bitfield.disp8
2132 || t.bitfield.disp16
2133 || t.bitfield.disp32
2134 || t.bitfield.disp32s
2135 || t.bitfield.disp64
2136 || t.bitfield.baseindex);
2137
2138 default:
2139 abort ();
2140 }
2141
2142 return 0;
2143 }
2144
2145 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2146 between operand GIVEN and operand WANTED for instruction template T. */
2147
2148 static INLINE int
2149 match_operand_size (const insn_template *t, unsigned int wanted,
2150 unsigned int given)
2151 {
2152 return !((i.types[given].bitfield.byte
2153 && !t->operand_types[wanted].bitfield.byte)
2154 || (i.types[given].bitfield.word
2155 && !t->operand_types[wanted].bitfield.word)
2156 || (i.types[given].bitfield.dword
2157 && !t->operand_types[wanted].bitfield.dword)
2158 || (i.types[given].bitfield.qword
2159 && !t->operand_types[wanted].bitfield.qword)
2160 || (i.types[given].bitfield.tbyte
2161 && !t->operand_types[wanted].bitfield.tbyte));
2162 }
2163
2164 /* Return 1 if there is no conflict in SIMD register between operand
2165 GIVEN and operand WANTED for instruction template T. */
2166
2167 static INLINE int
2168 match_simd_size (const insn_template *t, unsigned int wanted,
2169 unsigned int given)
2170 {
2171 return !((i.types[given].bitfield.xmmword
2172 && !t->operand_types[wanted].bitfield.xmmword)
2173 || (i.types[given].bitfield.ymmword
2174 && !t->operand_types[wanted].bitfield.ymmword)
2175 || (i.types[given].bitfield.zmmword
2176 && !t->operand_types[wanted].bitfield.zmmword)
2177 || (i.types[given].bitfield.tmmword
2178 && !t->operand_types[wanted].bitfield.tmmword));
2179 }
2180
2181 /* Return 1 if there is no conflict in any size between operand GIVEN
2182 and operand WANTED for instruction template T. */
2183
2184 static INLINE int
2185 match_mem_size (const insn_template *t, unsigned int wanted,
2186 unsigned int given)
2187 {
2188 return (match_operand_size (t, wanted, given)
2189 && !((i.types[given].bitfield.unspecified
2190 && !i.broadcast
2191 && !t->operand_types[wanted].bitfield.unspecified)
2192 || (i.types[given].bitfield.fword
2193 && !t->operand_types[wanted].bitfield.fword)
2194 /* For scalar opcode templates to allow register and memory
2195 operands at the same time, some special casing is needed
2196 here. Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2197 down-conversion vpmov*. */
2198 || ((t->operand_types[wanted].bitfield.class == RegSIMD
2199 && t->operand_types[wanted].bitfield.byte
2200 + t->operand_types[wanted].bitfield.word
2201 + t->operand_types[wanted].bitfield.dword
2202 + t->operand_types[wanted].bitfield.qword
2203 > !!t->opcode_modifier.broadcast)
2204 ? (i.types[given].bitfield.xmmword
2205 || i.types[given].bitfield.ymmword
2206 || i.types[given].bitfield.zmmword)
2207 : !match_simd_size (t, wanted, given))));
2208 }
2209
2210 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2211 operands for instruction template T, and it has MATCH_REVERSE set if there
2212 is no size conflict on any operands for the template with operands reversed
2213 (and the template allows for reversing in the first place). */
2214
2215 #define MATCH_STRAIGHT 1
2216 #define MATCH_REVERSE 2
2217
2218 static INLINE unsigned int
2219 operand_size_match (const insn_template *t)
2220 {
2221 unsigned int j, match = MATCH_STRAIGHT;
2222
2223 /* Don't check non-absolute jump instructions. */
2224 if (t->opcode_modifier.jump
2225 && t->opcode_modifier.jump != JUMP_ABSOLUTE)
2226 return match;
2227
2228 /* Check memory and accumulator operand size. */
2229 for (j = 0; j < i.operands; j++)
2230 {
2231 if (i.types[j].bitfield.class != Reg
2232 && i.types[j].bitfield.class != RegSIMD
2233 && t->opcode_modifier.anysize)
2234 continue;
2235
2236 if (t->operand_types[j].bitfield.class == Reg
2237 && !match_operand_size (t, j, j))
2238 {
2239 match = 0;
2240 break;
2241 }
2242
2243 if (t->operand_types[j].bitfield.class == RegSIMD
2244 && !match_simd_size (t, j, j))
2245 {
2246 match = 0;
2247 break;
2248 }
2249
2250 if (t->operand_types[j].bitfield.instance == Accum
2251 && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2252 {
2253 match = 0;
2254 break;
2255 }
2256
2257 if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2258 {
2259 match = 0;
2260 break;
2261 }
2262 }
2263
2264 if (!t->opcode_modifier.d)
2265 {
2266 mismatch:
2267 if (!match)
2268 i.error = operand_size_mismatch;
2269 return match;
2270 }
2271
2272 /* Check reverse. */
2273 gas_assert (i.operands >= 2 && i.operands <= 3);
2274
2275 for (j = 0; j < i.operands; j++)
2276 {
2277 unsigned int given = i.operands - j - 1;
2278
2279 if (t->operand_types[j].bitfield.class == Reg
2280 && !match_operand_size (t, j, given))
2281 goto mismatch;
2282
2283 if (t->operand_types[j].bitfield.class == RegSIMD
2284 && !match_simd_size (t, j, given))
2285 goto mismatch;
2286
2287 if (t->operand_types[j].bitfield.instance == Accum
2288 && (!match_operand_size (t, j, given)
2289 || !match_simd_size (t, j, given)))
2290 goto mismatch;
2291
2292 if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2293 goto mismatch;
2294 }
2295
2296 return match | MATCH_REVERSE;
2297 }
2298
2299 static INLINE int
2300 operand_type_match (i386_operand_type overlap,
2301 i386_operand_type given)
2302 {
2303 i386_operand_type temp = overlap;
2304
2305 temp.bitfield.unspecified = 0;
2306 temp.bitfield.byte = 0;
2307 temp.bitfield.word = 0;
2308 temp.bitfield.dword = 0;
2309 temp.bitfield.fword = 0;
2310 temp.bitfield.qword = 0;
2311 temp.bitfield.tbyte = 0;
2312 temp.bitfield.xmmword = 0;
2313 temp.bitfield.ymmword = 0;
2314 temp.bitfield.zmmword = 0;
2315 temp.bitfield.tmmword = 0;
2316 if (operand_type_all_zero (&temp))
2317 goto mismatch;
2318
2319 if (given.bitfield.baseindex == overlap.bitfield.baseindex)
2320 return 1;
2321
2322 mismatch:
2323 i.error = operand_type_mismatch;
2324 return 0;
2325 }
2326
2327 /* If given types g0 and g1 are registers they must be of the same type
2328 unless the expected operand type register overlap is null.
2329 Some Intel syntax memory operand size checking also happens here. */
2330
2331 static INLINE int
2332 operand_type_register_match (i386_operand_type g0,
2333 i386_operand_type t0,
2334 i386_operand_type g1,
2335 i386_operand_type t1)
2336 {
2337 if (g0.bitfield.class != Reg
2338 && g0.bitfield.class != RegSIMD
2339 && (!operand_type_check (g0, anymem)
2340 || g0.bitfield.unspecified
2341 || (t0.bitfield.class != Reg
2342 && t0.bitfield.class != RegSIMD)))
2343 return 1;
2344
2345 if (g1.bitfield.class != Reg
2346 && g1.bitfield.class != RegSIMD
2347 && (!operand_type_check (g1, anymem)
2348 || g1.bitfield.unspecified
2349 || (t1.bitfield.class != Reg
2350 && t1.bitfield.class != RegSIMD)))
2351 return 1;
2352
2353 if (g0.bitfield.byte == g1.bitfield.byte
2354 && g0.bitfield.word == g1.bitfield.word
2355 && g0.bitfield.dword == g1.bitfield.dword
2356 && g0.bitfield.qword == g1.bitfield.qword
2357 && g0.bitfield.xmmword == g1.bitfield.xmmword
2358 && g0.bitfield.ymmword == g1.bitfield.ymmword
2359 && g0.bitfield.zmmword == g1.bitfield.zmmword)
2360 return 1;
2361
2362 if (!(t0.bitfield.byte & t1.bitfield.byte)
2363 && !(t0.bitfield.word & t1.bitfield.word)
2364 && !(t0.bitfield.dword & t1.bitfield.dword)
2365 && !(t0.bitfield.qword & t1.bitfield.qword)
2366 && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2367 && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2368 && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2369 return 1;
2370
2371 i.error = register_type_mismatch;
2372
2373 return 0;
2374 }
2375
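/* Return the encoded number of register R, folding in the REX
(RegRex, +8) and EVEX (RegVRex, +16) extension bits, giving the
full 0-31 range used by EVEX encodings. */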
2376 static INLINE unsigned int
2377 register_number (const reg_entry *r)
2378 {
2379 unsigned int nr = r->reg_num;
2380
2381 if (r->reg_flags & RegRex)
2382 nr += 8;
2383
2384 if (r->reg_flags & RegVRex)
2385 nr += 16;
2386
2387 return nr;
2388 }
2389
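/* Return the ModRM.mod value implied by the displacement bits of T:
1 for an 8-bit displacement, 2 for a 16- or 32-bit one, and 0 when
no displacement is present. */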
2390 static INLINE unsigned int
2391 mode_from_disp_size (i386_operand_type t)
2392 {
2393 if (t.bitfield.disp8)
2394 return 1;
2395 else if (t.bitfield.disp16
2396 || t.bitfield.disp32
2397 || t.bitfield.disp32s)
2398 return 2;
2399 else
2400 return 0;
2401 }
2402
2403 static INLINE int
2404 fits_in_signed_byte (addressT num)
2405 {
2406 return num + 0x80 <= 0xff;
2407 }
2408
2409 static INLINE int
2410 fits_in_unsigned_byte (addressT num)
2411 {
2412 return num <= 0xff;
2413 }
2414
2415 static INLINE int
2416 fits_in_unsigned_word (addressT num)
2417 {
2418 return num <= 0xffff;
2419 }
2420
2421 static INLINE int
2422 fits_in_signed_word (addressT num)
2423 {
2424 return num + 0x8000 <= 0xffff;
2425 }
2426
2427 static INLINE int
2428 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2429 {
2430 #ifndef BFD64
2431 return 1;
2432 #else
2433 return num + 0x80000000 <= 0xffffffff;
2434 #endif
2435 } /* fits_in_signed_long() */
2436
2437 static INLINE int
2438 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2439 {
2440 #ifndef BFD64
2441 return 1;
2442 #else
2443 return num <= 0xffffffff;
2444 #endif
2445 } /* fits_in_unsigned_long() */
2446
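/* fits_in_disp8 below implements the AVX512 compressed displacement
(disp8*N): with i.memshift == N, the encoded byte is NUM >> N, so
NUM must be a multiple of 1 << N and the shifted value must fit in
a signed byte. E.g. (hypothetical operand) with memshift 6, as for
a full 64-byte ZMM memory operand, 0x1000 encodes as disp8 0x40. */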
2447 static INLINE int
2448 fits_in_disp8 (offsetT num)
2449 {
2450 int shift = i.memshift;
2451 unsigned int mask;
2452
2453 if (shift == -1)
2454 abort ();
2455
2456 mask = (1 << shift) - 1;
2457
2458 /* Return 0 if NUM isn't properly aligned. */
2459 if ((num & mask))
2460 return 0;
2461
2462 /* Check whether NUM fits in 8 bits after the shift. */
2463 return fits_in_signed_byte (num >> shift);
2464 }
2465
2466 static INLINE int
2467 fits_in_imm4 (offsetT num)
2468 {
2469 return (num & 0xf) == num;
2470 }
2471
2472 static i386_operand_type
2473 smallest_imm_type (offsetT num)
2474 {
2475 i386_operand_type t;
2476
2477 operand_type_set (&t, 0);
2478 t.bitfield.imm64 = 1;
2479
2480 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2481 {
2482 /* This code is disabled on the 486 because all the Imm1 forms
2483 in the opcode table are slower on the i486. They're the
2484 versions with the implicitly specified single-position
2485 displacement, which has another syntax if you really want to
2486 use that form. */
2487 t.bitfield.imm1 = 1;
2488 t.bitfield.imm8 = 1;
2489 t.bitfield.imm8s = 1;
2490 t.bitfield.imm16 = 1;
2491 t.bitfield.imm32 = 1;
2492 t.bitfield.imm32s = 1;
2493 }
2494 else if (fits_in_signed_byte (num))
2495 {
2496 t.bitfield.imm8 = 1;
2497 t.bitfield.imm8s = 1;
2498 t.bitfield.imm16 = 1;
2499 t.bitfield.imm32 = 1;
2500 t.bitfield.imm32s = 1;
2501 }
2502 else if (fits_in_unsigned_byte (num))
2503 {
2504 t.bitfield.imm8 = 1;
2505 t.bitfield.imm16 = 1;
2506 t.bitfield.imm32 = 1;
2507 t.bitfield.imm32s = 1;
2508 }
2509 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2510 {
2511 t.bitfield.imm16 = 1;
2512 t.bitfield.imm32 = 1;
2513 t.bitfield.imm32s = 1;
2514 }
2515 else if (fits_in_signed_long (num))
2516 {
2517 t.bitfield.imm32 = 1;
2518 t.bitfield.imm32s = 1;
2519 }
2520 else if (fits_in_unsigned_long (num))
2521 t.bitfield.imm32 = 1;
2522
2523 return t;
2524 }
2525
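/* Truncate VAL to a SIZE-byte field, warning when significant bits
are lost. VAL passes unremarked when the discarded high bits are
all zero or all one (i.e. a sign extension). The wider masks are
written as ((addressT) 2 << (bits - 1)) - 1 so the shift count
never reaches the width of addressT, which would be undefined. */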
2526 static offsetT
2527 offset_in_range (offsetT val, int size)
2528 {
2529 addressT mask;
2530
2531 switch (size)
2532 {
2533 case 1: mask = ((addressT) 1 << 8) - 1; break;
2534 case 2: mask = ((addressT) 1 << 16) - 1; break;
2535 case 4: mask = ((addressT) 2 << 31) - 1; break;
2536 #ifdef BFD64
2537 case 8: mask = ((addressT) 2 << 63) - 1; break;
2538 #endif
2539 default: abort ();
2540 }
2541
2542 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2543 {
2544 char buf1[40], buf2[40];
2545
2546 sprint_value (buf1, val);
2547 sprint_value (buf2, val & mask);
2548 as_warn (_("%s shortened to %s"), buf1, buf2);
2549 }
2550 return val & mask;
2551 }
2552
2553 enum PREFIX_GROUP
2554 {
2555 PREFIX_EXIST = 0,
2556 PREFIX_LOCK,
2557 PREFIX_REP,
2558 PREFIX_DS,
2559 PREFIX_OTHER
2560 };
2561
2562 /* Returns
2563 a. PREFIX_EXIST if attempting to add a prefix where one from the
2564 same class already exists.
2565 b. PREFIX_LOCK if lock prefix is added.
2566 c. PREFIX_REP if rep/repne prefix is added.
2567 d. PREFIX_DS if ds prefix is added.
2568 e. PREFIX_OTHER if other prefix is added.
2569 */
2570
2571 static enum PREFIX_GROUP
2572 add_prefix (unsigned int prefix)
2573 {
2574 enum PREFIX_GROUP ret = PREFIX_OTHER;
2575 unsigned int q;
2576
2577 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2578 && flag_code == CODE_64BIT)
2579 {
2580 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2581 || (i.prefix[REX_PREFIX] & prefix & REX_R)
2582 || (i.prefix[REX_PREFIX] & prefix & REX_X)
2583 || (i.prefix[REX_PREFIX] & prefix & REX_B))
2584 ret = PREFIX_EXIST;
2585 q = REX_PREFIX;
2586 }
2587 else
2588 {
2589 switch (prefix)
2590 {
2591 default:
2592 abort ();
2593
2594 case DS_PREFIX_OPCODE:
2595 ret = PREFIX_DS;
2596 /* Fall through. */
2597 case CS_PREFIX_OPCODE:
2598 case ES_PREFIX_OPCODE:
2599 case FS_PREFIX_OPCODE:
2600 case GS_PREFIX_OPCODE:
2601 case SS_PREFIX_OPCODE:
2602 q = SEG_PREFIX;
2603 break;
2604
2605 case REPNE_PREFIX_OPCODE:
2606 case REPE_PREFIX_OPCODE:
2607 q = REP_PREFIX;
2608 ret = PREFIX_REP;
2609 break;
2610
2611 case LOCK_PREFIX_OPCODE:
2612 q = LOCK_PREFIX;
2613 ret = PREFIX_LOCK;
2614 break;
2615
2616 case FWAIT_OPCODE:
2617 q = WAIT_PREFIX;
2618 break;
2619
2620 case ADDR_PREFIX_OPCODE:
2621 q = ADDR_PREFIX;
2622 break;
2623
2624 case DATA_PREFIX_OPCODE:
2625 q = DATA_PREFIX;
2626 break;
2627 }
2628 if (i.prefix[q] != 0)
2629 ret = PREFIX_EXIST;
2630 }
2631
2632 if (ret)
2633 {
2634 if (!i.prefix[q])
2635 ++i.prefixes;
2636 i.prefix[q] |= prefix;
2637 }
2638 else
2639 as_bad (_("same type of prefix used twice"));
2640
2641 return ret;
2642 }
2643
2644 static void
2645 update_code_flag (int value, int check)
2646 {
2647 PRINTF_LIKE ((*as_error));
2648
2649 flag_code = (enum flag_code) value;
2650 if (flag_code == CODE_64BIT)
2651 {
2652 cpu_arch_flags.bitfield.cpu64 = 1;
2653 cpu_arch_flags.bitfield.cpuno64 = 0;
2654 }
2655 else
2656 {
2657 cpu_arch_flags.bitfield.cpu64 = 0;
2658 cpu_arch_flags.bitfield.cpuno64 = 1;
2659 }
2660 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm)
2661 {
2662 if (check)
2663 as_error = as_fatal;
2664 else
2665 as_error = as_bad;
2666 (*as_error) (_("64bit mode not supported on `%s'."),
2667 cpu_arch_name ? cpu_arch_name : default_arch);
2668 }
2669 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2670 {
2671 if (check)
2672 as_error = as_fatal;
2673 else
2674 as_error = as_bad;
2675 (*as_error) (_("32bit mode not supported on `%s'."),
2676 cpu_arch_name ? cpu_arch_name : default_arch);
2677 }
2678 stackop_size = '\0';
2679 }
2680
2681 static void
2682 set_code_flag (int value)
2683 {
2684 update_code_flag (value, 0);
2685 }
2686
2687 static void
2688 set_16bit_gcc_code_flag (int new_code_flag)
2689 {
2690 flag_code = (enum flag_code) new_code_flag;
2691 if (flag_code != CODE_16BIT)
2692 abort ();
2693 cpu_arch_flags.bitfield.cpu64 = 0;
2694 cpu_arch_flags.bitfield.cpuno64 = 1;
2695 stackop_size = LONG_MNEM_SUFFIX;
2696 }
2697
2698 static void
2699 set_intel_syntax (int syntax_flag)
2700 {
2701 /* Find out if register prefixing is specified. */
2702 int ask_naked_reg = 0;
2703
2704 SKIP_WHITESPACE ();
2705 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2706 {
2707 char *string;
2708 int e = get_symbol_name (&string);
2709
2710 if (strcmp (string, "prefix") == 0)
2711 ask_naked_reg = 1;
2712 else if (strcmp (string, "noprefix") == 0)
2713 ask_naked_reg = -1;
2714 else
2715 as_bad (_("bad argument to syntax directive."));
2716 (void) restore_line_pointer (e);
2717 }
2718 demand_empty_rest_of_line ();
2719
2720 intel_syntax = syntax_flag;
2721
2722 if (ask_naked_reg == 0)
2723 allow_naked_reg = (intel_syntax
2724 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2725 else
2726 allow_naked_reg = (ask_naked_reg < 0);
2727
2728 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2729
2730 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2731 identifier_chars['$'] = intel_syntax ? '$' : 0;
2732 register_prefix = allow_naked_reg ? "" : "%";
2733 }
2734
2735 static void
2736 set_intel_mnemonic (int mnemonic_flag)
2737 {
2738 intel_mnemonic = mnemonic_flag;
2739 }
2740
2741 static void
2742 set_allow_index_reg (int flag)
2743 {
2744 allow_index_reg = flag;
2745 }
2746
2747 static void
2748 set_check (int what)
2749 {
2750 enum check_kind *kind;
2751 const char *str;
2752
2753 if (what)
2754 {
2755 kind = &operand_check;
2756 str = "operand";
2757 }
2758 else
2759 {
2760 kind = &sse_check;
2761 str = "sse";
2762 }
2763
2764 SKIP_WHITESPACE ();
2765
2766 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2767 {
2768 char *string;
2769 int e = get_symbol_name (&string);
2770
2771 if (strcmp (string, "none") == 0)
2772 *kind = check_none;
2773 else if (strcmp (string, "warning") == 0)
2774 *kind = check_warning;
2775 else if (strcmp (string, "error") == 0)
2776 *kind = check_error;
2777 else
2778 as_bad (_("bad argument to %s_check directive."), str);
2779 (void) restore_line_pointer (e);
2780 }
2781 else
2782 as_bad (_("missing argument for %s_check directive"), str);
2783
2784 demand_empty_rest_of_line ();
2785 }
2786
2787 static void
2788 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2789 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2790 {
2791 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2792 static const char *arch;
2793
2794 /* Intel MCU, L1OM, and K1OM are supported only on ELF. */
2795 if (!IS_ELF)
2796 return;
2797
2798 if (!arch)
2799 {
2800 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2801 use default_arch. */
2802 arch = cpu_arch_name;
2803 if (!arch)
2804 arch = default_arch;
2805 }
2806
2807 /* If we are targeting Intel MCU, we must enable it. */
2808 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2809 || new_flag.bitfield.cpuiamcu)
2810 return;
2811
2812 /* If we are targeting Intel L1OM, we must enable it. */
2813 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2814 || new_flag.bitfield.cpul1om)
2815 return;
2816
2817 /* If we are targeting Intel K1OM, we must enable it. */
2818 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2819 || new_flag.bitfield.cpuk1om)
2820 return;
2821
2822 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2823 #endif
2824 }
2825
2826 static void
2827 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2828 {
2829 SKIP_WHITESPACE ();
2830
2831 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2832 {
2833 char *string;
2834 int e = get_symbol_name (&string);
2835 unsigned int j;
2836 i386_cpu_flags flags;
2837
2838 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2839 {
2840 if (strcmp (string, cpu_arch[j].name) == 0)
2841 {
2842 check_cpu_arch_compatible (string, cpu_arch[j].flags);
2843
2844 if (*string != '.')
2845 {
2846 cpu_arch_name = cpu_arch[j].name;
2847 cpu_sub_arch_name = NULL;
2848 cpu_arch_flags = cpu_arch[j].flags;
2849 if (flag_code == CODE_64BIT)
2850 {
2851 cpu_arch_flags.bitfield.cpu64 = 1;
2852 cpu_arch_flags.bitfield.cpuno64 = 0;
2853 }
2854 else
2855 {
2856 cpu_arch_flags.bitfield.cpu64 = 0;
2857 cpu_arch_flags.bitfield.cpuno64 = 1;
2858 }
2859 cpu_arch_isa = cpu_arch[j].type;
2860 cpu_arch_isa_flags = cpu_arch[j].flags;
2861 if (!cpu_arch_tune_set)
2862 {
2863 cpu_arch_tune = cpu_arch_isa;
2864 cpu_arch_tune_flags = cpu_arch_isa_flags;
2865 }
2866 break;
2867 }
2868
2869 flags = cpu_flags_or (cpu_arch_flags,
2870 cpu_arch[j].flags);
2871
2872 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2873 {
2874 if (cpu_sub_arch_name)
2875 {
2876 char *name = cpu_sub_arch_name;
2877 cpu_sub_arch_name = concat (name,
2878 cpu_arch[j].name,
2879 (const char *) NULL);
2880 free (name);
2881 }
2882 else
2883 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2884 cpu_arch_flags = flags;
2885 cpu_arch_isa_flags = flags;
2886 }
2887 else
2888 cpu_arch_isa_flags
2889 = cpu_flags_or (cpu_arch_isa_flags,
2890 cpu_arch[j].flags);
2891 (void) restore_line_pointer (e);
2892 demand_empty_rest_of_line ();
2893 return;
2894 }
2895 }
2896
2897 if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2898 {
2899 /* Disable an ISA extension. */
2900 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2901 if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2902 {
2903 flags = cpu_flags_and_not (cpu_arch_flags,
2904 cpu_noarch[j].flags);
2905 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2906 {
2907 if (cpu_sub_arch_name)
2908 {
2909 char *name = cpu_sub_arch_name;
2910 cpu_sub_arch_name = concat (name, string,
2911 (const char *) NULL);
2912 free (name);
2913 }
2914 else
2915 cpu_sub_arch_name = xstrdup (string);
2916 cpu_arch_flags = flags;
2917 cpu_arch_isa_flags = flags;
2918 }
2919 (void) restore_line_pointer (e);
2920 demand_empty_rest_of_line ();
2921 return;
2922 }
2923
2924 j = ARRAY_SIZE (cpu_arch);
2925 }
2926
2927 if (j >= ARRAY_SIZE (cpu_arch))
2928 as_bad (_("no such architecture: `%s'"), string);
2929
2930 *input_line_pointer = e;
2931 }
2932 else
2933 as_bad (_("missing cpu architecture"));
2934
2935 no_cond_jump_promotion = 0;
2936 if (*input_line_pointer == ','
2937 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2938 {
2939 char *string;
2940 char e;
2941
2942 ++input_line_pointer;
2943 e = get_symbol_name (&string);
2944
2945 if (strcmp (string, "nojumps") == 0)
2946 no_cond_jump_promotion = 1;
2947 else if (strcmp (string, "jumps") == 0)
2948 ;
2949 else
2950 as_bad (_("no such architecture modifier: `%s'"), string);
2951
2952 (void) restore_line_pointer (e);
2953 }
2954
2955 demand_empty_rest_of_line ();
2956 }
2957
2958 enum bfd_architecture
2959 i386_arch (void)
2960 {
2961 if (cpu_arch_isa == PROCESSOR_L1OM)
2962 {
2963 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2964 || flag_code != CODE_64BIT)
2965 as_fatal (_("Intel L1OM is 64bit ELF only"));
2966 return bfd_arch_l1om;
2967 }
2968 else if (cpu_arch_isa == PROCESSOR_K1OM)
2969 {
2970 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2971 || flag_code != CODE_64BIT)
2972 as_fatal (_("Intel K1OM is 64bit ELF only"));
2973 return bfd_arch_k1om;
2974 }
2975 else if (cpu_arch_isa == PROCESSOR_IAMCU)
2976 {
2977 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2978 || flag_code == CODE_64BIT)
2979 as_fatal (_("Intel MCU is 32bit ELF only"));
2980 return bfd_arch_iamcu;
2981 }
2982 else
2983 return bfd_arch_i386;
2984 }
2985
2986 unsigned long
2987 i386_mach (void)
2988 {
2989 if (!strncmp (default_arch, "x86_64", 6))
2990 {
2991 if (cpu_arch_isa == PROCESSOR_L1OM)
2992 {
2993 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2994 || default_arch[6] != '\0')
2995 as_fatal (_("Intel L1OM is 64bit ELF only"));
2996 return bfd_mach_l1om;
2997 }
2998 else if (cpu_arch_isa == PROCESSOR_K1OM)
2999 {
3000 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
3001 || default_arch[6] != '\0')
3002 as_fatal (_("Intel K1OM is 64bit ELF only"));
3003 return bfd_mach_k1om;
3004 }
3005 else if (default_arch[6] == '\0')
3006 return bfd_mach_x86_64;
3007 else
3008 return bfd_mach_x64_32;
3009 }
3010 else if (!strcmp (default_arch, "i386")
3011 || !strcmp (default_arch, "iamcu"))
3012 {
3013 if (cpu_arch_isa == PROCESSOR_IAMCU)
3014 {
3015 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
3016 as_fatal (_("Intel MCU is 32bit ELF only"));
3017 return bfd_mach_i386_iamcu;
3018 }
3019 else
3020 return bfd_mach_i386_i386;
3021 }
3022 else
3023 as_fatal (_("unknown architecture"));
3024 }
3025 \f
3026 void
3027 md_begin (void)
3028 {
3029 /* Support pseudo prefixes like {disp32}. */
3030 lex_type ['{'] = LEX_BEGIN_NAME;
3031
3032 /* Initialize op_hash hash table. */
3033 op_hash = str_htab_create ();
3034
3035 {
3036 const insn_template *optab;
3037 templates *core_optab;
3038
3039 /* Setup for loop. */
3040 optab = i386_optab;
3041 core_optab = XNEW (templates);
3042 core_optab->start = optab;
3043
3044 while (1)
3045 {
3046 ++optab;
3047 if (optab->name == NULL
3048 || strcmp (optab->name, (optab - 1)->name) != 0)
3049 {
3050 /* different name --> ship out current template list;
3051 add to hash table; & begin anew. */
3052 core_optab->end = optab;
3053 if (str_hash_insert (op_hash, (optab - 1)->name, core_optab, 0))
3054 as_fatal (_("duplicate %s"), (optab - 1)->name);
3055
3056 if (optab->name == NULL)
3057 break;
3058 core_optab = XNEW (templates);
3059 core_optab->start = optab;
3060 }
3061 }
3062 }
3063
3064 /* Initialize reg_hash hash table. */
3065 reg_hash = str_htab_create ();
3066 {
3067 const reg_entry *regtab;
3068 unsigned int regtab_size = i386_regtab_size;
3069
3070 for (regtab = i386_regtab; regtab_size--; regtab++)
3071 if (str_hash_insert (reg_hash, regtab->reg_name, regtab, 0) != NULL)
3072 as_fatal (_("duplicate %s"), regtab->reg_name);
3073 }
3074
3075 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
3076 {
3077 int c;
3078 char *p;
3079
3080 for (c = 0; c < 256; c++)
3081 {
3082 if (ISDIGIT (c))
3083 {
3084 digit_chars[c] = c;
3085 mnemonic_chars[c] = c;
3086 register_chars[c] = c;
3087 operand_chars[c] = c;
3088 }
3089 else if (ISLOWER (c))
3090 {
3091 mnemonic_chars[c] = c;
3092 register_chars[c] = c;
3093 operand_chars[c] = c;
3094 }
3095 else if (ISUPPER (c))
3096 {
3097 mnemonic_chars[c] = TOLOWER (c);
3098 register_chars[c] = mnemonic_chars[c];
3099 operand_chars[c] = c;
3100 }
3101 else if (c == '{' || c == '}')
3102 {
3103 mnemonic_chars[c] = c;
3104 operand_chars[c] = c;
3105 }
3106 #ifdef SVR4_COMMENT_CHARS
3107 else if (c == '\\' && strchr (i386_comment_chars, '/'))
3108 operand_chars[c] = c;
3109 #endif
3110
3111 if (ISALPHA (c) || ISDIGIT (c))
3112 identifier_chars[c] = c;
3113 else if (c >= 128)
3114 {
3115 identifier_chars[c] = c;
3116 operand_chars[c] = c;
3117 }
3118 }
3119
3120 #ifdef LEX_AT
3121 identifier_chars['@'] = '@';
3122 #endif
3123 #ifdef LEX_QM
3124 identifier_chars['?'] = '?';
3125 operand_chars['?'] = '?';
3126 #endif
3127 digit_chars['-'] = '-';
3128 mnemonic_chars['_'] = '_';
3129 mnemonic_chars['-'] = '-';
3130 mnemonic_chars['.'] = '.';
3131 identifier_chars['_'] = '_';
3132 identifier_chars['.'] = '.';
3133
3134 for (p = operand_special_chars; *p != '\0'; p++)
3135 operand_chars[(unsigned char) *p] = *p;
3136 }
3137
3138 if (flag_code == CODE_64BIT)
3139 {
3140 #if defined (OBJ_COFF) && defined (TE_PE)
3141 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3142 ? 32 : 16);
3143 #else
3144 x86_dwarf2_return_column = 16;
3145 #endif
3146 x86_cie_data_alignment = -8;
3147 }
3148 else
3149 {
3150 x86_dwarf2_return_column = 8;
3151 x86_cie_data_alignment = -4;
3152 }
3153
3154 /* NB: FUSED_JCC_PADDING frag must have sufficient room so that it
3155 can be turned into a BRANCH_PREFIX frag. */
3156 if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3157 abort ();
3158 }
3159
3160 void
3161 i386_print_statistics (FILE *file)
3162 {
3163 htab_print_statistics (file, "i386 opcode", op_hash);
3164 htab_print_statistics (file, "i386 register", reg_hash);
3165 }
3166 \f
3167 #ifdef DEBUG386
3168
3169 /* Debugging routines for md_assemble. */
3170 static void pte (insn_template *);
3171 static void pt (i386_operand_type);
3172 static void pe (expressionS *);
3173 static void ps (symbolS *);
3174
3175 static void
3176 pi (const char *line, i386_insn *x)
3177 {
3178 unsigned int j;
3179
3180 fprintf (stdout, "%s: template ", line);
3181 pte (&x->tm);
3182 fprintf (stdout, " address: base %s index %s scale %x\n",
3183 x->base_reg ? x->base_reg->reg_name : "none",
3184 x->index_reg ? x->index_reg->reg_name : "none",
3185 x->log2_scale_factor);
3186 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
3187 x->rm.mode, x->rm.reg, x->rm.regmem);
3188 fprintf (stdout, " sib: base %x index %x scale %x\n",
3189 x->sib.base, x->sib.index, x->sib.scale);
3190 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
3191 (x->rex & REX_W) != 0,
3192 (x->rex & REX_R) != 0,
3193 (x->rex & REX_X) != 0,
3194 (x->rex & REX_B) != 0);
3195 for (j = 0; j < x->operands; j++)
3196 {
3197 fprintf (stdout, " #%d: ", j + 1);
3198 pt (x->types[j]);
3199 fprintf (stdout, "\n");
3200 if (x->types[j].bitfield.class == Reg
3201 || x->types[j].bitfield.class == RegMMX
3202 || x->types[j].bitfield.class == RegSIMD
3203 || x->types[j].bitfield.class == RegMask
3204 || x->types[j].bitfield.class == SReg
3205 || x->types[j].bitfield.class == RegCR
3206 || x->types[j].bitfield.class == RegDR
3207 || x->types[j].bitfield.class == RegTR
3208 || x->types[j].bitfield.class == RegBND)
3209 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3210 if (operand_type_check (x->types[j], imm))
3211 pe (x->op[j].imms);
3212 if (operand_type_check (x->types[j], disp))
3213 pe (x->op[j].disps);
3214 }
3215 }
3216
3217 static void
3218 pte (insn_template *t)
3219 {
3220 unsigned int j;
3221 fprintf (stdout, " %d operands ", t->operands);
3222 fprintf (stdout, "opcode %x ", t->base_opcode);
3223 if (t->extension_opcode != None)
3224 fprintf (stdout, "ext %x ", t->extension_opcode);
3225 if (t->opcode_modifier.d)
3226 fprintf (stdout, "D");
3227 if (t->opcode_modifier.w)
3228 fprintf (stdout, "W");
3229 fprintf (stdout, "\n");
3230 for (j = 0; j < t->operands; j++)
3231 {
3232 fprintf (stdout, " #%d type ", j + 1);
3233 pt (t->operand_types[j]);
3234 fprintf (stdout, "\n");
3235 }
3236 }
3237
3238 static void
3239 pe (expressionS *e)
3240 {
3241 fprintf (stdout, " operation %d\n", e->X_op);
3242 fprintf (stdout, " add_number %ld (%lx)\n",
3243 (long) e->X_add_number, (long) e->X_add_number);
3244 if (e->X_add_symbol)
3245 {
3246 fprintf (stdout, " add_symbol ");
3247 ps (e->X_add_symbol);
3248 fprintf (stdout, "\n");
3249 }
3250 if (e->X_op_symbol)
3251 {
3252 fprintf (stdout, " op_symbol ");
3253 ps (e->X_op_symbol);
3254 fprintf (stdout, "\n");
3255 }
3256 }
3257
3258 static void
3259 ps (symbolS *s)
3260 {
3261 fprintf (stdout, "%s type %s%s",
3262 S_GET_NAME (s),
3263 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3264 segment_name (S_GET_SEGMENT (s)));
3265 }
3266
3267 static struct type_name
3268 {
3269 i386_operand_type mask;
3270 const char *name;
3271 }
3272 const type_names[] =
3273 {
3274 { OPERAND_TYPE_REG8, "r8" },
3275 { OPERAND_TYPE_REG16, "r16" },
3276 { OPERAND_TYPE_REG32, "r32" },
3277 { OPERAND_TYPE_REG64, "r64" },
3278 { OPERAND_TYPE_ACC8, "acc8" },
3279 { OPERAND_TYPE_ACC16, "acc16" },
3280 { OPERAND_TYPE_ACC32, "acc32" },
3281 { OPERAND_TYPE_ACC64, "acc64" },
3282 { OPERAND_TYPE_IMM8, "i8" },
3283 { OPERAND_TYPE_IMM8S, "i8s" },
3284 { OPERAND_TYPE_IMM16, "i16" },
3285 { OPERAND_TYPE_IMM32, "i32" },
3286 { OPERAND_TYPE_IMM32S, "i32s" },
3287 { OPERAND_TYPE_IMM64, "i64" },
3288 { OPERAND_TYPE_IMM1, "i1" },
3289 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3290 { OPERAND_TYPE_DISP8, "d8" },
3291 { OPERAND_TYPE_DISP16, "d16" },
3292 { OPERAND_TYPE_DISP32, "d32" },
3293 { OPERAND_TYPE_DISP32S, "d32s" },
3294 { OPERAND_TYPE_DISP64, "d64" },
3295 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3296 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3297 { OPERAND_TYPE_CONTROL, "control reg" },
3298 { OPERAND_TYPE_TEST, "test reg" },
3299 { OPERAND_TYPE_DEBUG, "debug reg" },
3300 { OPERAND_TYPE_FLOATREG, "FReg" },
3301 { OPERAND_TYPE_FLOATACC, "FAcc" },
3302 { OPERAND_TYPE_SREG, "SReg" },
3303 { OPERAND_TYPE_REGMMX, "rMMX" },
3304 { OPERAND_TYPE_REGXMM, "rXMM" },
3305 { OPERAND_TYPE_REGYMM, "rYMM" },
3306 { OPERAND_TYPE_REGZMM, "rZMM" },
3307 { OPERAND_TYPE_REGTMM, "rTMM" },
3308 { OPERAND_TYPE_REGMASK, "Mask reg" },
3309 };
3310
3311 static void
3312 pt (i386_operand_type t)
3313 {
3314 unsigned int j;
3315 i386_operand_type a;
3316
3317 for (j = 0; j < ARRAY_SIZE (type_names); j++)
3318 {
3319 a = operand_type_and (t, type_names[j].mask);
3320 if (operand_type_equal (&a, &type_names[j].mask))
3321 fprintf (stdout, "%s, ", type_names[j].name);
3322 }
3323 fflush (stdout);
3324 }
3325
3326 #endif /* DEBUG386 */
3327 \f
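/* Map a fixup to a BFD relocation code. SIZE is the field width in
bytes, PCREL and SIGN describe the field, and OTHER, when not
NO_RELOC, is a specific relocation requested by an operand suffix;
it is validated (and widened for 8-byte fields) before use. */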
3328 static bfd_reloc_code_real_type
3329 reloc (unsigned int size,
3330 int pcrel,
3331 int sign,
3332 bfd_reloc_code_real_type other)
3333 {
3334 if (other != NO_RELOC)
3335 {
3336 reloc_howto_type *rel;
3337
3338 if (size == 8)
3339 switch (other)
3340 {
3341 case BFD_RELOC_X86_64_GOT32:
3342 return BFD_RELOC_X86_64_GOT64;
3344 case BFD_RELOC_X86_64_GOTPLT64:
3345 return BFD_RELOC_X86_64_GOTPLT64;
3347 case BFD_RELOC_X86_64_PLTOFF64:
3348 return BFD_RELOC_X86_64_PLTOFF64;
3350 case BFD_RELOC_X86_64_GOTPC32:
3351 other = BFD_RELOC_X86_64_GOTPC64;
3352 break;
3353 case BFD_RELOC_X86_64_GOTPCREL:
3354 other = BFD_RELOC_X86_64_GOTPCREL64;
3355 break;
3356 case BFD_RELOC_X86_64_TPOFF32:
3357 other = BFD_RELOC_X86_64_TPOFF64;
3358 break;
3359 case BFD_RELOC_X86_64_DTPOFF32:
3360 other = BFD_RELOC_X86_64_DTPOFF64;
3361 break;
3362 default:
3363 break;
3364 }
3365
3366 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3367 if (other == BFD_RELOC_SIZE32)
3368 {
3369 if (size == 8)
3370 other = BFD_RELOC_SIZE64;
3371 if (pcrel)
3372 {
3373 as_bad (_("there are no pc-relative size relocations"));
3374 return NO_RELOC;
3375 }
3376 }
3377 #endif
3378
3379 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
3380 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3381 sign = -1;
3382
3383 rel = bfd_reloc_type_lookup (stdoutput, other);
3384 if (!rel)
3385 as_bad (_("unknown relocation (%u)"), other);
3386 else if (size != bfd_get_reloc_size (rel))
3387 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3388 bfd_get_reloc_size (rel),
3389 size);
3390 else if (pcrel && !rel->pc_relative)
3391 as_bad (_("non-pc-relative relocation for pc-relative field"));
3392 else if ((rel->complain_on_overflow == complain_overflow_signed
3393 && !sign)
3394 || (rel->complain_on_overflow == complain_overflow_unsigned
3395 && sign > 0))
3396 as_bad (_("relocated field and relocation type differ in signedness"));
3397 else
3398 return other;
3399 return NO_RELOC;
3400 }
3401
3402 if (pcrel)
3403 {
3404 if (!sign)
3405 as_bad (_("there are no unsigned pc-relative relocations"));
3406 switch (size)
3407 {
3408 case 1: return BFD_RELOC_8_PCREL;
3409 case 2: return BFD_RELOC_16_PCREL;
3410 case 4: return BFD_RELOC_32_PCREL;
3411 case 8: return BFD_RELOC_64_PCREL;
3412 }
3413 as_bad (_("cannot do %u byte pc-relative relocation"), size);
3414 }
3415 else
3416 {
3417 if (sign > 0)
3418 switch (size)
3419 {
3420 case 4: return BFD_RELOC_X86_64_32S;
3421 }
3422 else
3423 switch (size)
3424 {
3425 case 1: return BFD_RELOC_8;
3426 case 2: return BFD_RELOC_16;
3427 case 4: return BFD_RELOC_32;
3428 case 8: return BFD_RELOC_64;
3429 }
3430 as_bad (_("cannot do %s %u byte relocation"),
3431 sign > 0 ? "signed" : "unsigned", size);
3432 }
3433
3434 return NO_RELOC;
3435 }
3436
3437 /* Here we decide which fixups can be adjusted to make them relative to
3438 the beginning of the section instead of the symbol. Basically we need
3439 to make sure that the dynamic relocations are done correctly, so in
3440 some cases we force the original symbol to be used. */
3441
3442 int
3443 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3444 {
3445 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3446 if (!IS_ELF)
3447 return 1;
3448
3449 /* Don't adjust pc-relative references to merge sections in 64-bit
3450 mode. */
3451 if (use_rela_relocations
3452 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3453 && fixP->fx_pcrel)
3454 return 0;
3455
3456 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3457 and changed later by validate_fix. */
3458 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3459 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3460 return 0;
3461
3462 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
3463 for size relocations. */
3464 if (fixP->fx_r_type == BFD_RELOC_SIZE32
3465 || fixP->fx_r_type == BFD_RELOC_SIZE64
3466 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3467 || fixP->fx_r_type == BFD_RELOC_386_GOT32
3468 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3469 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3470 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3471 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3472 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3473 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3474 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3475 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3476 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3477 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3478 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3479 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3480 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3481 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3482 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3483 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3484 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3485 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3486 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3487 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3488 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3489 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3490 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3491 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3492 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3493 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3494 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3495 return 0;
3496 #endif
3497 return 1;
3498 }
3499
3500 static int
3501 intel_float_operand (const char *mnemonic)
3502 {
3503 /* Note that the value returned is meaningful only for opcodes with (memory)
3504 operands, hence the code here is free to improperly handle opcodes that
3505 have no operands (for better performance and smaller code). */
3506
3507 if (mnemonic[0] != 'f')
3508 return 0; /* non-math */
3509
3510 switch (mnemonic[1])
3511 {
3512 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3513 the fs segment override prefix are not handled here, because no
3514 call path can reach this point for opcodes without operands. */
3515 case 'i':
3516 return 2 /* integer op */;
3517 case 'l':
3518 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3519 return 3; /* fldcw/fldenv */
3520 break;
3521 case 'n':
3522 if (mnemonic[2] != 'o' /* fnop */)
3523 return 3; /* non-waiting control op */
3524 break;
3525 case 'r':
3526 if (mnemonic[2] == 's')
3527 return 3; /* frstor/frstpm */
3528 break;
3529 case 's':
3530 if (mnemonic[2] == 'a')
3531 return 3; /* fsave */
3532 if (mnemonic[2] == 't')
3533 {
3534 switch (mnemonic[3])
3535 {
3536 case 'c': /* fstcw */
3537 case 'd': /* fstdw */
3538 case 'e': /* fstenv */
3539 case 's': /* fsts[gw] */
3540 return 3;
3541 }
3542 }
3543 break;
3544 case 'x':
3545 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3546 return 0; /* fxsave/fxrstor are not really math ops */
3547 break;
3548 }
3549
3550 return 1;
3551 }
3552
3553 /* Build the VEX prefix. */
3554
3555 static void
3556 build_vex_prefix (const insn_template *t)
3557 {
3558 unsigned int register_specifier;
3559 unsigned int implied_prefix;
3560 unsigned int vector_length;
3561 unsigned int w;
3562
3563 /* Check register specifier. */
3564 if (i.vex.register_specifier)
3565 {
3566 register_specifier =
3567 ~register_number (i.vex.register_specifier) & 0xf;
3568 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3569 }
3570 else
3571 register_specifier = 0xf;
3572
3573 /* Use the 2-byte VEX prefix by swapping the destination and source
3574 operands when there is more than one register operand. */
3575 if (i.reg_operands > 1
3576 && i.vec_encoding != vex_encoding_vex3
3577 && i.dir_encoding == dir_encoding_default
3578 && i.operands == i.reg_operands
3579 && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3580 && i.tm.opcode_modifier.vexopcode == VEX0F
3581 && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3582 && i.rex == REX_B)
3583 {
3584 unsigned int xchg = i.operands - 1;
3585 union i386_op temp_op;
3586 i386_operand_type temp_type;
3587
3588 temp_type = i.types[xchg];
3589 i.types[xchg] = i.types[0];
3590 i.types[0] = temp_type;
3591 temp_op = i.op[xchg];
3592 i.op[xchg] = i.op[0];
3593 i.op[0] = temp_op;
3594
3595 gas_assert (i.rm.mode == 3);
3596
3597 i.rex = REX_R;
3598 xchg = i.rm.regmem;
3599 i.rm.regmem = i.rm.reg;
3600 i.rm.reg = xchg;
3601
3602 if (i.tm.opcode_modifier.d)
3603 i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3604 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3605 else /* Use the next insn. */
3606 i.tm = t[1];
3607 }
3608
3609 /* Use 2-byte VEX prefix by swapping commutative source operands if there
3610 are no memory operands and at least 3 register ones. */
3611 if (i.reg_operands >= 3
3612 && i.vec_encoding != vex_encoding_vex3
3613 && i.reg_operands == i.operands - i.imm_operands
3614 && i.tm.opcode_modifier.vex
3615 && i.tm.opcode_modifier.commutative
3616 && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3617 && i.rex == REX_B
3618 && i.vex.register_specifier
3619 && !(i.vex.register_specifier->reg_flags & RegRex))
3620 {
3621 unsigned int xchg = i.operands - i.reg_operands;
3622 union i386_op temp_op;
3623 i386_operand_type temp_type;
3624
3625 gas_assert (i.tm.opcode_modifier.vexopcode == VEX0F);
3626 gas_assert (!i.tm.opcode_modifier.sae);
3627 gas_assert (operand_type_equal (&i.types[i.operands - 2],
3628 &i.types[i.operands - 3]));
3629 gas_assert (i.rm.mode == 3);
3630
3631 temp_type = i.types[xchg];
3632 i.types[xchg] = i.types[xchg + 1];
3633 i.types[xchg + 1] = temp_type;
3634 temp_op = i.op[xchg];
3635 i.op[xchg] = i.op[xchg + 1];
3636 i.op[xchg + 1] = temp_op;
3637
3638 i.rex = 0;
3639 xchg = i.rm.regmem | 8;
3640 i.rm.regmem = ~register_specifier & 0xf;
3641 gas_assert (!(i.rm.regmem & 8));
3642 i.vex.register_specifier += xchg - i.rm.regmem;
3643 register_specifier = ~xchg & 0xf;
3644 }
3645
3646 if (i.tm.opcode_modifier.vex == VEXScalar)
3647 vector_length = avxscalar;
3648 else if (i.tm.opcode_modifier.vex == VEX256)
3649 vector_length = 1;
3650 else
3651 {
3652 unsigned int op;
3653
3654 /* Determine vector length from the last multi-length vector
3655 operand. */
3656 vector_length = 0;
3657 for (op = t->operands; op--;)
3658 if (t->operand_types[op].bitfield.xmmword
3659 && t->operand_types[op].bitfield.ymmword
3660 && i.types[op].bitfield.ymmword)
3661 {
3662 vector_length = 1;
3663 break;
3664 }
3665 }
3666
3667 switch ((i.tm.base_opcode >> (i.tm.opcode_length << 3)) & 0xff)
3668 {
3669 case 0:
3670 implied_prefix = 0;
3671 break;
3672 case DATA_PREFIX_OPCODE:
3673 implied_prefix = 1;
3674 break;
3675 case REPE_PREFIX_OPCODE:
3676 implied_prefix = 2;
3677 break;
3678 case REPNE_PREFIX_OPCODE:
3679 implied_prefix = 3;
3680 break;
3681 default:
3682 abort ();
3683 }
3684
3685 /* Check the REX.W bit and VEXW. */
3686 if (i.tm.opcode_modifier.vexw == VEXWIG)
3687 w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3688 else if (i.tm.opcode_modifier.vexw)
3689 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3690 else
3691 w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3692
3693 /* Use 2-byte VEX prefix if possible. */
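/* The 2-byte form 0xc5 carries only ~R, vvvv, L, and pp, with the
opcode map fixed at 0F and X, B, and W implied zero, hence the
REX bit restrictions checked below. */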
3694 if (w == 0
3695 && i.vec_encoding != vex_encoding_vex3
3696 && i.tm.opcode_modifier.vexopcode == VEX0F
3697 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3698 {
3699 /* 2-byte VEX prefix. */
3700 unsigned int r;
3701
3702 i.vex.length = 2;
3703 i.vex.bytes[0] = 0xc5;
3704
3705 /* Check the REX.R bit. */
3706 r = (i.rex & REX_R) ? 0 : 1;
3707 i.vex.bytes[1] = (r << 7
3708 | register_specifier << 3
3709 | vector_length << 2
3710 | implied_prefix);
3711 }
3712 else
3713 {
3714 /* 3-byte VEX prefix. */
3715 unsigned int m;
3716
3717 i.vex.length = 3;
3718
3719 switch (i.tm.opcode_modifier.vexopcode)
3720 {
3721 case VEX0F:
3722 m = 0x1;
3723 i.vex.bytes[0] = 0xc4;
3724 break;
3725 case VEX0F38:
3726 m = 0x2;
3727 i.vex.bytes[0] = 0xc4;
3728 break;
3729 case VEX0F3A:
3730 m = 0x3;
3731 i.vex.bytes[0] = 0xc4;
3732 break;
3733 case XOP08:
3734 m = 0x8;
3735 i.vex.bytes[0] = 0x8f;
3736 break;
3737 case XOP09:
3738 m = 0x9;
3739 i.vex.bytes[0] = 0x8f;
3740 break;
3741 case XOP0A:
3742 m = 0xa;
3743 i.vex.bytes[0] = 0x8f;
3744 break;
3745 default:
3746 abort ();
3747 }
3748
3749 /* The high 3 bits of the second VEX byte are the one's complement
3750 of the RXB bits from REX. */
3751 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3752
3753 i.vex.bytes[2] = (w << 7
3754 | register_specifier << 3
3755 | vector_length << 2
3756 | implied_prefix);
3757 }
3758 }
3759
3760 static INLINE bfd_boolean
3761 is_evex_encoding (const insn_template *t)
3762 {
3763 return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3764 || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3765 || t->opcode_modifier.sae;
3766 }
3767
3768 static INLINE bfd_boolean
3769 is_any_vex_encoding (const insn_template *t)
3770 {
3771 return t->opcode_modifier.vex || t->opcode_modifier.vexopcode
3772 || is_evex_encoding (t);
3773 }
3774
3775 /* Build the EVEX prefix. */
3776
3777 static void
3778 build_evex_prefix (void)
3779 {
3780 unsigned int register_specifier;
3781 unsigned int implied_prefix;
3782 unsigned int m, w;
3783 rex_byte vrex_used = 0;
3784
3785 /* Check register specifier. */
3786 if (i.vex.register_specifier)
3787 {
3788 gas_assert ((i.vrex & REX_X) == 0);
3789
3790 register_specifier = i.vex.register_specifier->reg_num;
3791 if ((i.vex.register_specifier->reg_flags & RegRex))
3792 register_specifier += 8;
3793 /* The upper 16 registers are encoded in the fourth byte of the
3794 EVEX prefix. */
3795 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3796 i.vex.bytes[3] = 0x8;
3797 register_specifier = ~register_specifier & 0xf;
3798 }
3799 else
3800 {
3801 register_specifier = 0xf;
3802
3803 /* Encode upper 16 vector index register in the fourth byte of
3804 the EVEX prefix. */
3805 if (!(i.vrex & REX_X))
3806 i.vex.bytes[3] = 0x8;
3807 else
3808 vrex_used |= REX_X;
3809 }
3810
3811 switch ((i.tm.base_opcode >> 8) & 0xff)
3812 {
3813 case 0:
3814 implied_prefix = 0;
3815 break;
3816 case DATA_PREFIX_OPCODE:
3817 implied_prefix = 1;
3818 break;
3819 case REPE_PREFIX_OPCODE:
3820 implied_prefix = 2;
3821 break;
3822 case REPNE_PREFIX_OPCODE:
3823 implied_prefix = 3;
3824 break;
3825 default:
3826 abort ();
3827 }
3828
3829 /* 4 byte EVEX prefix. */
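/* Byte layout: 0x62, then P0 = ~R ~X ~B ~R' 0 0 m m, P1 = W vvvv U pp,
P2 = z L'L b ~V' aaa, assembled piecemeal below. */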
3830 i.vex.length = 4;
3831 i.vex.bytes[0] = 0x62;
3832
3833 /* mmmm bits. */
3834 switch (i.tm.opcode_modifier.vexopcode)
3835 {
3836 case VEX0F:
3837 m = 1;
3838 break;
3839 case VEX0F38:
3840 m = 2;
3841 break;
3842 case VEX0F3A:
3843 m = 3;
3844 break;
3845 default:
3846 abort ();
3847 break;
3848 }
3849
3850 /* The high 3 bits of the second EVEX byte are the one's complement
3851 of the RXB bits from REX. */
3852 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3853
3854 /* The fifth bit of the second EVEX byte is the one's complement of
3855 the REX_R bit in VREX. */
3856 if (!(i.vrex & REX_R))
3857 i.vex.bytes[1] |= 0x10;
3858 else
3859 vrex_used |= REX_R;
3860
3861 if ((i.reg_operands + i.imm_operands) == i.operands)
3862 {
3863 /* When all operands are registers, the REX_X bit in REX is not
3864 used. We reuse it to encode the upper 16 registers, which is
3865 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3866 as its one's complement. */
3867 if ((i.vrex & REX_B))
3868 {
3869 vrex_used |= REX_B;
3870 i.vex.bytes[1] &= ~0x40;
3871 }
3872 }
3873
3874 /* EVEX instructions shouldn't need the REX prefix. */
3875 i.vrex &= ~vrex_used;
3876 gas_assert (i.vrex == 0);
3877
3878 /* Check the REX.W bit and VEXW. */
3879 if (i.tm.opcode_modifier.vexw == VEXWIG)
3880 w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3881 else if (i.tm.opcode_modifier.vexw)
3882 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3883 else
3884 w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3885
3886 /* Encode the U bit. */
3887 implied_prefix |= 0x4;
3888
3889 /* The third byte of the EVEX prefix. */
3890 i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3891
3892 /* The fourth byte of the EVEX prefix. */
3893 /* The zeroing-masking bit. */
3894 if (i.mask && i.mask->zeroing)
3895 i.vex.bytes[3] |= 0x80;
3896
3897 /* Encode the vector length and broadcast bit only when there is no RC; with RC, EVEX.b and L'L encode the rounding mode instead. */
3898 if (!i.rounding)
3899 {
3900 /* Encode the vector length. */
3901 unsigned int vec_length;
3902
3903 if (!i.tm.opcode_modifier.evex
3904 || i.tm.opcode_modifier.evex == EVEXDYN)
3905 {
3906 unsigned int op;
3907
3908 /* Determine vector length from the last multi-length vector
3909 operand. */
3910 for (op = i.operands; op--;)
3911 if (i.tm.operand_types[op].bitfield.xmmword
3912 + i.tm.operand_types[op].bitfield.ymmword
3913 + i.tm.operand_types[op].bitfield.zmmword > 1)
3914 {
3915 if (i.types[op].bitfield.zmmword)
3916 {
3917 i.tm.opcode_modifier.evex = EVEX512;
3918 break;
3919 }
3920 else if (i.types[op].bitfield.ymmword)
3921 {
3922 i.tm.opcode_modifier.evex = EVEX256;
3923 break;
3924 }
3925 else if (i.types[op].bitfield.xmmword)
3926 {
3927 i.tm.opcode_modifier.evex = EVEX128;
3928 break;
3929 }
3930 else if (i.broadcast && (int) op == i.broadcast->operand)
3931 {
3932 switch (i.broadcast->bytes)
3933 {
3934 case 64:
3935 i.tm.opcode_modifier.evex = EVEX512;
3936 break;
3937 case 32:
3938 i.tm.opcode_modifier.evex = EVEX256;
3939 break;
3940 case 16:
3941 i.tm.opcode_modifier.evex = EVEX128;
3942 break;
3943 default:
3944 abort ();
3945 }
3946 break;
3947 }
3948 }
3949
3950 if (op >= MAX_OPERANDS)
3951 abort ();
3952 }
3953
3954 switch (i.tm.opcode_modifier.evex)
3955 {
3956 case EVEXLIG: /* LL' is ignored */
3957 vec_length = evexlig << 5;
3958 break;
3959 case EVEX128:
3960 vec_length = 0 << 5;
3961 break;
3962 case EVEX256:
3963 vec_length = 1 << 5;
3964 break;
3965 case EVEX512:
3966 vec_length = 2 << 5;
3967 break;
3968 default:
3969 abort ();
3970 break;
3971 }
3972 i.vex.bytes[3] |= vec_length;
3973 /* Encode the broadcast bit. */
3974 if (i.broadcast)
3975 i.vex.bytes[3] |= 0x10;
3976 }
3977 else
3978 {
3979 if (i.rounding->type != saeonly)
3980 i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3981 else
3982 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3983 }
3984
3985 if (i.mask && i.mask->mask)
3986 i.vex.bytes[3] |= i.mask->mask->reg_num;
3987 }
3988
3989 static void
3990 process_immext (void)
3991 {
3992 expressionS *exp;
3993
3994 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3995 which is coded in the same place as an 8-bit immediate field
3996 would be. Here we fake an 8-bit immediate operand from the
3997 opcode suffix stored in tm.extension_opcode.
3998
3999 AVX instructions also use this encoding for some
4000 3-argument instructions. */
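/* An editorial example: the 3DNow! insn `pfadd %mm1, %mm0' is encoded
   as 0F 0F /r with opcode suffix 0x9E, i.e. 0F 0F C1 9E; the 0x9E
   suffix byte is emitted through the fake imm8 operand set up here.  */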
4001
4002 gas_assert (i.imm_operands <= 1
4003 && (i.operands <= 2
4004 || (is_any_vex_encoding (&i.tm)
4005 && i.operands <= 4)));
4006
4007 exp = &im_expressions[i.imm_operands++];
4008 i.op[i.operands].imms = exp;
4009 i.types[i.operands] = imm8;
4010 i.operands++;
4011 exp->X_op = O_constant;
4012 exp->X_add_number = i.tm.extension_opcode;
4013 i.tm.extension_opcode = None;
4014 }
4015
4016
4017 static int
4018 check_hle (void)
4019 {
4020 switch (i.tm.opcode_modifier.hleprefixok)
4021 {
4022 default:
4023 abort ();
4024 case HLEPrefixNone:
4025 as_bad (_("invalid instruction `%s' after `%s'"),
4026 i.tm.name, i.hle_prefix);
4027 return 0;
4028 case HLEPrefixLock:
4029 if (i.prefix[LOCK_PREFIX])
4030 return 1;
4031 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
4032 return 0;
4033 case HLEPrefixAny:
4034 return 1;
4035 case HLEPrefixRelease:
4036 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
4037 {
4038 as_bad (_("instruction `%s' after `xacquire' not allowed"),
4039 i.tm.name);
4040 return 0;
4041 }
4042 if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
4043 {
4044 as_bad (_("memory destination needed for instruction `%s'"
4045 " after `xrelease'"), i.tm.name);
4046 return 0;
4047 }
4048 return 1;
4049 }
4050 }
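/* Editorial illustration of the checks above: `xacquire lock incl
   (%rax)' is accepted (HLEPrefixLock with a lock prefix), while plain
   `xacquire incl (%rax)' is rejected for the missing `lock'.
   `xrelease movl $0, (%rax)' is accepted without `lock' because the
   mov store takes HLEPrefixRelease, provided the destination is a
   memory operand.  */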
4051
4052 /* Try the shortest encoding by shortening operand size. */
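/* An editorial example of the -Os case below: the 6-byte
   `testl $0x7, %ecx' (F7 C1 07 00 00 00) becomes the 3-byte
   `testb $0x7, %cl' (F6 C1 07); flags are the same since only the
   low 7 bits of the immediate are set.  */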
4053
4054 static void
4055 optimize_encoding (void)
4056 {
4057 unsigned int j;
4058
4059 if (optimize_for_space
4060 && !is_any_vex_encoding (&i.tm)
4061 && i.reg_operands == 1
4062 && i.imm_operands == 1
4063 && !i.types[1].bitfield.byte
4064 && i.op[0].imms->X_op == O_constant
4065 && fits_in_imm7 (i.op[0].imms->X_add_number)
4066 && (i.tm.base_opcode == 0xa8
4067 || (i.tm.base_opcode == 0xf6
4068 && i.tm.extension_opcode == 0x0)))
4069 {
4070 /* Optimize: -Os:
4071 test $imm7, %r64/%r32/%r16 -> test $imm7, %r8
4072 */
4073 unsigned int base_regnum = i.op[1].regs->reg_num;
4074 if (flag_code == CODE_64BIT || base_regnum < 4)
4075 {
4076 i.types[1].bitfield.byte = 1;
4077 /* Ignore the suffix. */
4078 i.suffix = 0;
4079 /* Convert to byte registers. */
4080 if (i.types[1].bitfield.word)
4081 j = 16;
4082 else if (i.types[1].bitfield.dword)
4083 j = 32;
4084 else
4085 j = 48;
4086 if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4087 j += 8;
4088 i.op[1].regs -= j;
4089 }
4090 }
4091 else if (flag_code == CODE_64BIT
4092 && !is_any_vex_encoding (&i.tm)
4093 && ((i.types[1].bitfield.qword
4094 && i.reg_operands == 1
4095 && i.imm_operands == 1
4096 && i.op[0].imms->X_op == O_constant
4097 && ((i.tm.base_opcode == 0xb8
4098 && i.tm.extension_opcode == None
4099 && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4100 || (fits_in_imm31 (i.op[0].imms->X_add_number)
4101 && ((i.tm.base_opcode == 0x24
4102 || i.tm.base_opcode == 0xa8)
4103 || (i.tm.base_opcode == 0x80
4104 && i.tm.extension_opcode == 0x4)
4105 || ((i.tm.base_opcode == 0xf6
4106 || (i.tm.base_opcode | 1) == 0xc7)
4107 && i.tm.extension_opcode == 0x0)))
4108 || (fits_in_imm7 (i.op[0].imms->X_add_number)
4109 && i.tm.base_opcode == 0x83
4110 && i.tm.extension_opcode == 0x4)))
4111 || (i.types[0].bitfield.qword
4112 && ((i.reg_operands == 2
4113 && i.op[0].regs == i.op[1].regs
4114 && (i.tm.base_opcode == 0x30
4115 || i.tm.base_opcode == 0x28))
4116 || (i.reg_operands == 1
4117 && i.operands == 1
4118 && i.tm.base_opcode == 0x30)))))
4119 {
4120 /* Optimize: -O:
4121 andq $imm31, %r64 -> andl $imm31, %r32
4122 andq $imm7, %r64 -> andl $imm7, %r32
4123 testq $imm31, %r64 -> testl $imm31, %r32
4124 xorq %r64, %r64 -> xorl %r32, %r32
4125 subq %r64, %r64 -> subl %r32, %r32
4126 movq $imm31, %r64 -> movl $imm31, %r32
4127 movq $imm32, %r64 -> movl $imm32, %r32
4128 */
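/* A concrete editorial example: `movq $1, %rax' needs REX.W
   (48 C7 C0 01 00 00 00, 7 bytes), while `movl $1, %eax'
   (B8 01 00 00 00, 5 bytes) writes the same value because a 32-bit
   write zero-extends into the full 64-bit register.  */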
4129 i.tm.opcode_modifier.norex64 = 1;
4130 if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
4131 {
4132 /* Handle
4133 movq $imm31, %r64 -> movl $imm31, %r32
4134 movq $imm32, %r64 -> movl $imm32, %r32
4135 */
4136 i.tm.operand_types[0].bitfield.imm32 = 1;
4137 i.tm.operand_types[0].bitfield.imm32s = 0;
4138 i.tm.operand_types[0].bitfield.imm64 = 0;
4139 i.types[0].bitfield.imm32 = 1;
4140 i.types[0].bitfield.imm32s = 0;
4141 i.types[0].bitfield.imm64 = 0;
4142 i.types[1].bitfield.dword = 1;
4143 i.types[1].bitfield.qword = 0;
4144 if ((i.tm.base_opcode | 1) == 0xc7)
4145 {
4146 /* Handle
4147 movq $imm31, %r64 -> movl $imm31, %r32
4148 */
4149 i.tm.base_opcode = 0xb8;
4150 i.tm.extension_opcode = None;
4151 i.tm.opcode_modifier.w = 0;
4152 i.tm.opcode_modifier.modrm = 0;
4153 }
4154 }
4155 }
4156 else if (optimize > 1
4157 && !optimize_for_space
4158 && !is_any_vex_encoding (&i.tm)
4159 && i.reg_operands == 2
4160 && i.op[0].regs == i.op[1].regs
4161 && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4162 || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4163 && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4164 {
4165 /* Optimize: -O2:
4166 andb %rN, %rN -> testb %rN, %rN
4167 andw %rN, %rN -> testw %rN, %rN
4168 andq %rN, %rN -> testq %rN, %rN
4169 orb %rN, %rN -> testb %rN, %rN
4170 orw %rN, %rN -> testw %rN, %rN
4171 orq %rN, %rN -> testq %rN, %rN
4172
4173 and outside of 64-bit mode
4174
4175 andl %rN, %rN -> testl %rN, %rN
4176 orl %rN, %rN -> testl %rN, %rN
4177 */
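/* Editorial note: `and'/`or' of a register with itself leaves the
   register unchanged and sets the same flags as `test', so e.g.
   `andl %eax, %eax' (21 C0) is rewritten as `testl %eax, %eax'
   (85 C0), which avoids the register write.  */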
4178 i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4179 }
4180 else if (i.reg_operands == 3
4181 && i.op[0].regs == i.op[1].regs
4182 && !i.types[2].bitfield.xmmword
4183 && (i.tm.opcode_modifier.vex
4184 || ((!i.mask || i.mask->zeroing)
4185 && !i.rounding
4186 && is_evex_encoding (&i.tm)
4187 && (i.vec_encoding != vex_encoding_evex
4188 || cpu_arch_isa_flags.bitfield.cpuavx512vl
4189 || i.tm.cpu_flags.bitfield.cpuavx512vl
4190 || (i.tm.operand_types[2].bitfield.zmmword
4191 && i.types[2].bitfield.ymmword))))
4192 && ((i.tm.base_opcode == 0x55
4193 || i.tm.base_opcode == 0x6655
4194 || i.tm.base_opcode == 0x66df
4195 || i.tm.base_opcode == 0x57
4196 || i.tm.base_opcode == 0x6657
4197 || i.tm.base_opcode == 0x66ef
4198 || i.tm.base_opcode == 0x66f8
4199 || i.tm.base_opcode == 0x66f9
4200 || i.tm.base_opcode == 0x66fa
4201 || i.tm.base_opcode == 0x66fb
4202 || i.tm.base_opcode == 0x42
4203 || i.tm.base_opcode == 0x6642
4204 || i.tm.base_opcode == 0x47
4205 || i.tm.base_opcode == 0x6647)
4206 && i.tm.extension_opcode == None))
4207 {
4208 /* Optimize: -O1:
4209 VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4210 vpsubq and vpsubw:
4211 EVEX VOP %zmmM, %zmmM, %zmmN
4212 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4213 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4214 EVEX VOP %ymmM, %ymmM, %ymmN
4215 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4216 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4217 VEX VOP %ymmM, %ymmM, %ymmN
4218 -> VEX VOP %xmmM, %xmmM, %xmmN
4219 VOP, one of vpandn and vpxor:
4220 VEX VOP %ymmM, %ymmM, %ymmN
4221 -> VEX VOP %xmmM, %xmmM, %xmmN
4222 VOP, one of vpandnd and vpandnq:
4223 EVEX VOP %zmmM, %zmmM, %zmmN
4224 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4225 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4226 EVEX VOP %ymmM, %ymmM, %ymmN
4227 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4228 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4229 VOP, one of vpxord and vpxorq:
4230 EVEX VOP %zmmM, %zmmM, %zmmN
4231 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4232 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4233 EVEX VOP %ymmM, %ymmM, %ymmN
4234 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4235 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4236 VOP, one of kxord and kxorq:
4237 VEX VOP %kM, %kM, %kN
4238 -> VEX kxorw %kM, %kM, %kN
4239 VOP, one of kandnd and kandnq:
4240 VEX VOP %kM, %kM, %kN
4241 -> VEX kandnw %kM, %kM, %kN
4242 */
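/* For example (editorial): the zeroing idiom `vpxord %zmm1, %zmm1,
   %zmm1' (6-byte EVEX encoding) can be emitted as `vpxor %xmm1,
   %xmm1, %xmm1' (4-byte VEX encoding), since a VEX-encoded XMM write
   zeroes the rest of the vector register anyway.  */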
4243 if (is_evex_encoding (&i.tm))
4244 {
4245 if (i.vec_encoding != vex_encoding_evex)
4246 {
4247 i.tm.opcode_modifier.vex = VEX128;
4248 i.tm.opcode_modifier.vexw = VEXW0;
4249 i.tm.opcode_modifier.evex = 0;
4250 }
4251 else if (optimize > 1)
4252 i.tm.opcode_modifier.evex = EVEX128;
4253 else
4254 return;
4255 }
4256 else if (i.tm.operand_types[0].bitfield.class == RegMask)
4257 {
4258 i.tm.base_opcode &= 0xff;
4259 i.tm.opcode_modifier.vexw = VEXW0;
4260 }
4261 else
4262 i.tm.opcode_modifier.vex = VEX128;
4263
4264 if (i.tm.opcode_modifier.vex)
4265 for (j = 0; j < 3; j++)
4266 {
4267 i.types[j].bitfield.xmmword = 1;
4268 i.types[j].bitfield.ymmword = 0;
4269 }
4270 }
4271 else if (i.vec_encoding != vex_encoding_evex
4272 && !i.types[0].bitfield.zmmword
4273 && !i.types[1].bitfield.zmmword
4274 && !i.mask
4275 && !i.broadcast
4276 && is_evex_encoding (&i.tm)
4277 && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4278 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
4279 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f
4280 || (i.tm.base_opcode & ~4) == 0x66db
4281 || (i.tm.base_opcode & ~4) == 0x66eb)
4282 && i.tm.extension_opcode == None)
4283 {
4284 /* Optimize: -O1:
4285 VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4286 vmovdqu32 and vmovdqu64:
4287 EVEX VOP %xmmM, %xmmN
4288 -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4289 EVEX VOP %ymmM, %ymmN
4290 -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4291 EVEX VOP %xmmM, mem
4292 -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4293 EVEX VOP %ymmM, mem
4294 -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4295 EVEX VOP mem, %xmmN
4296 -> VEX vmovdqa|vmovdqu mem, %xmmN (N < 16)
4297 EVEX VOP mem, %ymmN
4298 -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4299 VOP, one of vpand, vpandn, vpor, vpxor:
4300 EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4301 -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4302 EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4303 -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4304 EVEX VOP{d,q} mem, %xmmM, %xmmN
4305 -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4306 EVEX VOP{d,q} mem, %ymmM, %ymmN
4307 -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4308 */
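/* E.g. (editorial): `vmovdqu64 %xmm1, %xmm2' carries a 4-byte EVEX
   prefix (6 bytes total), while plain `vmovdqu %xmm1, %xmm2' uses a
   2-byte VEX prefix (4 bytes total) whenever no EVEX-only feature
   (registers 16-31, masking, broadcast) is required.  */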
4309 for (j = 0; j < i.operands; j++)
4310 if (operand_type_check (i.types[j], disp)
4311 && i.op[j].disps->X_op == O_constant)
4312 {
4313 /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4314 has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4315 bytes, we choose EVEX Disp8 over VEX Disp32. */
4316 int evex_disp8, vex_disp8;
4317 unsigned int memshift = i.memshift;
4318 offsetT n = i.op[j].disps->X_add_number;
4319
4320 evex_disp8 = fits_in_disp8 (n);
4321 i.memshift = 0;
4322 vex_disp8 = fits_in_disp8 (n);
4323 if (evex_disp8 != vex_disp8)
4324 {
4325 i.memshift = memshift;
4326 return;
4327 }
4328
4329 i.types[j].bitfield.disp8 = vex_disp8;
4330 break;
4331 }
4332 if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4333 i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
4334 i.tm.opcode_modifier.vex
4335 = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4336 i.tm.opcode_modifier.vexw = VEXW0;
4337 /* VPAND, VPOR, and VPXOR are commutative. */
4338 if (i.reg_operands == 3 && i.tm.base_opcode != 0x66df)
4339 i.tm.opcode_modifier.commutative = 1;
4340 i.tm.opcode_modifier.evex = 0;
4341 i.tm.opcode_modifier.masking = 0;
4342 i.tm.opcode_modifier.broadcast = 0;
4343 i.tm.opcode_modifier.disp8memshift = 0;
4344 i.memshift = 0;
4345 if (j < i.operands)
4346 i.types[j].bitfield.disp8
4347 = fits_in_disp8 (i.op[j].disps->X_add_number);
4348 }
4349 }
4350
4351 /* Return non-zero for load instruction. */
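/* (Editorial examples: `pop %rbx' and `addl (%rax), %ebx' count as
   loads; `movl %ebx, (%rax)' is a plain store and does not. The
   result feeds the -mlfence-after-load handling below.) */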
4352
4353 static int
4354 load_insn_p (void)
4355 {
4356 unsigned int dest;
4357 int any_vex_p = is_any_vex_encoding (&i.tm);
4358 unsigned int base_opcode = i.tm.base_opcode | 1;
4359
4360 if (!any_vex_p)
4361 {
4362 /* Anysize insns: lea, invlpg, clflush, prefetchnta, prefetcht0,
4363 prefetcht1, prefetcht2, prefetchw, bndmk, bndcl, bndcu, bndcn,
4364 bndstx, bndldx, prefetchwt1, clflushopt, clwb, cldemote. */
4365 if (i.tm.opcode_modifier.anysize)
4366 return 0;
4367
4368 /* pop, popf, popa. */
4369 if (strcmp (i.tm.name, "pop") == 0
4370 || i.tm.base_opcode == 0x9d
4371 || i.tm.base_opcode == 0x61)
4372 return 1;
4373
4374 /* movs, cmps, lods, scas. */
4375 if ((i.tm.base_opcode | 0xb) == 0xaf)
4376 return 1;
4377
4378 /* outs, xlatb. */
4379 if (base_opcode == 0x6f
4380 || i.tm.base_opcode == 0xd7)
4381 return 1;
4382 /* NB: AMD-specific insns with implicit memory operands are
4383 intentionally not covered. */
4384 }
4385
4386 /* No memory operand. */
4387 if (!i.mem_operands)
4388 return 0;
4389
4390 if (any_vex_p)
4391 {
4392 /* vldmxcsr. */
4393 if (i.tm.base_opcode == 0xae
4394 && i.tm.opcode_modifier.vex
4395 && i.tm.opcode_modifier.vexopcode == VEX0F
4396 && i.tm.extension_opcode == 2)
4397 return 1;
4398 }
4399 else
4400 {
4401 /* test, not, neg, mul, imul, div, idiv. */
4402 if ((i.tm.base_opcode == 0xf6 || i.tm.base_opcode == 0xf7)
4403 && i.tm.extension_opcode != 1)
4404 return 1;
4405
4406 /* inc, dec. */
4407 if (base_opcode == 0xff && i.tm.extension_opcode <= 1)
4408 return 1;
4409
4410 /* add, or, adc, sbb, and, sub, xor, cmp. */
4411 if (i.tm.base_opcode >= 0x80 && i.tm.base_opcode <= 0x83)
4412 return 1;
4413
4414 /* bt, bts, btr, btc. */
4415 if (i.tm.base_opcode == 0xfba
4416 && (i.tm.extension_opcode >= 4 && i.tm.extension_opcode <= 7))
4417 return 1;
4418
4419 /* rol, ror, rcl, rcr, shl/sal, shr, sar. */
4420 if ((base_opcode == 0xc1
4421 || (i.tm.base_opcode >= 0xd0 && i.tm.base_opcode <= 0xd3))
4422 && i.tm.extension_opcode != 6)
4423 return 1;
4424
4425 /* cmpxchg8b, cmpxchg16b, xrstors. */
4426 if (i.tm.base_opcode == 0xfc7
4427 && (i.tm.extension_opcode == 1 || i.tm.extension_opcode == 3))
4428 return 1;
4429
4430 /* fxrstor, ldmxcsr, xrstor. */
4431 if (i.tm.base_opcode == 0xfae
4432 && (i.tm.extension_opcode == 1
4433 || i.tm.extension_opcode == 2
4434 || i.tm.extension_opcode == 5))
4435 return 1;
4436
4437 /* lgdt, lidt, lmsw. */
4438 if (i.tm.base_opcode == 0xf01
4439 && (i.tm.extension_opcode == 2
4440 || i.tm.extension_opcode == 3
4441 || i.tm.extension_opcode == 6))
4442 return 1;
4443
4444 /* vmptrld */
4445 if (i.tm.base_opcode == 0xfc7
4446 && i.tm.extension_opcode == 6)
4447 return 1;
4448
4449 /* Check for x87 instructions. */
4450 if (i.tm.base_opcode >= 0xd8 && i.tm.base_opcode <= 0xdf)
4451 {
4452 /* Skip fst, fstp, fstenv, fstcw. */
4453 if (i.tm.base_opcode == 0xd9
4454 && (i.tm.extension_opcode == 2
4455 || i.tm.extension_opcode == 3
4456 || i.tm.extension_opcode == 6
4457 || i.tm.extension_opcode == 7))
4458 return 0;
4459
4460 /* Skip fisttp, fist, fistp, fstp. */
4461 if (i.tm.base_opcode == 0xdb
4462 && (i.tm.extension_opcode == 1
4463 || i.tm.extension_opcode == 2
4464 || i.tm.extension_opcode == 3
4465 || i.tm.extension_opcode == 7))
4466 return 0;
4467
4468 /* Skip fisttp, fst, fstp, fsave, fstsw. */
4469 if (i.tm.base_opcode == 0xdd
4470 && (i.tm.extension_opcode == 1
4471 || i.tm.extension_opcode == 2
4472 || i.tm.extension_opcode == 3
4473 || i.tm.extension_opcode == 6
4474 || i.tm.extension_opcode == 7))
4475 return 0;
4476
4477 /* Skip fisttp, fist, fistp, fbstp, fistp. */
4478 if (i.tm.base_opcode == 0xdf
4479 && (i.tm.extension_opcode == 1
4480 || i.tm.extension_opcode == 2
4481 || i.tm.extension_opcode == 3
4482 || i.tm.extension_opcode == 6
4483 || i.tm.extension_opcode == 7))
4484 return 0;
4485
4486 return 1;
4487 }
4488 }
4489
4490 dest = i.operands - 1;
4491
4492 /* Check fake imm8 operand and 3 source operands. */
4493 if ((i.tm.opcode_modifier.immext
4494 || i.tm.opcode_modifier.vexsources == VEX3SOURCES)
4495 && i.types[dest].bitfield.imm8)
4496 dest--;
4497
4498 /* add, or, adc, sbb, and, sub, xor, cmp, test, xchg, xadd */
4499 if (!any_vex_p
4500 && (base_opcode == 0x1
4501 || base_opcode == 0x9
4502 || base_opcode == 0x11
4503 || base_opcode == 0x19
4504 || base_opcode == 0x21
4505 || base_opcode == 0x29
4506 || base_opcode == 0x31
4507 || base_opcode == 0x39
4508 || (i.tm.base_opcode >= 0x84 && i.tm.base_opcode <= 0x87)
4509 || base_opcode == 0xfc1))
4510 return 1;
4511
4512 /* Check for load instruction. */
4513 return (i.types[dest].bitfield.class != ClassNone
4514 || i.types[dest].bitfield.instance == Accum);
4515 }
4516
4517 /* Output lfence (0F AE E8) after the instruction. */
4518
4519 static void
4520 insert_lfence_after (void)
4521 {
4522 if (lfence_after_load && load_insn_p ())
4523 {
4524 /* There are also two REP string instructions that require
4525 special treatment. Specifically, the compare string (CMPS)
4526 and scan string (SCAS) instructions set EFLAGS in a manner
4527 that depends on the data being compared/scanned. When used
4528 with a REP prefix, the number of iterations may therefore
4529 vary depending on this data. If the data is a program secret
4530 chosen by the adversary using an LVI method,
4531 then this data-dependent behavior may leak some aspect
4532 of the secret. */
4533 if (((i.tm.base_opcode | 0x1) == 0xa7
4534 || (i.tm.base_opcode | 0x1) == 0xaf)
4535 && i.prefix[REP_PREFIX])
4536 {
4537 as_warn (_("`%s` changes flags which would affect control flow behavior"),
4538 i.tm.name);
4539 }
4540 char *p = frag_more (3);
4541 *p++ = 0xf;
4542 *p++ = 0xae;
4543 *p = 0xe8;
4544 }
4545 }
4546
4547 /* Output lfence (0F AE E8) before the instruction. */
4548
4549 static void
4550 insert_lfence_before (void)
4551 {
4552 char *p;
4553
4554 if (is_any_vex_encoding (&i.tm))
4555 return;
4556
4557 if (i.tm.base_opcode == 0xff
4558 && (i.tm.extension_opcode == 2 || i.tm.extension_opcode == 4))
4559 {
4560 /* Insert lfence before indirect branch if needed. */
4561
4562 if (lfence_before_indirect_branch == lfence_branch_none)
4563 return;
4564
4565 if (i.operands != 1)
4566 abort ();
4567
4568 if (i.reg_operands == 1)
4569 {
4570 /* Indirect branch via register. Don't insert lfence with
4571 -mlfence-after-load=yes. */
4572 if (lfence_after_load
4573 || lfence_before_indirect_branch == lfence_branch_memory)
4574 return;
4575 }
4576 else if (i.mem_operands == 1
4577 && lfence_before_indirect_branch != lfence_branch_register)
4578 {
4579 as_warn (_("indirect `%s` with memory operand should be avoided"),
4580 i.tm.name);
4581 return;
4582 }
4583 else
4584 return;
4585
4586 if (last_insn.kind != last_insn_other
4587 && last_insn.seg == now_seg)
4588 {
4589 as_warn_where (last_insn.file, last_insn.line,
4590 _("`%s` skips -mlfence-before-indirect-branch on `%s`"),
4591 last_insn.name, i.tm.name);
4592 return;
4593 }
4594
4595 p = frag_more (3);
4596 *p++ = 0xf;
4597 *p++ = 0xae;
4598 *p = 0xe8;
4599 return;
4600 }
4601
4602 /* Output or/not/shl and lfence before near ret. */
4603 if (lfence_before_ret != lfence_before_ret_none
4604 && (i.tm.base_opcode == 0xc2
4605 || i.tm.base_opcode == 0xc3))
4606 {
4607 if (last_insn.kind != last_insn_other
4608 && last_insn.seg == now_seg)
4609 {
4610 as_warn_where (last_insn.file, last_insn.line,
4611 _("`%s` skips -mlfence-before-ret on `%s`"),
4612 last_insn.name, i.tm.name);
4613 return;
4614 }
4615
4616 /* A near ret ignores the operand size override under CPU64. */
4617 char prefix = flag_code == CODE_64BIT
4618 ? 0x48
4619 : i.prefix[DATA_PREFIX] ? 0x66 : 0x0;
4620
4621 if (lfence_before_ret == lfence_before_ret_not)
4622 {
4623 /* not: 0xf71424, may add prefix
4624 for operand size override or 64-bit code. */
4625 p = frag_more ((prefix ? 2 : 0) + 6 + 3);
4626 if (prefix)
4627 *p++ = prefix;
4628 *p++ = 0xf7;
4629 *p++ = 0x14;
4630 *p++ = 0x24;
4631 if (prefix)
4632 *p++ = prefix;
4633 *p++ = 0xf7;
4634 *p++ = 0x14;
4635 *p++ = 0x24;
4636 }
4637 else
4638 {
4639 p = frag_more ((prefix ? 1 : 0) + 4 + 3);
4640 if (prefix)
4641 *p++ = prefix;
4642 if (lfence_before_ret == lfence_before_ret_or)
4643 {
4644 /* or: 0x830c2400, may add prefix
4645 for operand size override or 64-bit code. */
4646 *p++ = 0x83;
4647 *p++ = 0x0c;
4648 }
4649 else
4650 {
4651 /* shl: 0xc1242400, may add prefix
4652 for operand size override or 64-bit code. */
4653 *p++ = 0xc1;
4654 *p++ = 0x24;
4655 }
4656
4657 *p++ = 0x24;
4658 *p++ = 0x0;
4659 }
4660
4661 *p++ = 0xf;
4662 *p++ = 0xae;
4663 *p = 0xe8;
4664 }
4665 }
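/* Editorial illustration: with -mlfence-before-ret=not in 64-bit
   code, a `ret' is preceded by
       48 F7 14 24    notq (%rsp)
       48 F7 14 24    notq (%rsp)
       0F AE E8       lfence
   the double `not' leaves the return address unchanged while the
   `lfence' serializes preceding loads before the return.  */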
4666
4667 /* This is the guts of the machine-dependent assembler. LINE points to a
4668 machine dependent instruction. This function is supposed to emit
4669 the frags/bytes it assembles to. */
4670
4671 void
4672 md_assemble (char *line)
4673 {
4674 unsigned int j;
4675 char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4676 const insn_template *t;
4677
4678 /* Initialize globals. */
4679 memset (&i, '\0', sizeof (i));
4680 for (j = 0; j < MAX_OPERANDS; j++)
4681 i.reloc[j] = NO_RELOC;
4682 memset (disp_expressions, '\0', sizeof (disp_expressions));
4683 memset (im_expressions, '\0', sizeof (im_expressions));
4684 save_stack_p = save_stack;
4685
4686 /* First parse an instruction mnemonic & call i386_operand for the operands.
4687 We assume that the scrubber has arranged it so that line[0] is the valid
4688 start of a (possibly prefixed) mnemonic. */
4689
4690 line = parse_insn (line, mnemonic);
4691 if (line == NULL)
4692 return;
4693 mnem_suffix = i.suffix;
4694
4695 line = parse_operands (line, mnemonic);
4696 this_operand = -1;
4697 xfree (i.memop1_string);
4698 i.memop1_string = NULL;
4699 if (line == NULL)
4700 return;
4701
4702 /* Now we've parsed the mnemonic into a set of templates, and have the
4703 operands at hand. */
4704
4705 /* All Intel opcodes have reversed operands except for "bound", "enter",
4706 "monitor*", "mwait*", "tpause", and "umwait". We also don't reverse
4707 intersegment "jmp" and "call" instructions with 2 immediate operands so
4708 that the immediate segment precedes the offset, as it does when in AT&T
4709 mode. */
4710 if (intel_syntax
4711 && i.operands > 1
4712 && (strcmp (mnemonic, "bound") != 0)
4713 && (strcmp (mnemonic, "invlpga") != 0)
4714 && (strncmp (mnemonic, "monitor", 7) != 0)
4715 && (strncmp (mnemonic, "mwait", 5) != 0)
4716 && (strcmp (mnemonic, "tpause") != 0)
4717 && (strcmp (mnemonic, "umwait") != 0)
4718 && !(operand_type_check (i.types[0], imm)
4719 && operand_type_check (i.types[1], imm)))
4720 swap_operands ();
4721
4722 /* The order of the immediates should be reversed
4723 for 2 immediates extrq and insertq instructions */
4724 if (i.imm_operands == 2
4725 && (strcmp (mnemonic, "extrq") == 0
4726 || strcmp (mnemonic, "insertq") == 0))
4727 swap_2_operands (0, 1);
4728
4729 if (i.imm_operands)
4730 optimize_imm ();
4731
4732 /* Don't optimize displacement for movabs since it only takes 64bit
4733 displacement. */
4734 if (i.disp_operands
4735 && i.disp_encoding != disp_encoding_32bit
4736 && (flag_code != CODE_64BIT
4737 || strcmp (mnemonic, "movabs") != 0))
4738 optimize_disp ();
4739
4740 /* Next, we find a template that matches the given insn,
4741 making sure the overlap of the given operands types is consistent
4742 with the template operand types. */
4743
4744 if (!(t = match_template (mnem_suffix)))
4745 return;
4746
4747 if (sse_check != check_none
4748 && !i.tm.opcode_modifier.noavx
4749 && !i.tm.cpu_flags.bitfield.cpuavx
4750 && !i.tm.cpu_flags.bitfield.cpuavx512f
4751 && (i.tm.cpu_flags.bitfield.cpusse
4752 || i.tm.cpu_flags.bitfield.cpusse2
4753 || i.tm.cpu_flags.bitfield.cpusse3
4754 || i.tm.cpu_flags.bitfield.cpussse3
4755 || i.tm.cpu_flags.bitfield.cpusse4_1
4756 || i.tm.cpu_flags.bitfield.cpusse4_2
4757 || i.tm.cpu_flags.bitfield.cpupclmul
4758 || i.tm.cpu_flags.bitfield.cpuaes
4759 || i.tm.cpu_flags.bitfield.cpusha
4760 || i.tm.cpu_flags.bitfield.cpugfni))
4761 {
4762 (sse_check == check_warning
4763 ? as_warn
4764 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4765 }
4766
4767 if (i.tm.opcode_modifier.fwait)
4768 if (!add_prefix (FWAIT_OPCODE))
4769 return;
4770
4771 /* Check if REP prefix is OK. */
4772 if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
4773 {
4774 as_bad (_("invalid instruction `%s' after `%s'"),
4775 i.tm.name, i.rep_prefix);
4776 return;
4777 }
4778
4779 /* Check for lock without a lockable instruction. Destination operand
4780 must be memory unless it is xchg (0x86). */
4781 if (i.prefix[LOCK_PREFIX]
4782 && (!i.tm.opcode_modifier.islockable
4783 || i.mem_operands == 0
4784 || (i.tm.base_opcode != 0x86
4785 && !(i.flags[i.operands - 1] & Operand_Mem))))
4786 {
4787 as_bad (_("expecting lockable instruction after `lock'"));
4788 return;
4789 }
4790
4791 /* Check for data size prefix on VEX/XOP/EVEX encoded and SIMD insns. */
4792 if (i.prefix[DATA_PREFIX]
4793 && (is_any_vex_encoding (&i.tm)
4794 || i.tm.operand_types[i.imm_operands].bitfield.class >= RegMMX
4795 || i.tm.operand_types[i.imm_operands + 1].bitfield.class >= RegMMX))
4796 {
4797 as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4798 return;
4799 }
4800
4801 /* Check if HLE prefix is OK. */
4802 if (i.hle_prefix && !check_hle ())
4803 return;
4804
4805 /* Check BND prefix. */
4806 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4807 as_bad (_("expecting valid branch instruction after `bnd'"));
4808
4809 /* Check NOTRACK prefix. */
4810 if (i.notrack_prefix && !i.tm.opcode_modifier.notrackprefixok)
4811 as_bad (_("expecting indirect branch instruction after `notrack'"));
4812
4813 if (i.tm.cpu_flags.bitfield.cpumpx)
4814 {
4815 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4816 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4817 else if (flag_code != CODE_16BIT
4818 ? i.prefix[ADDR_PREFIX]
4819 : i.mem_operands && !i.prefix[ADDR_PREFIX])
4820 as_bad (_("16-bit address isn't allowed in MPX instructions"));
4821 }
4822
4823 /* Insert BND prefix. */
4824 if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4825 {
4826 if (!i.prefix[BND_PREFIX])
4827 add_prefix (BND_PREFIX_OPCODE);
4828 else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4829 {
4830 as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4831 i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4832 }
4833 }
4834
4835 /* Check string instruction segment overrides. */
4836 if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
4837 {
4838 gas_assert (i.mem_operands);
4839 if (!check_string ())
4840 return;
4841 i.disp_operands = 0;
4842 }
4843
4844 if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4845 optimize_encoding ();
4846
4847 if (!process_suffix ())
4848 return;
4849
4850 /* Update operand types and check extended states. */
4851 for (j = 0; j < i.operands; j++)
4852 {
4853 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4854 switch (i.tm.operand_types[j].bitfield.class)
4855 {
4856 default:
4857 break;
4858 case RegMMX:
4859 i.xstate |= xstate_mmx;
4860 break;
4861 case RegMask:
4862 i.xstate |= xstate_zmm;
4863 break;
4864 case RegSIMD:
4865 if (i.tm.operand_types[j].bitfield.tmmword)
4866 i.xstate |= xstate_tmm;
4867 else if (i.tm.operand_types[j].bitfield.zmmword)
4868 i.xstate |= xstate_zmm;
4869 else if (i.tm.operand_types[j].bitfield.ymmword)
4870 i.xstate |= xstate_ymm;
4871 else if (i.tm.operand_types[j].bitfield.xmmword)
4872 i.xstate |= xstate_xmm;
4873 break;
4874 }
4875 }
4876
4877 /* Make still unresolved immediate matches conform to size of immediate
4878 given in i.suffix. */
4879 if (!finalize_imm ())
4880 return;
4881
4882 if (i.types[0].bitfield.imm1)
4883 i.imm_operands = 0; /* kludge for shift insns. */
4884
4885 /* We only need to check those implicit registers for instructions
4886 with 3 operands or less. */
4887 if (i.operands <= 3)
4888 for (j = 0; j < i.operands; j++)
4889 if (i.types[j].bitfield.instance != InstanceNone
4890 && !i.types[j].bitfield.xmmword)
4891 i.reg_operands--;
4892
4893 /* For insns with operands there are more diddles to do to the opcode. */
4894 if (i.operands)
4895 {
4896 if (!process_operands ())
4897 return;
4898 }
4899 else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4900 {
4901 /* UnixWare `fsub' with no args is an alias for `fsubp'; likewise fadd -> faddp, etc. */
4902 as_warn (_("translating to `%sp'"), i.tm.name);
4903 }
4904
4905 if (is_any_vex_encoding (&i.tm))
4906 {
4907 if (!cpu_arch_flags.bitfield.cpui286)
4908 {
4909 as_bad (_("instruction `%s' isn't supported outside of protected mode."),
4910 i.tm.name);
4911 return;
4912 }
4913
4914 /* Check for explicit REX prefix. */
4915 if (i.prefix[REX_PREFIX] || i.rex_encoding)
4916 {
4917 as_bad (_("REX prefix invalid with `%s'"), i.tm.name);
4918 return;
4919 }
4920
4921 if (i.tm.opcode_modifier.vex)
4922 build_vex_prefix (t);
4923 else
4924 build_evex_prefix ();
4925
4926 /* The individual REX.RXBW bits got consumed. */
4927 i.rex &= REX_OPCODE;
4928 }
4929
4930 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
4931 instructions may define INT_OPCODE as well, so avoid this corner
4932 case for those instructions that use MODRM. */
4933 if (i.tm.base_opcode == INT_OPCODE
4934 && !i.tm.opcode_modifier.modrm
4935 && i.op[0].imms->X_add_number == 3)
4936 {
4937 i.tm.base_opcode = INT3_OPCODE;
4938 i.imm_operands = 0;
4939 }
4940
4941 if ((i.tm.opcode_modifier.jump == JUMP
4942 || i.tm.opcode_modifier.jump == JUMP_BYTE
4943 || i.tm.opcode_modifier.jump == JUMP_DWORD)
4944 && i.op[0].disps->X_op == O_constant)
4945 {
4946 /* Convert "jmp constant" (and "call constant") to a jump (call) to
4947 the absolute address given by the constant. Since ix86 jumps and
4948 calls are pc relative, we need to generate a reloc. */
4949 i.op[0].disps->X_add_symbol = &abs_symbol;
4950 i.op[0].disps->X_op = O_symbol;
4951 }
4952
4953 /* For 8 bit registers we need an empty rex prefix. Also if the
4954 instruction already has a prefix, we need to convert old
4955 registers to new ones. */
4956
4957 if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
4958 && (i.op[0].regs->reg_flags & RegRex64) != 0)
4959 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
4960 && (i.op[1].regs->reg_flags & RegRex64) != 0)
4961 || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
4962 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
4963 && i.rex != 0))
4964 {
4965 int x;
4966
4967 i.rex |= REX_OPCODE;
4968 for (x = 0; x < 2; x++)
4969 {
4970 /* Look for 8 bit operand that uses old registers. */
4971 if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
4972 && (i.op[x].regs->reg_flags & RegRex64) == 0)
4973 {
4974 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4975 /* In case it is a "hi" register, give up. */
4976 if (i.op[x].regs->reg_num > 3)
4977 as_bad (_("can't encode register '%s%s' in an "
4978 "instruction requiring REX prefix."),
4979 register_prefix, i.op[x].regs->reg_name);
4980
4981 /* Otherwise it is equivalent to the extended register.
4982 Since the encoding doesn't change this is merely
4983 cosmetic cleanup for debug output. */
4984
4985 i.op[x].regs = i.op[x].regs + 8;
4986 }
4987 }
4988 }
4989
4990 if (i.rex == 0 && i.rex_encoding)
4991 {
4992 /* Check if we can add a REX_OPCODE byte. Look for 8 bit operand
4993 that uses legacy register. If it is "hi" register, don't add
4994 the REX_OPCODE byte. */
4995 int x;
4996 for (x = 0; x < 2; x++)
4997 if (i.types[x].bitfield.class == Reg
4998 && i.types[x].bitfield.byte
4999 && (i.op[x].regs->reg_flags & RegRex64) == 0
5000 && i.op[x].regs->reg_num > 3)
5001 {
5002 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
5003 i.rex_encoding = FALSE;
5004 break;
5005 }
5006
5007 if (i.rex_encoding)
5008 i.rex = REX_OPCODE;
5009 }
5010
5011 if (i.rex != 0)
5012 add_prefix (REX_OPCODE | i.rex);
5013
5014 insert_lfence_before ();
5015
5016 /* We are ready to output the insn. */
5017 output_insn ();
5018
5019 insert_lfence_after ();
5020
5021 last_insn.seg = now_seg;
5022
5023 if (i.tm.opcode_modifier.isprefix)
5024 {
5025 last_insn.kind = last_insn_prefix;
5026 last_insn.name = i.tm.name;
5027 last_insn.file = as_where (&last_insn.line);
5028 }
5029 else
5030 last_insn.kind = last_insn_other;
5031 }
5032
5033 static char *
5034 parse_insn (char *line, char *mnemonic)
5035 {
5036 char *l = line;
5037 char *token_start = l;
5038 char *mnem_p;
5039 int supported;
5040 const insn_template *t;
5041 char *dot_p = NULL;
5042
5043 while (1)
5044 {
5045 mnem_p = mnemonic;
5046 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
5047 {
5048 if (*mnem_p == '.')
5049 dot_p = mnem_p;
5050 mnem_p++;
5051 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
5052 {
5053 as_bad (_("no such instruction: `%s'"), token_start);
5054 return NULL;
5055 }
5056 l++;
5057 }
5058 if (!is_space_char (*l)
5059 && *l != END_OF_INSN
5060 && (intel_syntax
5061 || (*l != PREFIX_SEPARATOR
5062 && *l != ',')))
5063 {
5064 as_bad (_("invalid character %s in mnemonic"),
5065 output_invalid (*l));
5066 return NULL;
5067 }
5068 if (token_start == l)
5069 {
5070 if (!intel_syntax && *l == PREFIX_SEPARATOR)
5071 as_bad (_("expecting prefix; got nothing"));
5072 else
5073 as_bad (_("expecting mnemonic; got nothing"));
5074 return NULL;
5075 }
5076
5077 /* Look up instruction (or prefix) via hash table. */
5078 current_templates = (const templates *) str_hash_find (op_hash, mnemonic);
5079
5080 if (*l != END_OF_INSN
5081 && (!is_space_char (*l) || l[1] != END_OF_INSN)
5082 && current_templates
5083 && current_templates->start->opcode_modifier.isprefix)
5084 {
5085 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
5086 {
5087 as_bad ((flag_code != CODE_64BIT
5088 ? _("`%s' is only supported in 64-bit mode")
5089 : _("`%s' is not supported in 64-bit mode")),
5090 current_templates->start->name);
5091 return NULL;
5092 }
5093 /* If we are in 16-bit mode, do not allow addr16 or data16.
5094 Similarly, in 32-bit mode, do not allow addr32 or data32. */
5095 if ((current_templates->start->opcode_modifier.size == SIZE16
5096 || current_templates->start->opcode_modifier.size == SIZE32)
5097 && flag_code != CODE_64BIT
5098 && ((current_templates->start->opcode_modifier.size == SIZE32)
5099 ^ (flag_code == CODE_16BIT)))
5100 {
5101 as_bad (_("redundant %s prefix"),
5102 current_templates->start->name);
5103 return NULL;
5104 }
5105 if (current_templates->start->opcode_length == 0)
5106 {
5107 /* Handle pseudo prefixes. */
5108 switch (current_templates->start->base_opcode)
5109 {
5110 case Prefix_Disp8:
5111 /* {disp8} */
5112 i.disp_encoding = disp_encoding_8bit;
5113 break;
5114 case Prefix_Disp16:
5115 /* {disp16} */
5116 i.disp_encoding = disp_encoding_16bit;
5117 break;
5118 case Prefix_Disp32:
5119 /* {disp32} */
5120 i.disp_encoding = disp_encoding_32bit;
5121 break;
5122 case Prefix_Load:
5123 /* {load} */
5124 i.dir_encoding = dir_encoding_load;
5125 break;
5126 case Prefix_Store:
5127 /* {store} */
5128 i.dir_encoding = dir_encoding_store;
5129 break;
5130 case Prefix_VEX:
5131 /* {vex} */
5132 i.vec_encoding = vex_encoding_vex;
5133 break;
5134 case Prefix_VEX3:
5135 /* {vex3} */
5136 i.vec_encoding = vex_encoding_vex3;
5137 break;
5138 case Prefix_EVEX:
5139 /* {evex} */
5140 i.vec_encoding = vex_encoding_evex;
5141 break;
5142 case Prefix_REX:
5143 /* {rex} */
5144 i.rex_encoding = TRUE;
5145 break;
5146 case Prefix_NoOptimize:
5147 /* {nooptimize} */
5148 i.no_optimize = TRUE;
5149 break;
5150 default:
5151 abort ();
5152 }
5153 }
5154 else
5155 {
5156 /* Add prefix, checking for repeated prefixes. */
5157 switch (add_prefix (current_templates->start->base_opcode))
5158 {
5159 case PREFIX_EXIST:
5160 return NULL;
5161 case PREFIX_DS:
5162 if (current_templates->start->cpu_flags.bitfield.cpuibt)
5163 i.notrack_prefix = current_templates->start->name;
5164 break;
5165 case PREFIX_REP:
5166 if (current_templates->start->cpu_flags.bitfield.cpuhle)
5167 i.hle_prefix = current_templates->start->name;
5168 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
5169 i.bnd_prefix = current_templates->start->name;
5170 else
5171 i.rep_prefix = current_templates->start->name;
5172 break;
5173 default:
5174 break;
5175 }
5176 }
5177 /* Skip past PREFIX_SEPARATOR and reset token_start. */
5178 token_start = ++l;
5179 }
5180 else
5181 break;
5182 }
5183
5184 if (!current_templates)
5185 {
5186 /* Deprecated functionality (new code should use pseudo-prefixes instead):
5187 Check if we should swap operands or force a 32bit displacement in
5188 encoding. */
5189 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
5190 i.dir_encoding = dir_encoding_swap;
5191 else if (mnem_p - 3 == dot_p
5192 && dot_p[1] == 'd'
5193 && dot_p[2] == '8')
5194 i.disp_encoding = disp_encoding_8bit;
5195 else if (mnem_p - 4 == dot_p
5196 && dot_p[1] == 'd'
5197 && dot_p[2] == '3'
5198 && dot_p[3] == '2')
5199 i.disp_encoding = disp_encoding_32bit;
5200 else
5201 goto check_suffix;
5202 mnem_p = dot_p;
5203 *dot_p = '\0';
5204 current_templates = (const templates *) str_hash_find (op_hash, mnemonic);
5205 }
5206
5207 if (!current_templates)
5208 {
5209 check_suffix:
5210 if (mnem_p > mnemonic)
5211 {
5212 /* See if we can get a match by trimming off a suffix. */
5213 switch (mnem_p[-1])
5214 {
5215 case WORD_MNEM_SUFFIX:
5216 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
5217 i.suffix = SHORT_MNEM_SUFFIX;
5218 else
5219 /* Fall through. */
5220 case BYTE_MNEM_SUFFIX:
5221 case QWORD_MNEM_SUFFIX:
5222 i.suffix = mnem_p[-1];
5223 mnem_p[-1] = '\0';
5224 current_templates
5225 = (const templates *) str_hash_find (op_hash, mnemonic);
5226 break;
5227 case SHORT_MNEM_SUFFIX:
5228 case LONG_MNEM_SUFFIX:
5229 if (!intel_syntax)
5230 {
5231 i.suffix = mnem_p[-1];
5232 mnem_p[-1] = '\0';
5233 current_templates
5234 = (const templates *) str_hash_find (op_hash, mnemonic);
5235 }
5236 break;
5237
5238 /* Intel Syntax. */
5239 case 'd':
5240 if (intel_syntax)
5241 {
5242 if (intel_float_operand (mnemonic) == 1)
5243 i.suffix = SHORT_MNEM_SUFFIX;
5244 else
5245 i.suffix = LONG_MNEM_SUFFIX;
5246 mnem_p[-1] = '\0';
5247 current_templates
5248 = (const templates *) str_hash_find (op_hash, mnemonic);
5249 }
5250 break;
5251 }
5252 }
5253
5254 if (!current_templates)
5255 {
5256 as_bad (_("no such instruction: `%s'"), token_start);
5257 return NULL;
5258 }
5259 }
5260
5261 if (current_templates->start->opcode_modifier.jump == JUMP
5262 || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
5263 {
5264 /* Check for a branch hint. We allow ",pt" and ",pn" for
5265 predict taken and predict not taken respectively.
5266 I'm not sure that branch hints actually do anything on loop
5267 and jcxz insns (JumpByte) for current Pentium4 chips. They
5268 may work in the future and it doesn't hurt to accept them
5269 now. */
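/* E.g. (editorial): `jne,pt target' adds a 3E (DS segment) prefix
   byte as the "predict taken" hint and `jne,pn target' a 2E (CS
   segment) prefix as "predict not taken".  */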
5270 if (l[0] == ',' && l[1] == 'p')
5271 {
5272 if (l[2] == 't')
5273 {
5274 if (!add_prefix (DS_PREFIX_OPCODE))
5275 return NULL;
5276 l += 3;
5277 }
5278 else if (l[2] == 'n')
5279 {
5280 if (!add_prefix (CS_PREFIX_OPCODE))
5281 return NULL;
5282 l += 3;
5283 }
5284 }
5285 }
5286 /* Any other comma loses. */
5287 if (*l == ',')
5288 {
5289 as_bad (_("invalid character %s in mnemonic"),
5290 output_invalid (*l));
5291 return NULL;
5292 }
5293
5294 /* Check if instruction is supported on specified architecture. */
5295 supported = 0;
5296 for (t = current_templates->start; t < current_templates->end; ++t)
5297 {
5298 supported |= cpu_flags_match (t);
5299 if (supported == CPU_FLAGS_PERFECT_MATCH)
5300 {
5301 if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
5302 as_warn (_("use .code16 to ensure correct addressing mode"));
5303
5304 return l;
5305 }
5306 }
5307
5308 if (!(supported & CPU_FLAGS_64BIT_MATCH))
5309 as_bad (flag_code == CODE_64BIT
5310 ? _("`%s' is not supported in 64-bit mode")
5311 : _("`%s' is only supported in 64-bit mode"),
5312 current_templates->start->name);
5313 else
5314 as_bad (_("`%s' is not supported on `%s%s'"),
5315 current_templates->start->name,
5316 cpu_arch_name ? cpu_arch_name : default_arch,
5317 cpu_sub_arch_name ? cpu_sub_arch_name : "");
5318
5319 return NULL;
5320 }
5321
5322 static char *
5323 parse_operands (char *l, const char *mnemonic)
5324 {
5325 char *token_start;
5326
5327 /* 1 if operand is pending after ','. */
5328 unsigned int expecting_operand = 0;
5329
5330 /* Non-zero if operand parens not balanced. */
5331 unsigned int paren_not_balanced;
5332
5333 while (*l != END_OF_INSN)
5334 {
5335 /* Skip optional white space before operand. */
5336 if (is_space_char (*l))
5337 ++l;
5338 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
5339 {
5340 as_bad (_("invalid character %s before operand %d"),
5341 output_invalid (*l),
5342 i.operands + 1);
5343 return NULL;
5344 }
5345 token_start = l; /* After white space. */
5346 paren_not_balanced = 0;
5347 while (paren_not_balanced || *l != ',')
5348 {
5349 if (*l == END_OF_INSN)
5350 {
5351 if (paren_not_balanced)
5352 {
5353 if (!intel_syntax)
5354 as_bad (_("unbalanced parenthesis in operand %d."),
5355 i.operands + 1);
5356 else
5357 as_bad (_("unbalanced brackets in operand %d."),
5358 i.operands + 1);
5359 return NULL;
5360 }
5361 else
5362 break; /* we are done */
5363 }
5364 else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
5365 {
5366 as_bad (_("invalid character %s in operand %d"),
5367 output_invalid (*l),
5368 i.operands + 1);
5369 return NULL;
5370 }
5371 if (!intel_syntax)
5372 {
5373 if (*l == '(')
5374 ++paren_not_balanced;
5375 if (*l == ')')
5376 --paren_not_balanced;
5377 }
5378 else
5379 {
5380 if (*l == '[')
5381 ++paren_not_balanced;
5382 if (*l == ']')
5383 --paren_not_balanced;
5384 }
5385 l++;
5386 }
5387 if (l != token_start)
5388 { /* Yes, we've read in another operand. */
5389 unsigned int operand_ok;
5390 this_operand = i.operands++;
5391 if (i.operands > MAX_OPERANDS)
5392 {
5393 as_bad (_("spurious operands; (%d operands/instruction max)"),
5394 MAX_OPERANDS);
5395 return NULL;
5396 }
5397 i.types[this_operand].bitfield.unspecified = 1;
5398 /* Now parse operand adding info to 'i' as we go along. */
5399 END_STRING_AND_SAVE (l);
5400
5401 if (i.mem_operands > 1)
5402 {
5403 as_bad (_("too many memory references for `%s'"),
5404 mnemonic);
5405 return 0;
5406 }
5407
5408 if (intel_syntax)
5409 operand_ok =
5410 i386_intel_operand (token_start,
5411 intel_float_operand (mnemonic));
5412 else
5413 operand_ok = i386_att_operand (token_start);
5414
5415 RESTORE_END_STRING (l);
5416 if (!operand_ok)
5417 return NULL;
5418 }
5419 else
5420 {
5421 if (expecting_operand)
5422 {
5423 expecting_operand_after_comma:
5424 as_bad (_("expecting operand after ','; got nothing"));
5425 return NULL;
5426 }
5427 if (*l == ',')
5428 {
5429 as_bad (_("expecting operand before ','; got nothing"));
5430 return NULL;
5431 }
5432 }
5433
5434 /* Now *l must be either ',' or END_OF_INSN. */
5435 if (*l == ',')
5436 {
5437 if (*++l == END_OF_INSN)
5438 {
5439 /* Just skip it; if it's \n, complain. */
5440 goto expecting_operand_after_comma;
5441 }
5442 expecting_operand = 1;
5443 }
5444 }
5445 return l;
5446 }
5447
5448 static void
5449 swap_2_operands (int xchg1, int xchg2)
5450 {
5451 union i386_op temp_op;
5452 i386_operand_type temp_type;
5453 unsigned int temp_flags;
5454 enum bfd_reloc_code_real temp_reloc;
5455
5456 temp_type = i.types[xchg2];
5457 i.types[xchg2] = i.types[xchg1];
5458 i.types[xchg1] = temp_type;
5459
5460 temp_flags = i.flags[xchg2];
5461 i.flags[xchg2] = i.flags[xchg1];
5462 i.flags[xchg1] = temp_flags;
5463
5464 temp_op = i.op[xchg2];
5465 i.op[xchg2] = i.op[xchg1];
5466 i.op[xchg1] = temp_op;
5467
5468 temp_reloc = i.reloc[xchg2];
5469 i.reloc[xchg2] = i.reloc[xchg1];
5470 i.reloc[xchg1] = temp_reloc;
5471
5472 if (i.mask)
5473 {
5474 if (i.mask->operand == xchg1)
5475 i.mask->operand = xchg2;
5476 else if (i.mask->operand == xchg2)
5477 i.mask->operand = xchg1;
5478 }
5479 if (i.broadcast)
5480 {
5481 if (i.broadcast->operand == xchg1)
5482 i.broadcast->operand = xchg2;
5483 else if (i.broadcast->operand == xchg2)
5484 i.broadcast->operand = xchg1;
5485 }
5486 if (i.rounding)
5487 {
5488 if (i.rounding->operand == xchg1)
5489 i.rounding->operand = xchg2;
5490 else if (i.rounding->operand == xchg2)
5491 i.rounding->operand = xchg1;
5492 }
5493 }
5494
5495 static void
5496 swap_operands (void)
5497 {
5498 switch (i.operands)
5499 {
5500 case 5:
5501 case 4:
5502 swap_2_operands (1, i.operands - 2);
5503 /* Fall through. */
5504 case 3:
5505 case 2:
5506 swap_2_operands (0, i.operands - 1);
5507 break;
5508 default:
5509 abort ();
5510 }
5511
5512 if (i.mem_operands == 2)
5513 {
5514 const seg_entry *temp_seg;
5515 temp_seg = i.seg[0];
5516 i.seg[0] = i.seg[1];
5517 i.seg[1] = temp_seg;
5518 }
5519 }
5520
5521 /* Try to ensure constant immediates are represented in the smallest
5522 opcode possible. */
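/* For instance (editorial), `addl $3, %eax' can then match the
   sign-extended imm8 template (83 C0 03, 3 bytes) rather than the
   imm32 form (05 03 00 00 00, 5 bytes).  */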
5523 static void
5524 optimize_imm (void)
5525 {
5526 char guess_suffix = 0;
5527 int op;
5528
5529 if (i.suffix)
5530 guess_suffix = i.suffix;
5531 else if (i.reg_operands)
5532 {
5533 /* Figure out a suffix from the last register operand specified.
5534 We can't do this properly yet, i.e. excluding special register
5535 instances, but the following works for instructions with
5536 immediates. In any case, we can't set i.suffix yet. */
5537 for (op = i.operands; --op >= 0;)
5538 if (i.types[op].bitfield.class != Reg)
5539 continue;
5540 else if (i.types[op].bitfield.byte)
5541 {
5542 guess_suffix = BYTE_MNEM_SUFFIX;
5543 break;
5544 }
5545 else if (i.types[op].bitfield.word)
5546 {
5547 guess_suffix = WORD_MNEM_SUFFIX;
5548 break;
5549 }
5550 else if (i.types[op].bitfield.dword)
5551 {
5552 guess_suffix = LONG_MNEM_SUFFIX;
5553 break;
5554 }
5555 else if (i.types[op].bitfield.qword)
5556 {
5557 guess_suffix = QWORD_MNEM_SUFFIX;
5558 break;
5559 }
5560 }
5561 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5562 guess_suffix = WORD_MNEM_SUFFIX;
5563
5564 for (op = i.operands; --op >= 0;)
5565 if (operand_type_check (i.types[op], imm))
5566 {
5567 switch (i.op[op].imms->X_op)
5568 {
5569 case O_constant:
5570 /* If a suffix is given, this operand may be shortened. */
5571 switch (guess_suffix)
5572 {
5573 case LONG_MNEM_SUFFIX:
5574 i.types[op].bitfield.imm32 = 1;
5575 i.types[op].bitfield.imm64 = 1;
5576 break;
5577 case WORD_MNEM_SUFFIX:
5578 i.types[op].bitfield.imm16 = 1;
5579 i.types[op].bitfield.imm32 = 1;
5580 i.types[op].bitfield.imm32s = 1;
5581 i.types[op].bitfield.imm64 = 1;
5582 break;
5583 case BYTE_MNEM_SUFFIX:
5584 i.types[op].bitfield.imm8 = 1;
5585 i.types[op].bitfield.imm8s = 1;
5586 i.types[op].bitfield.imm16 = 1;
5587 i.types[op].bitfield.imm32 = 1;
5588 i.types[op].bitfield.imm32s = 1;
5589 i.types[op].bitfield.imm64 = 1;
5590 break;
5591 }
5592
5593 /* If this operand is at most 16 bits, convert it
5594 to a signed 16 bit number before trying to see
5595 whether it will fit in an even smaller size.
5596 This allows a 16-bit operand such as $0xffe0 to
5597 be recognised as within Imm8S range. */
5598 if ((i.types[op].bitfield.imm16)
5599 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
5600 {
5601 i.op[op].imms->X_add_number =
5602 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5603 }
5604 #ifdef BFD64
5605 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
5606 if ((i.types[op].bitfield.imm32)
5607 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5608 == 0))
5609 {
5610 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5611 ^ ((offsetT) 1 << 31))
5612 - ((offsetT) 1 << 31));
5613 }
5614 #endif
5615 i.types[op]
5616 = operand_type_or (i.types[op],
5617 smallest_imm_type (i.op[op].imms->X_add_number));
5618
5619 /* We must avoid matching Imm32 templates when only a 64bit
5620 immediate is available. */
5621 if (guess_suffix == QWORD_MNEM_SUFFIX)
5622 i.types[op].bitfield.imm32 = 0;
5623 break;
5624
5625 case O_absent:
5626 case O_register:
5627 abort ();
5628
5629 /* Symbols and expressions. */
5630 default:
5631 /* Convert symbolic operand to proper sizes for matching, but don't
5632 prevent matching a set of insns that only supports sizes other
5633 than those matching the insn suffix. */
5634 {
5635 i386_operand_type mask, allowed;
5636 const insn_template *t;
5637
5638 operand_type_set (&mask, 0);
5639 operand_type_set (&allowed, 0);
5640
5641 for (t = current_templates->start;
5642 t < current_templates->end;
5643 ++t)
5644 {
5645 allowed = operand_type_or (allowed, t->operand_types[op]);
5646 allowed = operand_type_and (allowed, anyimm);
5647 }
5648 switch (guess_suffix)
5649 {
5650 case QWORD_MNEM_SUFFIX:
5651 mask.bitfield.imm64 = 1;
5652 mask.bitfield.imm32s = 1;
5653 break;
5654 case LONG_MNEM_SUFFIX:
5655 mask.bitfield.imm32 = 1;
5656 break;
5657 case WORD_MNEM_SUFFIX:
5658 mask.bitfield.imm16 = 1;
5659 break;
5660 case BYTE_MNEM_SUFFIX:
5661 mask.bitfield.imm8 = 1;
5662 break;
5663 default:
5664 break;
5665 }
5666 allowed = operand_type_and (mask, allowed);
5667 if (!operand_type_all_zero (&allowed))
5668 i.types[op] = operand_type_and (i.types[op], mask);
5669 }
5670 break;
5671 }
5672 }
5673 }
5674
5675 /* Try to use the smallest displacement type too. */
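/* E.g. (editorial): `movl %eax, 16(%rbx)' fits a disp8 (89 43 10)
   instead of a disp32 (89 83 10 00 00 00).  */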
5676 static void
5677 optimize_disp (void)
5678 {
5679 int op;
5680
5681 for (op = i.operands; --op >= 0;)
5682 if (operand_type_check (i.types[op], disp))
5683 {
5684 if (i.op[op].disps->X_op == O_constant)
5685 {
5686 offsetT op_disp = i.op[op].disps->X_add_number;
5687
5688 if (i.types[op].bitfield.disp16
5689 && (op_disp & ~(offsetT) 0xffff) == 0)
5690 {
5691 /* If this operand is at most 16 bits, convert
5692 to a signed 16 bit number and don't use 64bit
5693 displacement. */
5694 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5695 i.types[op].bitfield.disp64 = 0;
5696 }
5697 #ifdef BFD64
5698 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
5699 if (i.types[op].bitfield.disp32
5700 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5701 {
5702 /* If this operand is at most 32 bits, convert
5703 to a signed 32 bit number and don't use 64bit
5704 displacement. */
5705 op_disp &= (((offsetT) 2 << 31) - 1);
5706 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5707 i.types[op].bitfield.disp64 = 0;
5708 }
5709 #endif
5710 if (!op_disp && i.types[op].bitfield.baseindex)
5711 {
5712 i.types[op].bitfield.disp8 = 0;
5713 i.types[op].bitfield.disp16 = 0;
5714 i.types[op].bitfield.disp32 = 0;
5715 i.types[op].bitfield.disp32s = 0;
5716 i.types[op].bitfield.disp64 = 0;
5717 i.op[op].disps = 0;
5718 i.disp_operands--;
5719 }
5720 else if (flag_code == CODE_64BIT)
5721 {
5722 if (fits_in_signed_long (op_disp))
5723 {
5724 i.types[op].bitfield.disp64 = 0;
5725 i.types[op].bitfield.disp32s = 1;
5726 }
5727 if (i.prefix[ADDR_PREFIX]
5728 && fits_in_unsigned_long (op_disp))
5729 i.types[op].bitfield.disp32 = 1;
5730 }
5731 if ((i.types[op].bitfield.disp32
5732 || i.types[op].bitfield.disp32s
5733 || i.types[op].bitfield.disp16)
5734 && fits_in_disp8 (op_disp))
5735 i.types[op].bitfield.disp8 = 1;
5736 }
5737 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5738 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5739 {
5740 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5741 i.op[op].disps, 0, i.reloc[op]);
5742 i.types[op].bitfield.disp8 = 0;
5743 i.types[op].bitfield.disp16 = 0;
5744 i.types[op].bitfield.disp32 = 0;
5745 i.types[op].bitfield.disp32s = 0;
5746 i.types[op].bitfield.disp64 = 0;
5747 }
5748 else
5749 /* We only support 64bit displacements on constants. */
5750 i.types[op].bitfield.disp64 = 0;
5751 }
5752 }
5753
5754 /* Return 1 if there is a match in broadcast bytes between operand
5755 GIVEN and instruction template T. */
5756
5757 static INLINE int
5758 match_broadcast_size (const insn_template *t, unsigned int given)
5759 {
5760 return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5761 && i.types[given].bitfield.byte)
5762 || (t->opcode_modifier.broadcast == WORD_BROADCAST
5763 && i.types[given].bitfield.word)
5764 || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5765 && i.types[given].bitfield.dword)
5766 || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5767 && i.types[given].bitfield.qword));
5768 }
5769
5770 /* Check if operands are valid for the instruction. */
5771
5772 static int
5773 check_VecOperands (const insn_template *t)
5774 {
5775 unsigned int op;
5776 i386_cpu_flags cpu;
5777
5778 /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5779 any one operand implicitly require AVX512VL support if the actual
5780 operand size is YMMword or XMMword. Since this function runs after
5781 template matching, there's no need to check for YMMword/XMMword in
5782 the template. */
5783 cpu = cpu_flags_and (t->cpu_flags, avx512);
5784 if (!cpu_flags_all_zero (&cpu)
5785 && !t->cpu_flags.bitfield.cpuavx512vl
5786 && !cpu_arch_flags.bitfield.cpuavx512vl)
5787 {
5788 for (op = 0; op < t->operands; ++op)
5789 {
5790 if (t->operand_types[op].bitfield.zmmword
5791 && (i.types[op].bitfield.ymmword
5792 || i.types[op].bitfield.xmmword))
5793 {
5794 i.error = unsupported;
5795 return 1;
5796 }
5797 }
5798 }
5799
5800 /* Without VSIB byte, we can't have a vector register for index. */
5801 if (!t->opcode_modifier.sib
5802 && i.index_reg
5803 && (i.index_reg->reg_type.bitfield.xmmword
5804 || i.index_reg->reg_type.bitfield.ymmword
5805 || i.index_reg->reg_type.bitfield.zmmword))
5806 {
5807 i.error = unsupported_vector_index_register;
5808 return 1;
5809 }
5810
5811 /* Check if default mask is allowed. */
5812 if (t->opcode_modifier.nodefmask
5813 && (!i.mask || i.mask->mask->reg_num == 0))
5814 {
5815 i.error = no_default_mask;
5816 return 1;
5817 }
5818
5819 /* For VSIB byte, we need a vector register for index, and all vector
5820 registers must be distinct. */
5821 if (t->opcode_modifier.sib && t->opcode_modifier.sib != SIBMEM)
5822 {
5823 if (!i.index_reg
5824 || !((t->opcode_modifier.sib == VECSIB128
5825 && i.index_reg->reg_type.bitfield.xmmword)
5826 || (t->opcode_modifier.sib == VECSIB256
5827 && i.index_reg->reg_type.bitfield.ymmword)
5828 || (t->opcode_modifier.sib == VECSIB512
5829 && i.index_reg->reg_type.bitfield.zmmword)))
5830 {
5831 i.error = invalid_vsib_address;
5832 return 1;
5833 }
5834
5835 gas_assert (i.reg_operands == 2 || i.mask);
5836 if (i.reg_operands == 2 && !i.mask)
5837 {
5838 gas_assert (i.types[0].bitfield.class == RegSIMD);
5839 gas_assert (i.types[0].bitfield.xmmword
5840 || i.types[0].bitfield.ymmword);
5841 gas_assert (i.types[2].bitfield.class == RegSIMD);
5842 gas_assert (i.types[2].bitfield.xmmword
5843 || i.types[2].bitfield.ymmword);
5844 if (operand_check == check_none)
5845 return 0;
5846 if (register_number (i.op[0].regs)
5847 != register_number (i.index_reg)
5848 && register_number (i.op[2].regs)
5849 != register_number (i.index_reg)
5850 && register_number (i.op[0].regs)
5851 != register_number (i.op[2].regs))
5852 return 0;
5853 if (operand_check == check_error)
5854 {
5855 i.error = invalid_vector_register_set;
5856 return 1;
5857 }
5858 as_warn (_("mask, index, and destination registers should be distinct"));
5859 }
5860 else if (i.reg_operands == 1 && i.mask)
5861 {
5862 if (i.types[1].bitfield.class == RegSIMD
5863 && (i.types[1].bitfield.xmmword
5864 || i.types[1].bitfield.ymmword
5865 || i.types[1].bitfield.zmmword)
5866 && (register_number (i.op[1].regs)
5867 == register_number (i.index_reg)))
5868 {
5869 if (operand_check == check_error)
5870 {
5871 i.error = invalid_vector_register_set;
5872 return 1;
5873 }
5874 if (operand_check != check_none)
5875 as_warn (_("index and destination registers should be distinct"));
5876 }
5877 }
5878 }
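/* A concrete (illustrative) case of the distinctness checks above:
   for a VEX-encoded gather such as

     vgatherdps %xmm1, (%eax,%xmm2,4), %xmm3

   the mask (%xmm1), index (%xmm2) and destination (%xmm3) registers
   must all differ, since the CPU raises #UD when any pair of them
   overlaps.  */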
5879
5880 /* For AMX instructions with three tmmword operands, all tmmword
5881 operands must be distinct.  */
5882 if (t->operand_types[0].bitfield.tmmword
5883 && i.reg_operands == 3)
5884 {
5885 if (register_number (i.op[0].regs)
5886 == register_number (i.op[1].regs)
5887 || register_number (i.op[0].regs)
5888 == register_number (i.op[2].regs)
5889 || register_number (i.op[1].regs)
5890 == register_number (i.op[2].regs))
5891 {
5892 i.error = invalid_tmm_register_set;
5893 return 1;
5894 }
5895 }
5896
5897 /* Check if broadcast is supported by the instruction and is applied
5898 to the memory operand. */
5899 if (i.broadcast)
5900 {
5901 i386_operand_type type, overlap;
5902
5903 /* Check if specified broadcast is supported in this instruction,
5904 and its broadcast bytes match the memory operand. */
5905 op = i.broadcast->operand;
5906 if (!t->opcode_modifier.broadcast
5907 || !(i.flags[op] & Operand_Mem)
5908 || (!i.types[op].bitfield.unspecified
5909 && !match_broadcast_size (t, op)))
5910 {
5911 bad_broadcast:
5912 i.error = unsupported_broadcast;
5913 return 1;
5914 }
5915
5916 i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5917 * i.broadcast->type);
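/* E.g. (illustrative): for a "{1to8}" broadcast of a dword element,
   t->opcode_modifier.broadcast is DWORD_BROADCAST (3) and
   i.broadcast->type is 8, giving (1 << 2) * 8 = 32 bytes, i.e. a
   YMMword's worth of data, matched by the switch below.  */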
5918 operand_type_set (&type, 0);
5919 switch (i.broadcast->bytes)
5920 {
5921 case 2:
5922 type.bitfield.word = 1;
5923 break;
5924 case 4:
5925 type.bitfield.dword = 1;
5926 break;
5927 case 8:
5928 type.bitfield.qword = 1;
5929 break;
5930 case 16:
5931 type.bitfield.xmmword = 1;
5932 break;
5933 case 32:
5934 type.bitfield.ymmword = 1;
5935 break;
5936 case 64:
5937 type.bitfield.zmmword = 1;
5938 break;
5939 default:
5940 goto bad_broadcast;
5941 }
5942
5943 overlap = operand_type_and (type, t->operand_types[op]);
5944 if (t->operand_types[op].bitfield.class == RegSIMD
5945 && t->operand_types[op].bitfield.byte
5946 + t->operand_types[op].bitfield.word
5947 + t->operand_types[op].bitfield.dword
5948 + t->operand_types[op].bitfield.qword > 1)
5949 {
5950 overlap.bitfield.xmmword = 0;
5951 overlap.bitfield.ymmword = 0;
5952 overlap.bitfield.zmmword = 0;
5953 }
5954 if (operand_type_all_zero (&overlap))
5955 goto bad_broadcast;
5956
5957 if (t->opcode_modifier.checkregsize)
5958 {
5959 unsigned int j;
5960
5961 type.bitfield.baseindex = 1;
5962 for (j = 0; j < i.operands; ++j)
5963 {
5964 if (j != op
5965 && !operand_type_register_match (i.types[j],
5966 t->operand_types[j],
5967 type,
5968 t->operand_types[op]))
5969 goto bad_broadcast;
5970 }
5971 }
5972 }
5973 /* If broadcast is supported in this instruction, we need to check
5974 that an operand of one-element size isn't specified without broadcast.  */
5975 else if (t->opcode_modifier.broadcast && i.mem_operands)
5976 {
5977 /* Find memory operand. */
5978 for (op = 0; op < i.operands; op++)
5979 if (i.flags[op] & Operand_Mem)
5980 break;
5981 gas_assert (op < i.operands);
5982 /* Check size of the memory operand. */
5983 if (match_broadcast_size (t, op))
5984 {
5985 i.error = broadcast_needed;
5986 return 1;
5987 }
5988 }
5989 else
5990 op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning. */
5991
5992 /* Check if requested masking is supported. */
5993 if (i.mask)
5994 {
5995 switch (t->opcode_modifier.masking)
5996 {
5997 case BOTH_MASKING:
5998 break;
5999 case MERGING_MASKING:
6000 if (i.mask->zeroing)
6001 {
6002 case 0:
6003 i.error = unsupported_masking;
6004 return 1;
6005 }
6006 break;
6007 case DYNAMIC_MASKING:
6008 /* Memory destinations allow only merging masking. */
6009 if (i.mask->zeroing && i.mem_operands)
6010 {
6011 /* Find memory operand. */
6012 for (op = 0; op < i.operands; op++)
6013 if (i.flags[op] & Operand_Mem)
6014 break;
6015 gas_assert (op < i.operands);
6016 if (op == i.operands - 1)
6017 {
6018 i.error = unsupported_masking;
6019 return 1;
6020 }
6021 }
6022 break;
6023 default:
6024 abort ();
6025 }
6026 }
6027
6028 /* Check if masking is applied to dest operand. */
6029 if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
6030 {
6031 i.error = mask_not_on_destination;
6032 return 1;
6033 }
6034
6035 /* Check RC/SAE. */
6036 if (i.rounding)
6037 {
6038 if (!t->opcode_modifier.sae
6039 || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
6040 {
6041 i.error = unsupported_rc_sae;
6042 return 1;
6043 }
6044 /* If the instruction has several immediate operands and one of
6045 them is rounding, the rounding operand should be the last
6046 immediate operand. */
6047 if (i.imm_operands > 1
6048 && i.rounding->operand != (int) (i.imm_operands - 1))
6049 {
6050 i.error = rc_sae_operand_not_last_imm;
6051 return 1;
6052 }
6053 }
6054
6055 /* Check the special Imm4 cases; must be the first operand. */
6056 if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
6057 {
6058 if (i.op[0].imms->X_op != O_constant
6059 || !fits_in_imm4 (i.op[0].imms->X_add_number))
6060 {
6061 i.error = bad_imm4;
6062 return 1;
6063 }
6064
6065 /* Turn off Imm<N> so that update_imm won't complain. */
6066 operand_type_set (&i.types[0], 0);
6067 }
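/* E.g. (illustrative): for the 5-operand XOP insn

     vpermil2ps $1, %xmm4, %xmm3, %xmm2, %xmm1

   the selector $1 shares an imm8 with a register number placed in
   bits 7:4 (see build_modrm_byte), so it must fit in 4 bits.  */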
6068
6069 /* Check vector Disp8 operand. */
6070 if (t->opcode_modifier.disp8memshift
6071 && i.disp_encoding != disp_encoding_32bit)
6072 {
6073 if (i.broadcast)
6074 i.memshift = t->opcode_modifier.broadcast - 1;
6075 else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
6076 i.memshift = t->opcode_modifier.disp8memshift;
6077 else
6078 {
6079 const i386_operand_type *type = NULL;
6080
6081 i.memshift = 0;
6082 for (op = 0; op < i.operands; op++)
6083 if (i.flags[op] & Operand_Mem)
6084 {
6085 if (t->opcode_modifier.evex == EVEXLIG)
6086 i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
6087 else if (t->operand_types[op].bitfield.xmmword
6088 + t->operand_types[op].bitfield.ymmword
6089 + t->operand_types[op].bitfield.zmmword <= 1)
6090 type = &t->operand_types[op];
6091 else if (!i.types[op].bitfield.unspecified)
6092 type = &i.types[op];
6093 }
6094 else if (i.types[op].bitfield.class == RegSIMD
6095 && t->opcode_modifier.evex != EVEXLIG)
6096 {
6097 if (i.types[op].bitfield.zmmword)
6098 i.memshift = 6;
6099 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
6100 i.memshift = 5;
6101 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
6102 i.memshift = 4;
6103 }
6104
6105 if (type)
6106 {
6107 if (type->bitfield.zmmword)
6108 i.memshift = 6;
6109 else if (type->bitfield.ymmword)
6110 i.memshift = 5;
6111 else if (type->bitfield.xmmword)
6112 i.memshift = 4;
6113 }
6114
6115 /* For the check in fits_in_disp8(). */
6116 if (i.memshift == 0)
6117 i.memshift = -1;
6118 }
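/* N = 1 << i.memshift is the EVEX Disp8*N scaling factor computed
   above.  A displacement qualifies for the compressed disp8 form only
   if it is a multiple of N and the quotient fits in a signed byte;
   e.g. (illustrative) with a full ZMMword memory operand, i.memshift
   is 6, so a displacement of 128 == 2 * 64 is emitted as the disp8
   value 2, while 68 (not a multiple of 64) cannot use disp8 at all.
   fits_in_disp8() applies exactly this test in the loop below.  */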
6119
6120 for (op = 0; op < i.operands; op++)
6121 if (operand_type_check (i.types[op], disp)
6122 && i.op[op].disps->X_op == O_constant)
6123 {
6124 if (fits_in_disp8 (i.op[op].disps->X_add_number))
6125 {
6126 i.types[op].bitfield.disp8 = 1;
6127 return 0;
6128 }
6129 i.types[op].bitfield.disp8 = 0;
6130 }
6131 }
6132
6133 i.memshift = 0;
6134
6135 return 0;
6136 }
6137
6138 /* Check if encoding requirements are met by the instruction. */
6139
6140 static int
6141 VEX_check_encoding (const insn_template *t)
6142 {
6143 if (i.vec_encoding == vex_encoding_error)
6144 {
6145 i.error = unsupported;
6146 return 1;
6147 }
6148
6149 if (i.vec_encoding == vex_encoding_evex)
6150 {
6151 /* This instruction must be encoded with EVEX prefix. */
6152 if (!is_evex_encoding (t))
6153 {
6154 i.error = unsupported;
6155 return 1;
6156 }
6157 return 0;
6158 }
6159
6160 if (!t->opcode_modifier.vex)
6161 {
6162 /* This instruction template doesn't have VEX prefix. */
6163 if (i.vec_encoding != vex_encoding_default)
6164 {
6165 i.error = unsupported;
6166 return 1;
6167 }
6168 return 0;
6169 }
6170
6171 return 0;
6172 }
6173
6174 static const insn_template *
6175 match_template (char mnem_suffix)
6176 {
6177 /* Points to template once we've found it. */
6178 const insn_template *t;
6179 i386_operand_type overlap0, overlap1, overlap2, overlap3;
6180 i386_operand_type overlap4;
6181 unsigned int found_reverse_match;
6182 i386_opcode_modifier suffix_check;
6183 i386_operand_type operand_types [MAX_OPERANDS];
6184 int addr_prefix_disp;
6185 unsigned int j, size_match, check_register;
6186 enum i386_error specific_error = 0;
6187
6188 #if MAX_OPERANDS != 5
6189 # error "MAX_OPERANDS must be 5."
6190 #endif
6191
6192 found_reverse_match = 0;
6193 addr_prefix_disp = -1;
6194
6195 /* Prepare for mnemonic suffix check. */
6196 memset (&suffix_check, 0, sizeof (suffix_check));
6197 switch (mnem_suffix)
6198 {
6199 case BYTE_MNEM_SUFFIX:
6200 suffix_check.no_bsuf = 1;
6201 break;
6202 case WORD_MNEM_SUFFIX:
6203 suffix_check.no_wsuf = 1;
6204 break;
6205 case SHORT_MNEM_SUFFIX:
6206 suffix_check.no_ssuf = 1;
6207 break;
6208 case LONG_MNEM_SUFFIX:
6209 suffix_check.no_lsuf = 1;
6210 break;
6211 case QWORD_MNEM_SUFFIX:
6212 suffix_check.no_qsuf = 1;
6213 break;
6214 default:
6215 /* NB: In Intel syntax, normally we can check for memory operand
6216 size when there is no mnemonic suffix. But jmp and call have
6217 2 different encodings with Dword memory operand size, one with
6218 No_ldSuf and the other without. i.suffix is set to
6219 LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf. */
6220 if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
6221 suffix_check.no_ldsuf = 1;
6222 }
6223
6224 /* Must have right number of operands. */
6225 i.error = number_of_operands_mismatch;
6226
6227 for (t = current_templates->start; t < current_templates->end; t++)
6228 {
6229 addr_prefix_disp = -1;
6230 found_reverse_match = 0;
6231
6232 if (i.operands != t->operands)
6233 continue;
6234
6235 /* Check processor support. */
6236 i.error = unsupported;
6237 if (cpu_flags_match (t) != CPU_FLAGS_PERFECT_MATCH)
6238 continue;
6239
6240 /* Check AT&T mnemonic. */
6241 i.error = unsupported_with_intel_mnemonic;
6242 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
6243 continue;
6244
6245 /* Check AT&T/Intel syntax. */
6246 i.error = unsupported_syntax;
6247 if ((intel_syntax && t->opcode_modifier.attsyntax)
6248 || (!intel_syntax && t->opcode_modifier.intelsyntax))
6249 continue;
6250
6251 /* Check Intel64/AMD64 ISA. */
6252 switch (isa64)
6253 {
6254 default:
6255 /* Default: Don't accept Intel64. */
6256 if (t->opcode_modifier.isa64 == INTEL64)
6257 continue;
6258 break;
6259 case amd64:
6260 /* -mamd64: Don't accept Intel64 and Intel64 only. */
6261 if (t->opcode_modifier.isa64 >= INTEL64)
6262 continue;
6263 break;
6264 case intel64:
6265 /* -mintel64: Don't accept AMD64. */
6266 if (t->opcode_modifier.isa64 == AMD64 && flag_code == CODE_64BIT)
6267 continue;
6268 break;
6269 }
6270
6271 /* Check the suffix. */
6272 i.error = invalid_instruction_suffix;
6273 if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
6274 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
6275 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
6276 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
6277 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
6278 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
6279 continue;
6280
6281 size_match = operand_size_match (t);
6282 if (!size_match)
6283 continue;
6284
6285 /* This is intentionally not
6286
6287 if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
6288
6289 as the case of a missing * on the operand is accepted (perhaps with
6290 a warning, issued further down). */
6291 if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
6292 {
6293 i.error = operand_type_mismatch;
6294 continue;
6295 }
6296
6297 for (j = 0; j < MAX_OPERANDS; j++)
6298 operand_types[j] = t->operand_types[j];
6299
6300 /* In general, don't allow
6301 - 64-bit operands outside of 64-bit mode,
6302 - 32-bit operands on pre-386. */
6303 j = i.imm_operands + (t->operands > i.imm_operands + 1);
6304 if (((i.suffix == QWORD_MNEM_SUFFIX
6305 && flag_code != CODE_64BIT
6306 && (t->base_opcode != 0x0fc7
6307 || t->extension_opcode != 1 /* cmpxchg8b */))
6308 || (i.suffix == LONG_MNEM_SUFFIX
6309 && !cpu_arch_flags.bitfield.cpui386))
6310 && (intel_syntax
6311 ? (t->opcode_modifier.mnemonicsize != IGNORESIZE
6312 && !intel_float_operand (t->name))
6313 : intel_float_operand (t->name) != 2)
6314 && (t->operands == i.imm_operands
6315 || (operand_types[i.imm_operands].bitfield.class != RegMMX
6316 && operand_types[i.imm_operands].bitfield.class != RegSIMD
6317 && operand_types[i.imm_operands].bitfield.class != RegMask)
6318 || (operand_types[j].bitfield.class != RegMMX
6319 && operand_types[j].bitfield.class != RegSIMD
6320 && operand_types[j].bitfield.class != RegMask))
6321 && !t->opcode_modifier.sib)
6322 continue;
6323
6324 /* Do not verify operands when there are none. */
6325 if (!t->operands)
6326 {
6327 if (VEX_check_encoding (t))
6328 {
6329 specific_error = i.error;
6330 continue;
6331 }
6332
6333 /* We've found a match; break out of loop. */
6334 break;
6335 }
6336
6337 if (!t->opcode_modifier.jump
6338 || t->opcode_modifier.jump == JUMP_ABSOLUTE)
6339 {
6340 /* There should be only one Disp operand. */
6341 for (j = 0; j < MAX_OPERANDS; j++)
6342 if (operand_type_check (operand_types[j], disp))
6343 break;
6344 if (j < MAX_OPERANDS)
6345 {
6346 bfd_boolean override = (i.prefix[ADDR_PREFIX] != 0);
6347
6348 addr_prefix_disp = j;
6349
6350 /* Address size prefix will turn Disp64/Disp32S/Disp32/Disp16
6351 operand into Disp32/Disp32/Disp16/Disp32 operand. */
6352 switch (flag_code)
6353 {
6354 case CODE_16BIT:
6355 override = !override;
6356 /* Fall through. */
6357 case CODE_32BIT:
6358 if (operand_types[j].bitfield.disp32
6359 && operand_types[j].bitfield.disp16)
6360 {
6361 operand_types[j].bitfield.disp16 = override;
6362 operand_types[j].bitfield.disp32 = !override;
6363 }
6364 operand_types[j].bitfield.disp32s = 0;
6365 operand_types[j].bitfield.disp64 = 0;
6366 break;
6367
6368 case CODE_64BIT:
6369 if (operand_types[j].bitfield.disp32s
6370 || operand_types[j].bitfield.disp64)
6371 {
6372 operand_types[j].bitfield.disp64 &= !override;
6373 operand_types[j].bitfield.disp32s &= !override;
6374 operand_types[j].bitfield.disp32 = override;
6375 }
6376 operand_types[j].bitfield.disp16 = 0;
6377 break;
6378 }
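/* E.g. (illustrative): in .code16, "movw foo(%eax), %ax" carries a
   0x67 address size prefix, so OVERRIDE is flipped and the template's
   Disp16 operand is matched as Disp32 instead.  */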
6379 }
6380 }
6381
6382 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
6383 if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
6384 continue;
6385
6386 /* We check register size if needed. */
6387 if (t->opcode_modifier.checkregsize)
6388 {
6389 check_register = (1 << t->operands) - 1;
6390 if (i.broadcast)
6391 check_register &= ~(1 << i.broadcast->operand);
6392 }
6393 else
6394 check_register = 0;
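/* CHECK_REGISTER is a bitmask with bit N set when the register size
   of operand N still needs verifying.  E.g. (illustrative), a
   3-operand template starts out as 0b111; if operand 1 carries the
   broadcast, bit 1 is cleared since that operand's size comes from
   the broadcast specifier rather than from a register.  */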
6395
6396 overlap0 = operand_type_and (i.types[0], operand_types[0]);
6397 switch (t->operands)
6398 {
6399 case 1:
6400 if (!operand_type_match (overlap0, i.types[0]))
6401 continue;
6402 break;
6403 case 2:
6404 /* xchg %eax, %eax is a special case. It is an alias for nop
6405 only in 32bit mode and we can use opcode 0x90. In 64bit
6406 mode, we can't use 0x90 for xchg %eax, %eax since it should
6407 zero-extend %eax to %rax. */
6408 if (flag_code == CODE_64BIT
6409 && t->base_opcode == 0x90
6410 && i.types[0].bitfield.instance == Accum
6411 && i.types[0].bitfield.dword
6412 && i.types[1].bitfield.instance == Accum
6413 && i.types[1].bitfield.dword)
6414 continue;
6415 /* xrelease mov %eax, <disp> is another special case. It must not
6416 match the accumulator-only encoding of mov. */
6417 if (flag_code != CODE_64BIT
6418 && i.hle_prefix
6419 && t->base_opcode == 0xa0
6420 && i.types[0].bitfield.instance == Accum
6421 && (i.flags[1] & Operand_Mem))
6422 continue;
6423 /* Fall through. */
6424
6425 case 3:
6426 if (!(size_match & MATCH_STRAIGHT))
6427 goto check_reverse;
6428 /* Reverse direction of operands if swapping is possible in the first
6429 place (operands need to be symmetric) and
6430 - the load form is requested, and the template is a store form,
6431 - the store form is requested, and the template is a load form,
6432 - the non-default (swapped) form is requested. */
6433 overlap1 = operand_type_and (operand_types[0], operand_types[1]);
6434 if (t->opcode_modifier.d && i.reg_operands == i.operands
6435 && !operand_type_all_zero (&overlap1))
6436 switch (i.dir_encoding)
6437 {
6438 case dir_encoding_load:
6439 if (operand_type_check (operand_types[i.operands - 1], anymem)
6440 || t->opcode_modifier.regmem)
6441 goto check_reverse;
6442 break;
6443
6444 case dir_encoding_store:
6445 if (!operand_type_check (operand_types[i.operands - 1], anymem)
6446 && !t->opcode_modifier.regmem)
6447 goto check_reverse;
6448 break;
6449
6450 case dir_encoding_swap:
6451 goto check_reverse;
6452
6453 case dir_encoding_default:
6454 break;
6455 }
6456 /* If we want store form, we skip the current load. */
6457 if ((i.dir_encoding == dir_encoding_store
6458 || i.dir_encoding == dir_encoding_swap)
6459 && i.mem_operands == 0
6460 && t->opcode_modifier.load)
6461 continue;
6462 /* Fall through. */
6463 case 4:
6464 case 5:
6465 overlap1 = operand_type_and (i.types[1], operand_types[1]);
6466 if (!operand_type_match (overlap0, i.types[0])
6467 || !operand_type_match (overlap1, i.types[1])
6468 || ((check_register & 3) == 3
6469 && !operand_type_register_match (i.types[0],
6470 operand_types[0],
6471 i.types[1],
6472 operand_types[1])))
6473 {
6474 /* Check if other direction is valid ... */
6475 if (!t->opcode_modifier.d)
6476 continue;
6477
6478 check_reverse:
6479 if (!(size_match & MATCH_REVERSE))
6480 continue;
6481 /* Try reversing direction of operands. */
6482 overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
6483 overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
6484 if (!operand_type_match (overlap0, i.types[0])
6485 || !operand_type_match (overlap1, i.types[i.operands - 1])
6486 || (check_register
6487 && !operand_type_register_match (i.types[0],
6488 operand_types[i.operands - 1],
6489 i.types[i.operands - 1],
6490 operand_types[0])))
6491 {
6492 /* Does not match either direction. */
6493 continue;
6494 }
6495 /* found_reverse_match holds which of D or FloatR
6496 we've found. */
6497 if (!t->opcode_modifier.d)
6498 found_reverse_match = 0;
6499 else if (operand_types[0].bitfield.tbyte)
6500 found_reverse_match = Opcode_FloatD;
6501 else if (operand_types[0].bitfield.xmmword
6502 || operand_types[i.operands - 1].bitfield.xmmword
6503 || operand_types[0].bitfield.class == RegMMX
6504 || operand_types[i.operands - 1].bitfield.class == RegMMX
6505 || is_any_vex_encoding (t))
6506 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
6507 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
6508 else
6509 found_reverse_match = Opcode_D;
6510 if (t->opcode_modifier.floatr)
6511 found_reverse_match |= Opcode_FloatR;
6512 }
6513 else
6514 {
6515 /* Found a forward 2 operand match here. */
6516 switch (t->operands)
6517 {
6518 case 5:
6519 overlap4 = operand_type_and (i.types[4],
6520 operand_types[4]);
6521 /* Fall through. */
6522 case 4:
6523 overlap3 = operand_type_and (i.types[3],
6524 operand_types[3]);
6525 /* Fall through. */
6526 case 3:
6527 overlap2 = operand_type_and (i.types[2],
6528 operand_types[2]);
6529 break;
6530 }
6531
6532 switch (t->operands)
6533 {
6534 case 5:
6535 if (!operand_type_match (overlap4, i.types[4])
6536 || !operand_type_register_match (i.types[3],
6537 operand_types[3],
6538 i.types[4],
6539 operand_types[4]))
6540 continue;
6541 /* Fall through. */
6542 case 4:
6543 if (!operand_type_match (overlap3, i.types[3])
6544 || ((check_register & 0xa) == 0xa
6545 && !operand_type_register_match (i.types[1],
6546 operand_types[1],
6547 i.types[3],
6548 operand_types[3]))
6549 || ((check_register & 0xc) == 0xc
6550 && !operand_type_register_match (i.types[2],
6551 operand_types[2],
6552 i.types[3],
6553 operand_types[3])))
6554 continue;
6555 /* Fall through. */
6556 case 3:
6557 /* Here we make use of the fact that there are no
6558 reverse-match 3-operand instructions. */
6559 if (!operand_type_match (overlap2, i.types[2])
6560 || ((check_register & 5) == 5
6561 && !operand_type_register_match (i.types[0],
6562 operand_types[0],
6563 i.types[2],
6564 operand_types[2]))
6565 || ((check_register & 6) == 6
6566 && !operand_type_register_match (i.types[1],
6567 operand_types[1],
6568 i.types[2],
6569 operand_types[2])))
6570 continue;
6571 break;
6572 }
6573 }
6574 /* Found either forward/reverse 2, 3 or 4 operand match here:
6575 slip through to break. */
6576 }
6577
6578 /* Check if vector operands are valid. */
6579 if (check_VecOperands (t))
6580 {
6581 specific_error = i.error;
6582 continue;
6583 }
6584
6585 /* Check if VEX/EVEX encoding requirements can be satisfied. */
6586 if (VEX_check_encoding (t))
6587 {
6588 specific_error = i.error;
6589 continue;
6590 }
6591
6592 /* We've found a match; break out of loop. */
6593 break;
6594 }
6595
6596 if (t == current_templates->end)
6597 {
6598 /* We found no match. */
6599 const char *err_msg;
6600 switch (specific_error ? specific_error : i.error)
6601 {
6602 default:
6603 abort ();
6604 case operand_size_mismatch:
6605 err_msg = _("operand size mismatch");
6606 break;
6607 case operand_type_mismatch:
6608 err_msg = _("operand type mismatch");
6609 break;
6610 case register_type_mismatch:
6611 err_msg = _("register type mismatch");
6612 break;
6613 case number_of_operands_mismatch:
6614 err_msg = _("number of operands mismatch");
6615 break;
6616 case invalid_instruction_suffix:
6617 err_msg = _("invalid instruction suffix");
6618 break;
6619 case bad_imm4:
6620 err_msg = _("constant doesn't fit in 4 bits");
6621 break;
6622 case unsupported_with_intel_mnemonic:
6623 err_msg = _("unsupported with Intel mnemonic");
6624 break;
6625 case unsupported_syntax:
6626 err_msg = _("unsupported syntax");
6627 break;
6628 case unsupported:
6629 as_bad (_("unsupported instruction `%s'"),
6630 current_templates->start->name);
6631 return NULL;
6632 case invalid_sib_address:
6633 err_msg = _("invalid SIB address");
6634 break;
6635 case invalid_vsib_address:
6636 err_msg = _("invalid VSIB address");
6637 break;
6638 case invalid_vector_register_set:
6639 err_msg = _("mask, index, and destination registers must be distinct");
6640 break;
6641 case invalid_tmm_register_set:
6642 err_msg = _("all tmm registers must be distinct");
6643 break;
6644 case unsupported_vector_index_register:
6645 err_msg = _("unsupported vector index register");
6646 break;
6647 case unsupported_broadcast:
6648 err_msg = _("unsupported broadcast");
6649 break;
6650 case broadcast_needed:
6651 err_msg = _("broadcast is needed for operand of such type");
6652 break;
6653 case unsupported_masking:
6654 err_msg = _("unsupported masking");
6655 break;
6656 case mask_not_on_destination:
6657 err_msg = _("mask not on destination operand");
6658 break;
6659 case no_default_mask:
6660 err_msg = _("default mask isn't allowed");
6661 break;
6662 case unsupported_rc_sae:
6663 err_msg = _("unsupported static rounding/sae");
6664 break;
6665 case rc_sae_operand_not_last_imm:
6666 if (intel_syntax)
6667 err_msg = _("RC/SAE operand must precede immediate operands");
6668 else
6669 err_msg = _("RC/SAE operand must follow immediate operands");
6670 break;
6671 case invalid_register_operand:
6672 err_msg = _("invalid register operand");
6673 break;
6674 }
6675 as_bad (_("%s for `%s'"), err_msg,
6676 current_templates->start->name);
6677 return NULL;
6678 }
6679
6680 if (!quiet_warnings)
6681 {
6682 if (!intel_syntax
6683 && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
6684 as_warn (_("indirect %s without `*'"), t->name);
6685
6686 if (t->opcode_modifier.isprefix
6687 && t->opcode_modifier.mnemonicsize == IGNORESIZE)
6688 {
6689 /* Warn them that a data or address size prefix doesn't
6690 affect assembly of the next line of code. */
6691 as_warn (_("stand-alone `%s' prefix"), t->name);
6692 }
6693 }
6694
6695 /* Copy the template we found. */
6696 i.tm = *t;
6697
6698 if (addr_prefix_disp != -1)
6699 i.tm.operand_types[addr_prefix_disp]
6700 = operand_types[addr_prefix_disp];
6701
6702 if (found_reverse_match)
6703 {
6704 /* If we found a reverse match we must alter the opcode direction
6705 bit and clear/flip the regmem modifier one. found_reverse_match
6706 holds bits to change (different for int & float insns). */
6707
6708 i.tm.base_opcode ^= found_reverse_match;
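/* E.g. (illustrative): "mov %eax, %ebx" can be encoded as 0x89
   (reg -> r/m) or 0x8b (r/m -> reg).  The two opcodes differ in
   exactly the D bit (Opcode_D == 2), so the XOR above switches
   between the forward and reverse forms.  */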
6709
6710 i.tm.operand_types[0] = operand_types[i.operands - 1];
6711 i.tm.operand_types[i.operands - 1] = operand_types[0];
6712
6713 /* Certain SIMD insns have their load forms specified in the opcode
6714 table, and hence we need to _set_ RegMem instead of clearing it.
6715 We need to avoid setting the bit though on insns like KMOVW. */
6716 i.tm.opcode_modifier.regmem
6717 = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6718 && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6719 && !i.tm.opcode_modifier.regmem;
6720 }
6721
6722 return t;
6723 }
6724
6725 static int
6726 check_string (void)
6727 {
6728 unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
6729 unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
6730
6731 if (i.seg[op] != NULL && i.seg[op] != &es)
6732 {
6733 as_bad (_("`%s' operand %u must use `%ses' segment"),
6734 i.tm.name,
6735 intel_syntax ? i.tm.operands - es_op : es_op + 1,
6736 register_prefix);
6737 return 0;
6738 }
6739
6740 /* There's only ever one segment override allowed per instruction.
6741 This instruction possibly has a legal segment override on the
6742 second operand, so copy the segment to where non-string
6743 instructions store it, allowing common code. */
6744 i.seg[op] = i.seg[1];
6745
6746 return 1;
6747 }
6748
6749 static int
6750 process_suffix (void)
6751 {
6752 /* If matched instruction specifies an explicit instruction mnemonic
6753 suffix, use it. */
6754 if (i.tm.opcode_modifier.size == SIZE16)
6755 i.suffix = WORD_MNEM_SUFFIX;
6756 else if (i.tm.opcode_modifier.size == SIZE32)
6757 i.suffix = LONG_MNEM_SUFFIX;
6758 else if (i.tm.opcode_modifier.size == SIZE64)
6759 i.suffix = QWORD_MNEM_SUFFIX;
6760 else if (i.reg_operands
6761 && (i.operands > 1 || i.types[0].bitfield.class == Reg)
6762 && !i.tm.opcode_modifier.addrprefixopreg)
6763 {
6764 unsigned int numop = i.operands;
6765
6766 /* movsx/movzx want only their source operand considered here, for the
6767 ambiguity checking below. The suffix will be replaced afterwards
6768 to represent the destination (register). */
6769 if (((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w)
6770 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
6771 --i.operands;
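/* In the check just above, (base_opcode | 8) == 0xfbe matches exactly
   0x0fb6 (movzx) and 0x0fbe (movsx); the W modifier covers their
   word-source forms 0x0fb7/0x0fbf, and 0x63 with cpu64 is movsxd.  */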
6772
6773 /* crc32 needs REX.W set regardless of suffix / source operand size. */
6774 if (i.tm.base_opcode == 0xf20f38f0
6775 && i.tm.operand_types[1].bitfield.qword)
6776 i.rex |= REX_W;
6777
6778 /* If there's no instruction mnemonic suffix we try to invent one
6779 based on GPR operands. */
6780 if (!i.suffix)
6781 {
6782 /* We take i.suffix from the last register operand specified.
6783 Destination register type is more significant than source
6784 register type. crc32 in SSE4.2 prefers source register
6785 type. */
6786 unsigned int op = i.tm.base_opcode != 0xf20f38f0 ? i.operands : 1;
6787
6788 while (op--)
6789 if (i.tm.operand_types[op].bitfield.instance == InstanceNone
6790 || i.tm.operand_types[op].bitfield.instance == Accum)
6791 {
6792 if (i.types[op].bitfield.class != Reg)
6793 continue;
6794 if (i.types[op].bitfield.byte)
6795 i.suffix = BYTE_MNEM_SUFFIX;
6796 else if (i.types[op].bitfield.word)
6797 i.suffix = WORD_MNEM_SUFFIX;
6798 else if (i.types[op].bitfield.dword)
6799 i.suffix = LONG_MNEM_SUFFIX;
6800 else if (i.types[op].bitfield.qword)
6801 i.suffix = QWORD_MNEM_SUFFIX;
6802 else
6803 continue;
6804 break;
6805 }
6806
6807 /* As an exception, movsx/movzx silently default to a byte source
6808 in AT&T mode. */
6809 if ((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w
6810 && !i.suffix && !intel_syntax)
6811 i.suffix = BYTE_MNEM_SUFFIX;
6812 }
6813 else if (i.suffix == BYTE_MNEM_SUFFIX)
6814 {
6815 if (intel_syntax
6816 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6817 && i.tm.opcode_modifier.no_bsuf)
6818 i.suffix = 0;
6819 else if (!check_byte_reg ())
6820 return 0;
6821 }
6822 else if (i.suffix == LONG_MNEM_SUFFIX)
6823 {
6824 if (intel_syntax
6825 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6826 && i.tm.opcode_modifier.no_lsuf
6827 && !i.tm.opcode_modifier.todword
6828 && !i.tm.opcode_modifier.toqword)
6829 i.suffix = 0;
6830 else if (!check_long_reg ())
6831 return 0;
6832 }
6833 else if (i.suffix == QWORD_MNEM_SUFFIX)
6834 {
6835 if (intel_syntax
6836 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6837 && i.tm.opcode_modifier.no_qsuf
6838 && !i.tm.opcode_modifier.todword
6839 && !i.tm.opcode_modifier.toqword)
6840 i.suffix = 0;
6841 else if (!check_qword_reg ())
6842 return 0;
6843 }
6844 else if (i.suffix == WORD_MNEM_SUFFIX)
6845 {
6846 if (intel_syntax
6847 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6848 && i.tm.opcode_modifier.no_wsuf)
6849 i.suffix = 0;
6850 else if (!check_word_reg ())
6851 return 0;
6852 }
6853 else if (intel_syntax
6854 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE)
6855 /* Do nothing if the instruction is going to ignore the prefix. */
6856 ;
6857 else
6858 abort ();
6859
6860 /* Undo the movsx/movzx change done above. */
6861 i.operands = numop;
6862 }
6863 else if (i.tm.opcode_modifier.mnemonicsize == DEFAULTSIZE
6864 && !i.suffix)
6865 {
6866 i.suffix = stackop_size;
6867 if (stackop_size == LONG_MNEM_SUFFIX)
6868 {
6869 /* stackop_size is set to LONG_MNEM_SUFFIX for the
6870 .code16gcc directive to support 16-bit mode with
6871 32-bit address. For IRET without a suffix, generate
6872 16-bit IRET (opcode 0xcf) to return from an interrupt
6873 handler. */
6874 if (i.tm.base_opcode == 0xcf)
6875 {
6876 i.suffix = WORD_MNEM_SUFFIX;
6877 as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6878 }
6879 /* Warn about changed behavior for segment register push/pop. */
6880 else if ((i.tm.base_opcode | 1) == 0x07)
6881 as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
6882 i.tm.name);
6883 }
6884 }
6885 else if (!i.suffix
6886 && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
6887 || i.tm.opcode_modifier.jump == JUMP_BYTE
6888 || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
6889 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6890 && i.tm.extension_opcode <= 3)))
6891 {
6892 switch (flag_code)
6893 {
6894 case CODE_64BIT:
6895 if (!i.tm.opcode_modifier.no_qsuf)
6896 {
6897 if (i.tm.opcode_modifier.jump == JUMP_BYTE
6898 || i.tm.opcode_modifier.no_lsuf)
6899 i.suffix = QWORD_MNEM_SUFFIX;
6900 break;
6901 }
6902 /* Fall through. */
6903 case CODE_32BIT:
6904 if (!i.tm.opcode_modifier.no_lsuf)
6905 i.suffix = LONG_MNEM_SUFFIX;
6906 break;
6907 case CODE_16BIT:
6908 if (!i.tm.opcode_modifier.no_wsuf)
6909 i.suffix = WORD_MNEM_SUFFIX;
6910 break;
6911 }
6912 }
6913
6914 if (!i.suffix
6915 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
6916 /* Also cover lret/retf/iret in 64-bit mode. */
6917 || (flag_code == CODE_64BIT
6918 && !i.tm.opcode_modifier.no_lsuf
6919 && !i.tm.opcode_modifier.no_qsuf))
6920 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
6921 /* Explicit sizing prefixes are assumed to disambiguate insns. */
6922 && !i.prefix[DATA_PREFIX] && !(i.prefix[REX_PREFIX] & REX_W)
6923 /* Accept FLDENV et al without suffix. */
6924 && (i.tm.opcode_modifier.no_ssuf || i.tm.opcode_modifier.floatmf))
6925 {
6926 unsigned int suffixes, evex = 0;
6927
6928 suffixes = !i.tm.opcode_modifier.no_bsuf;
6929 if (!i.tm.opcode_modifier.no_wsuf)
6930 suffixes |= 1 << 1;
6931 if (!i.tm.opcode_modifier.no_lsuf)
6932 suffixes |= 1 << 2;
6933 if (!i.tm.opcode_modifier.no_ldsuf)
6934 suffixes |= 1 << 3;
6935 if (!i.tm.opcode_modifier.no_ssuf)
6936 suffixes |= 1 << 4;
6937 if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6938 suffixes |= 1 << 5;
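/* At this point SUFFIXES has bits 0..5 set for the permitted b, w,
   l, ld, s and q suffixes respectively; bits 6..8 may be added below
   for XMM/YMM/ZMM memory operand sizes.  "suffixes & (suffixes - 1)"
   further down is the usual trick to test whether more than one
   candidate operand size remains.  */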
6939
6940 /* For [XYZ]MMWORD operands inspect operand sizes. While generally
6941 also suitable for AT&T syntax mode, it was requested that this be
6942 restricted to just Intel syntax. */
6943 if (intel_syntax && is_any_vex_encoding (&i.tm) && !i.broadcast)
6944 {
6945 unsigned int op;
6946
6947 for (op = 0; op < i.tm.operands; ++op)
6948 {
6949 if (is_evex_encoding (&i.tm)
6950 && !cpu_arch_flags.bitfield.cpuavx512vl)
6951 {
6952 if (i.tm.operand_types[op].bitfield.ymmword)
6953 i.tm.operand_types[op].bitfield.xmmword = 0;
6954 if (i.tm.operand_types[op].bitfield.zmmword)
6955 i.tm.operand_types[op].bitfield.ymmword = 0;
6956 if (!i.tm.opcode_modifier.evex
6957 || i.tm.opcode_modifier.evex == EVEXDYN)
6958 i.tm.opcode_modifier.evex = EVEX512;
6959 }
6960
6961 if (i.tm.operand_types[op].bitfield.xmmword
6962 + i.tm.operand_types[op].bitfield.ymmword
6963 + i.tm.operand_types[op].bitfield.zmmword < 2)
6964 continue;
6965
6966 /* Any properly sized operand disambiguates the insn. */
6967 if (i.types[op].bitfield.xmmword
6968 || i.types[op].bitfield.ymmword
6969 || i.types[op].bitfield.zmmword)
6970 {
6971 suffixes &= ~(7 << 6);
6972 evex = 0;
6973 break;
6974 }
6975
6976 if ((i.flags[op] & Operand_Mem)
6977 && i.tm.operand_types[op].bitfield.unspecified)
6978 {
6979 if (i.tm.operand_types[op].bitfield.xmmword)
6980 suffixes |= 1 << 6;
6981 if (i.tm.operand_types[op].bitfield.ymmword)
6982 suffixes |= 1 << 7;
6983 if (i.tm.operand_types[op].bitfield.zmmword)
6984 suffixes |= 1 << 8;
6985 if (is_evex_encoding (&i.tm))
6986 evex = EVEX512;
6987 }
6988 }
6989 }
6990
6991 /* Are multiple suffixes / operand sizes allowed? */
6992 if (suffixes & (suffixes - 1))
6993 {
6994 if (intel_syntax
6995 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
6996 || operand_check == check_error))
6997 {
6998 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
6999 return 0;
7000 }
7001 if (operand_check == check_error)
7002 {
7003 as_bad (_("no instruction mnemonic suffix given and "
7004 "no register operands; can't size `%s'"), i.tm.name);
7005 return 0;
7006 }
7007 if (operand_check == check_warning)
7008 as_warn (_("%s; using default for `%s'"),
7009 intel_syntax
7010 ? _("ambiguous operand size")
7011 : _("no instruction mnemonic suffix given and "
7012 "no register operands"),
7013 i.tm.name);
7014
7015 if (i.tm.opcode_modifier.floatmf)
7016 i.suffix = SHORT_MNEM_SUFFIX;
7017 else if ((i.tm.base_opcode | 8) == 0xfbe
7018 || (i.tm.base_opcode == 0x63
7019 && i.tm.cpu_flags.bitfield.cpu64))
7020 /* handled below */;
7021 else if (evex)
7022 i.tm.opcode_modifier.evex = evex;
7023 else if (flag_code == CODE_16BIT)
7024 i.suffix = WORD_MNEM_SUFFIX;
7025 else if (!i.tm.opcode_modifier.no_lsuf)
7026 i.suffix = LONG_MNEM_SUFFIX;
7027 else
7028 i.suffix = QWORD_MNEM_SUFFIX;
7029 }
7030 }
7031
7032 if ((i.tm.base_opcode | 8) == 0xfbe
7033 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
7034 {
7035 /* In Intel syntax, movsx/movzx must have a "suffix" (checked above).
7036 In AT&T syntax, if there is no suffix (warned about above), the default
7037 will be byte extension. */
7038 if (i.tm.opcode_modifier.w && i.suffix && i.suffix != BYTE_MNEM_SUFFIX)
7039 i.tm.base_opcode |= 1;
7040
7041 /* For further processing, the suffix should represent the destination
7042 (register). This is already the case when one was used with
7043 mov[sz][bw]*, but we need to replace it for mov[sz]x, or if there was
7044 no suffix to begin with. */
7045 if (i.tm.opcode_modifier.w || i.tm.base_opcode == 0x63 || !i.suffix)
7046 {
7047 if (i.types[1].bitfield.word)
7048 i.suffix = WORD_MNEM_SUFFIX;
7049 else if (i.types[1].bitfield.qword)
7050 i.suffix = QWORD_MNEM_SUFFIX;
7051 else
7052 i.suffix = LONG_MNEM_SUFFIX;
7053
7054 i.tm.opcode_modifier.w = 0;
7055 }
7056 }
7057
7058 if (!i.tm.opcode_modifier.modrm && i.reg_operands && i.tm.operands < 3)
7059 i.short_form = (i.tm.operand_types[0].bitfield.class == Reg)
7060 != (i.tm.operand_types[1].bitfield.class == Reg);
7061
7062 /* Change the opcode based on the operand size given by i.suffix. */
7063 switch (i.suffix)
7064 {
7065 /* Size floating point instruction. */
7066 case LONG_MNEM_SUFFIX:
7067 if (i.tm.opcode_modifier.floatmf)
7068 {
7069 i.tm.base_opcode ^= 4;
7070 break;
7071 }
7072 /* fall through */
7073 case WORD_MNEM_SUFFIX:
7074 case QWORD_MNEM_SUFFIX:
7075 /* It's not a byte, select word/dword operation. */
7076 if (i.tm.opcode_modifier.w)
7077 {
7078 if (i.short_form)
7079 i.tm.base_opcode |= 8;
7080 else
7081 i.tm.base_opcode |= 1;
7082 }
7083 /* fall through */
7084 case SHORT_MNEM_SUFFIX:
7085 /* Now select between word & dword operations via the operand
7086 size prefix, except for instructions that will ignore this
7087 prefix anyway. */
7088 if (i.suffix != QWORD_MNEM_SUFFIX
7089 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
7090 && !i.tm.opcode_modifier.floatmf
7091 && !is_any_vex_encoding (&i.tm)
7092 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
7093 || (flag_code == CODE_64BIT
7094 && i.tm.opcode_modifier.jump == JUMP_BYTE)))
7095 {
7096 unsigned int prefix = DATA_PREFIX_OPCODE;
7097
7098 if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
7099 prefix = ADDR_PREFIX_OPCODE;
7100
7101 if (!add_prefix (prefix))
7102 return 0;
7103 }
7104
7105 /* Set mode64 for an operand. */
7106 if (i.suffix == QWORD_MNEM_SUFFIX
7107 && flag_code == CODE_64BIT
7108 && !i.tm.opcode_modifier.norex64
7109 && !i.tm.opcode_modifier.vexw
7110 /* Special case for xchg %rax,%rax. It is NOP and doesn't
7111 need rex64. */
7112 && ! (i.operands == 2
7113 && i.tm.base_opcode == 0x90
7114 && i.tm.extension_opcode == None
7115 && i.types[0].bitfield.instance == Accum
7116 && i.types[0].bitfield.qword
7117 && i.types[1].bitfield.instance == Accum
7118 && i.types[1].bitfield.qword))
7119 i.rex |= REX_W;
7120
7121 break;
7122
7123 case 0:
7124 /* Select word/dword/qword operation with explicit data sizing prefix
7125 when there are no suitable register operands. */
7126 if (i.tm.opcode_modifier.w
7127 && (i.prefix[DATA_PREFIX] || (i.prefix[REX_PREFIX] & REX_W))
7128 && (!i.reg_operands
7129 || (i.reg_operands == 1
7130 /* ShiftCount */
7131 && (i.tm.operand_types[0].bitfield.instance == RegC
7132 /* InOutPortReg */
7133 || i.tm.operand_types[0].bitfield.instance == RegD
7134 || i.tm.operand_types[1].bitfield.instance == RegD
7135 /* CRC32 */
7136 || i.tm.base_opcode == 0xf20f38f0))))
7137 i.tm.base_opcode |= 1;
7138 break;
7139 }
7140
7141 if (i.tm.opcode_modifier.addrprefixopreg)
7142 {
7143 gas_assert (!i.suffix);
7144 gas_assert (i.reg_operands);
7145
7146 if (i.tm.operand_types[0].bitfield.instance == Accum
7147 || i.operands == 1)
7148 {
7149 /* The address size override prefix changes the size of the
7150 first operand. */
7151 if (flag_code == CODE_64BIT
7152 && i.op[0].regs->reg_type.bitfield.word)
7153 {
7154 as_bad (_("16-bit addressing unavailable for `%s'"),
7155 i.tm.name);
7156 return 0;
7157 }
7158
7159 if ((flag_code == CODE_32BIT
7160 ? i.op[0].regs->reg_type.bitfield.word
7161 : i.op[0].regs->reg_type.bitfield.dword)
7162 && !add_prefix (ADDR_PREFIX_OPCODE))
7163 return 0;
7164 }
7165 else
7166 {
7167 /* Check invalid register operand when the address size override
7168 prefix changes the size of register operands. */
7169 unsigned int op;
7170 enum { need_word, need_dword, need_qword } need;
7171
7172 if (flag_code == CODE_32BIT)
7173 need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
7174 else if (i.prefix[ADDR_PREFIX])
7175 need = need_dword;
7176 else
7177 need = flag_code == CODE_64BIT ? need_qword : need_word;
7178
7179 for (op = 0; op < i.operands; op++)
7180 {
7181 if (i.types[op].bitfield.class != Reg)
7182 continue;
7183
7184 switch (need)
7185 {
7186 case need_word:
7187 if (i.op[op].regs->reg_type.bitfield.word)
7188 continue;
7189 break;
7190 case need_dword:
7191 if (i.op[op].regs->reg_type.bitfield.dword)
7192 continue;
7193 break;
7194 case need_qword:
7195 if (i.op[op].regs->reg_type.bitfield.qword)
7196 continue;
7197 break;
7198 }
7199
7200 as_bad (_("invalid register operand size for `%s'"),
7201 i.tm.name);
7202 return 0;
7203 }
7204 }
7205 }
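/* E.g. (illustrative): templates like clzero take their address from
   the accumulator, so in 64-bit code "clzero %eax" gets the 0x67
   prefix added above while a word register is rejected; otherwise
   every register operand must already match the addressing width
   implied by the prefixes.  */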
7206
7207 return 1;
7208 }
7209
7210 static int
7211 check_byte_reg (void)
7212 {
7213 int op;
7214
7215 for (op = i.operands; --op >= 0;)
7216 {
7217 /* Skip non-register operands. */
7218 if (i.types[op].bitfield.class != Reg)
7219 continue;
7220
7221 /* If this is an eight bit register, it's OK. If it's the 16 or
7222 32 bit version of an eight bit register, we will just use the
7223 low portion, and that's OK too. */
7224 if (i.types[op].bitfield.byte)
7225 continue;
7226
7227 /* I/O port address operands are OK too. */
7228 if (i.tm.operand_types[op].bitfield.instance == RegD
7229 && i.tm.operand_types[op].bitfield.word)
7230 continue;
7231
7232 /* crc32 only wants its source operand checked here. */
7233 if (i.tm.base_opcode == 0xf20f38f0 && op)
7234 continue;
7235
7236 /* Any other register is bad. */
7237 as_bad (_("`%s%s' not allowed with `%s%c'"),
7238 register_prefix, i.op[op].regs->reg_name,
7239 i.tm.name, i.suffix);
7240 return 0;
7241 }
7242 return 1;
7243 }
7244
7245 static int
7246 check_long_reg (void)
7247 {
7248 int op;
7249
7250 for (op = i.operands; --op >= 0;)
7251 /* Skip non-register operands. */
7252 if (i.types[op].bitfield.class != Reg)
7253 continue;
7254 /* Reject eight bit registers, except where the template requires
7255 them (e.g. movzb).  */
7256 else if (i.types[op].bitfield.byte
7257 && (i.tm.operand_types[op].bitfield.class == Reg
7258 || i.tm.operand_types[op].bitfield.instance == Accum)
7259 && (i.tm.operand_types[op].bitfield.word
7260 || i.tm.operand_types[op].bitfield.dword))
7261 {
7262 as_bad (_("`%s%s' not allowed with `%s%c'"),
7263 register_prefix,
7264 i.op[op].regs->reg_name,
7265 i.tm.name,
7266 i.suffix);
7267 return 0;
7268 }
7269 /* Error if the e prefix on a general reg is missing. */
7270 else if (i.types[op].bitfield.word
7271 && (i.tm.operand_types[op].bitfield.class == Reg
7272 || i.tm.operand_types[op].bitfield.instance == Accum)
7273 && i.tm.operand_types[op].bitfield.dword)
7274 {
7275 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7276 register_prefix, i.op[op].regs->reg_name,
7277 i.suffix);
7278 return 0;
7279 }
7280 /* Warn if the r prefix on a general reg is present. */
7281 else if (i.types[op].bitfield.qword
7282 && (i.tm.operand_types[op].bitfield.class == Reg
7283 || i.tm.operand_types[op].bitfield.instance == Accum)
7284 && i.tm.operand_types[op].bitfield.dword)
7285 {
7286 if (intel_syntax
7287 && i.tm.opcode_modifier.toqword
7288 && i.types[0].bitfield.class != RegSIMD)
7289 {
7290 /* Convert to QWORD. We want REX byte. */
7291 i.suffix = QWORD_MNEM_SUFFIX;
7292 }
7293 else
7294 {
7295 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7296 register_prefix, i.op[op].regs->reg_name,
7297 i.suffix);
7298 return 0;
7299 }
7300 }
7301 return 1;
7302 }
7303
7304 static int
7305 check_qword_reg (void)
7306 {
7307 int op;
7308
7309 for (op = i.operands; --op >= 0;)
7310 /* Skip non-register operands. */
7311 if (i.types[op].bitfield.class != Reg)
7312 continue;
7313 /* Reject eight bit registers, except where the template requires
7314 them (e.g. movzb).  */
7315 else if (i.types[op].bitfield.byte
7316 && (i.tm.operand_types[op].bitfield.class == Reg
7317 || i.tm.operand_types[op].bitfield.instance == Accum)
7318 && (i.tm.operand_types[op].bitfield.word
7319 || i.tm.operand_types[op].bitfield.dword))
7320 {
7321 as_bad (_("`%s%s' not allowed with `%s%c'"),
7322 register_prefix,
7323 i.op[op].regs->reg_name,
7324 i.tm.name,
7325 i.suffix);
7326 return 0;
7327 }
7328 /* Warn if the r prefix on a general reg is missing. */
7329 else if ((i.types[op].bitfield.word
7330 || i.types[op].bitfield.dword)
7331 && (i.tm.operand_types[op].bitfield.class == Reg
7332 || i.tm.operand_types[op].bitfield.instance == Accum)
7333 && i.tm.operand_types[op].bitfield.qword)
7334 {
7335 /* Prohibit these changes in the 64bit mode, since the
7336 lowering is more complicated. */
7337 if (intel_syntax
7338 && i.tm.opcode_modifier.todword
7339 && i.types[0].bitfield.class != RegSIMD)
7340 {
7341 /* Convert to DWORD. We don't want REX byte. */
7342 i.suffix = LONG_MNEM_SUFFIX;
7343 }
7344 else
7345 {
7346 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7347 register_prefix, i.op[op].regs->reg_name,
7348 i.suffix);
7349 return 0;
7350 }
7351 }
7352 return 1;
7353 }
7354
7355 static int
7356 check_word_reg (void)
7357 {
7358 int op;
7359 for (op = i.operands; --op >= 0;)
7360 /* Skip non-register operands. */
7361 if (i.types[op].bitfield.class != Reg)
7362 continue;
7363 /* Reject eight bit registers, except where the template requires
7364 them (e.g. movzb).  */
7365 else if (i.types[op].bitfield.byte
7366 && (i.tm.operand_types[op].bitfield.class == Reg
7367 || i.tm.operand_types[op].bitfield.instance == Accum)
7368 && (i.tm.operand_types[op].bitfield.word
7369 || i.tm.operand_types[op].bitfield.dword))
7370 {
7371 as_bad (_("`%s%s' not allowed with `%s%c'"),
7372 register_prefix,
7373 i.op[op].regs->reg_name,
7374 i.tm.name,
7375 i.suffix);
7376 return 0;
7377 }
7378 /* Error if the e or r prefix on a general reg is present. */
7379 else if ((i.types[op].bitfield.dword
7380 || i.types[op].bitfield.qword)
7381 && (i.tm.operand_types[op].bitfield.class == Reg
7382 || i.tm.operand_types[op].bitfield.instance == Accum)
7383 && i.tm.operand_types[op].bitfield.word)
7384 {
7385 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7386 register_prefix, i.op[op].regs->reg_name,
7387 i.suffix);
7388 return 0;
7389 }
7390 return 1;
7391 }
7392
7393 static int
7394 update_imm (unsigned int j)
7395 {
7396 i386_operand_type overlap = i.types[j];
7397 if ((overlap.bitfield.imm8
7398 || overlap.bitfield.imm8s
7399 || overlap.bitfield.imm16
7400 || overlap.bitfield.imm32
7401 || overlap.bitfield.imm32s
7402 || overlap.bitfield.imm64)
7403 && !operand_type_equal (&overlap, &imm8)
7404 && !operand_type_equal (&overlap, &imm8s)
7405 && !operand_type_equal (&overlap, &imm16)
7406 && !operand_type_equal (&overlap, &imm32)
7407 && !operand_type_equal (&overlap, &imm32s)
7408 && !operand_type_equal (&overlap, &imm64))
7409 {
7410 if (i.suffix)
7411 {
7412 i386_operand_type temp;
7413
7414 operand_type_set (&temp, 0);
7415 if (i.suffix == BYTE_MNEM_SUFFIX)
7416 {
7417 temp.bitfield.imm8 = overlap.bitfield.imm8;
7418 temp.bitfield.imm8s = overlap.bitfield.imm8s;
7419 }
7420 else if (i.suffix == WORD_MNEM_SUFFIX)
7421 temp.bitfield.imm16 = overlap.bitfield.imm16;
7422 else if (i.suffix == QWORD_MNEM_SUFFIX)
7423 {
7424 temp.bitfield.imm64 = overlap.bitfield.imm64;
7425 temp.bitfield.imm32s = overlap.bitfield.imm32s;
7426 }
7427 else
7428 temp.bitfield.imm32 = overlap.bitfield.imm32;
7429 overlap = temp;
7430 }
7431 else if (operand_type_equal (&overlap, &imm16_32_32s)
7432 || operand_type_equal (&overlap, &imm16_32)
7433 || operand_type_equal (&overlap, &imm16_32s))
7434 {
7435 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
7436 overlap = imm16;
7437 else
7438 overlap = imm32s;
7439 }
7440 else if (i.prefix[REX_PREFIX] & REX_W)
7441 overlap = operand_type_and (overlap, imm32s);
7442 else if (i.prefix[DATA_PREFIX])
7443 overlap = operand_type_and (overlap,
7444 flag_code != CODE_16BIT ? imm16 : imm32);
7445 if (!operand_type_equal (&overlap, &imm8)
7446 && !operand_type_equal (&overlap, &imm8s)
7447 && !operand_type_equal (&overlap, &imm16)
7448 && !operand_type_equal (&overlap, &imm32)
7449 && !operand_type_equal (&overlap, &imm32s)
7450 && !operand_type_equal (&overlap, &imm64))
7451 {
7452 as_bad (_("no instruction mnemonic suffix given; "
7453 "can't determine immediate size"));
7454 return 0;
7455 }
7456 }
7457 i.types[j] = overlap;
7458
7459 return 1;
7460 }
7461
7462 static int
7463 finalize_imm (void)
7464 {
7465 unsigned int j, n;
7466
7467 /* Update the first 2 immediate operands. */
7468 n = i.operands > 2 ? 2 : i.operands;
7469 if (n)
7470 {
7471 for (j = 0; j < n; j++)
7472 if (update_imm (j) == 0)
7473 return 0;
7474
7475 /* The 3rd operand can't be immediate operand. */
7476 gas_assert (operand_type_check (i.types[2], imm) == 0);
7477 }
7478
7479 return 1;
7480 }
7481
7482 static int
7483 process_operands (void)
7484 {
7485 /* Default segment register this instruction will use for memory
7486 accesses. 0 means unknown. This is only for optimizing out
7487 unnecessary segment overrides. */
7488 const seg_entry *default_seg = 0;
7489
7490 if (i.tm.opcode_modifier.sse2avx)
7491 {
7492 /* Legacy encoded insns allow explicit REX prefixes, so these prefixes
7493 need converting. */
7494 i.rex |= i.prefix[REX_PREFIX] & (REX_W | REX_R | REX_X | REX_B);
7495 i.prefix[REX_PREFIX] = 0;
7496 i.rex_encoding = 0;
7497 }
7498 /* ImmExt should be processed after SSE2AVX. */
7499 else if (i.tm.opcode_modifier.immext)
7500 process_immext ();
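/* E.g. (illustrative): under -msse2avx,

     addps %xmm12, %xmm1  ->  vaddps %xmm12, %xmm1, %xmm1

   and any REX bits the legacy encoding would have used must be
   re-expressed through VEX.R/X/B/W, hence the conversion above.  */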
7501
7502 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
7503 {
7504 unsigned int dupl = i.operands;
7505 unsigned int dest = dupl - 1;
7506 unsigned int j;
7507
7508 /* The destination must be an xmm register. */
7509 gas_assert (i.reg_operands
7510 && MAX_OPERANDS > dupl
7511 && operand_type_equal (&i.types[dest], &regxmm));
7512
7513 if (i.tm.operand_types[0].bitfield.instance == Accum
7514 && i.tm.operand_types[0].bitfield.xmmword)
7515 {
7516 if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
7517 {
7518 /* Keep xmm0 for instructions with VEX prefix and 3
7519 sources. */
7520 i.tm.operand_types[0].bitfield.instance = InstanceNone;
7521 i.tm.operand_types[0].bitfield.class = RegSIMD;
7522 goto duplicate;
7523 }
7524 else
7525 {
7526 /* We remove the first xmm0 and keep the number of
7527 operands unchanged, which in fact duplicates the
7528 destination. */
7529 for (j = 1; j < i.operands; j++)
7530 {
7531 i.op[j - 1] = i.op[j];
7532 i.types[j - 1] = i.types[j];
7533 i.tm.operand_types[j - 1] = i.tm.operand_types[j];
7534 i.flags[j - 1] = i.flags[j];
7535 }
7536 }
7537 }
7538 else if (i.tm.opcode_modifier.implicit1stxmm0)
7539 {
7540 gas_assert ((MAX_OPERANDS - 1) > dupl
7541 && (i.tm.opcode_modifier.vexsources
7542 == VEX3SOURCES));
7543
7544 /* Add the implicit xmm0 for instructions with VEX prefix
7545 and 3 sources. */
7546 for (j = i.operands; j > 0; j--)
7547 {
7548 i.op[j] = i.op[j - 1];
7549 i.types[j] = i.types[j - 1];
7550 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
7551 i.flags[j] = i.flags[j - 1];
7552 }
7553 i.op[0].regs
7554 = (const reg_entry *) str_hash_find (reg_hash, "xmm0");
7555 i.types[0] = regxmm;
7556 i.tm.operand_types[0] = regxmm;
7557
7558 i.operands += 2;
7559 i.reg_operands += 2;
7560 i.tm.operands += 2;
7561
7562 dupl++;
7563 dest++;
7564 i.op[dupl] = i.op[dest];
7565 i.types[dupl] = i.types[dest];
7566 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7567 i.flags[dupl] = i.flags[dest];
7568 }
7569 else
7570 {
7571 duplicate:
7572 i.operands++;
7573 i.reg_operands++;
7574 i.tm.operands++;
7575
7576 i.op[dupl] = i.op[dest];
7577 i.types[dupl] = i.types[dest];
7578 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7579 i.flags[dupl] = i.flags[dest];
7580 }
7581
7582 if (i.tm.opcode_modifier.immext)
7583 process_immext ();
7584 }
7585 else if (i.tm.operand_types[0].bitfield.instance == Accum
7586 && i.tm.operand_types[0].bitfield.xmmword)
7587 {
7588 unsigned int j;
7589
7590 for (j = 1; j < i.operands; j++)
7591 {
7592 i.op[j - 1] = i.op[j];
7593 i.types[j - 1] = i.types[j];
7594
7595 /* We need to adjust fields in i.tm since they are used by
7596 build_modrm_byte. */
7597 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
7598
7599 i.flags[j - 1] = i.flags[j];
7600 }
7601
7602 i.operands--;
7603 i.reg_operands--;
7604 i.tm.operands--;
7605 }
7606 else if (i.tm.opcode_modifier.implicitquadgroup)
7607 {
7608 unsigned int regnum, first_reg_in_group, last_reg_in_group;
7609
7610 /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
7611 gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
7612 regnum = register_number (i.op[1].regs);
7613 first_reg_in_group = regnum & ~3;
7614 last_reg_in_group = first_reg_in_group + 3;
7615 if (regnum != first_reg_in_group)
7616 as_warn (_("source register `%s%s' implicitly denotes"
7617 " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
7618 register_prefix, i.op[1].regs->reg_name,
7619 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
7620 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
7621 i.tm.name);
7622 }
7623 else if (i.tm.opcode_modifier.regkludge)
7624 {
7625 /* The imul $imm, %reg instruction is converted into
7626 imul $imm, %reg, %reg, and the clr %reg instruction
7627 is converted into xor %reg, %reg. */
7628
7629 unsigned int first_reg_op;
7630
7631 if (operand_type_check (i.types[0], reg))
7632 first_reg_op = 0;
7633 else
7634 first_reg_op = 1;
7635 /* Pretend we saw the extra register operand. */
7636 gas_assert (i.reg_operands == 1
7637 && i.op[first_reg_op + 1].regs == 0);
7638 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7639 i.types[first_reg_op + 1] = i.types[first_reg_op];
7640 i.operands++;
7641 i.reg_operands++;
7642 }
7643
7644 if (i.tm.opcode_modifier.modrm)
7645 {
7646 /* The opcode is completed (modulo i.tm.extension_opcode which
7647 must be put into the modrm byte). Now, we make the modrm and
7648 index base bytes based on all the info we've collected. */
7649
7650 default_seg = build_modrm_byte ();
7651 }
7652 else if (i.types[0].bitfield.class == SReg)
7653 {
7654 if (flag_code != CODE_64BIT
7655 ? i.tm.base_opcode == POP_SEG_SHORT
7656 && i.op[0].regs->reg_num == 1
7657 : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
7658 && i.op[0].regs->reg_num < 4)
7659 {
7660 as_bad (_("you can't `%s %s%s'"),
7661 i.tm.name, register_prefix, i.op[0].regs->reg_name);
7662 return 0;
7663 }
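/* The check above rejects "pop %cs" (segment register number 1) in
   16/32-bit code, and push/pop of %es/%cs/%ss/%ds (numbers 0..3) in
   64-bit code, where only %fs and %gs can be pushed or popped.  */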
7664 if (i.op[0].regs->reg_num > 3 && i.tm.opcode_length == 1)
7665 {
7666 i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
7667 i.tm.opcode_length = 2;
7668 }
7669 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
7670 }
7671 else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
7672 {
7673 default_seg = &ds;
7674 }
7675 else if (i.tm.opcode_modifier.isstring)
7676 {
7677 /* For the string instructions that allow a segment override
7678 on one of their operands, the default segment is ds. */
7679 default_seg = &ds;
7680 }
7681 else if (i.short_form)
7682 {
7683 /* The register or float register operand is in operand
7684 0 or 1. */
7685 unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
7686
7687 /* Register goes in low 3 bits of opcode. */
7688 i.tm.base_opcode |= i.op[op].regs->reg_num;
7689 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7690 i.rex |= REX_B;
7691 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7692 {
7693 /* Warn about some common errors, but press on regardless.
7694 The first case can be generated by gcc (<= 2.8.1). */
7695 if (i.operands == 2)
7696 {
7697 /* Reversed arguments on faddp, fsubp, etc. */
7698 as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7699 register_prefix, i.op[!intel_syntax].regs->reg_name,
7700 register_prefix, i.op[intel_syntax].regs->reg_name);
7701 }
7702 else
7703 {
7704 /* Extraneous `l' suffix on fp insn. */
7705 as_warn (_("translating to `%s %s%s'"), i.tm.name,
7706 register_prefix, i.op[0].regs->reg_name);
7707 }
7708 }
7709 }
7710
7711 if ((i.seg[0] || i.prefix[SEG_PREFIX])
7712 && i.tm.base_opcode == 0x8d /* lea */
7713 && !is_any_vex_encoding (&i.tm))
7714 {
7715 if (!quiet_warnings)
7716 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7717 if (optimize)
7718 {
7719 i.seg[0] = NULL;
7720 i.prefix[SEG_PREFIX] = 0;
7721 }
7722 }
7723
7724 /* If a segment was explicitly specified, and the specified segment
7725 is neither the default nor the one already recorded from a prefix,
7726 use an opcode prefix to select it. If we never figured out what
7727 the default segment is, then default_seg will be zero at this
7728 point, and the specified segment prefix will always be used. */
7729 if (i.seg[0]
7730 && i.seg[0] != default_seg
7731 && i.seg[0]->seg_prefix != i.prefix[SEG_PREFIX])
7732 {
7733 if (!add_prefix (i.seg[0]->seg_prefix))
7734 return 0;
7735 }
7736 return 1;
7737 }
7738
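/* Record the extension bits of register R: if R carries RegRex, the
   given REX bit is set in i.rex (diagnosing a duplicate); if it
   carries RegVRex, the same bit is set in i.vrex.  With DO_SSE2AVX,
   a REX bit that is already set while R is the current VEX register
   specifier is instead absorbed by bumping the specifier 8 entries
   forward in the register table, i.e. to the corresponding high
   register.  */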
7739 static INLINE void set_rex_vrex (const reg_entry *r, unsigned int rex_bit,
7740 bfd_boolean do_sse2avx)
7741 {
7742 if (r->reg_flags & RegRex)
7743 {
7744 if (i.rex & rex_bit)
7745 as_bad (_("same type of prefix used twice"));
7746 i.rex |= rex_bit;
7747 }
7748 else if (do_sse2avx && (i.rex & rex_bit) && i.vex.register_specifier)
7749 {
7750 gas_assert (i.vex.register_specifier == r);
7751 i.vex.register_specifier += 8;
7752 }
7753
7754 if (r->reg_flags & RegVRex)
7755 i.vrex |= rex_bit;
7756 }
7757
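/* Build the ModRM byte (and the SIB byte, when one is needed) from
   the operand information collected so far.  The ModRM byte packs
   three fields:

        7    6 5      3 2      0
      +------+--------+--------+
      | mode |  reg   |  r/m   |
      +------+--------+--------+

   Illustrative example (not a transcript of any one path below):
   AT&T "movl %eax, %ebx" uses opcode 0x89 with mode 3, reg = %eax
   (0) and r/m = %ebx (3), i.e. ModRM = 0xc3.  */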
7758 static const seg_entry *
7759 build_modrm_byte (void)
7760 {
7761 const seg_entry *default_seg = 0;
7762 unsigned int source, dest;
7763 int vex_3_sources;
7764
7765 vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
7766 if (vex_3_sources)
7767 {
7768 unsigned int nds, reg_slot;
7769 expressionS *exp;
7770
7771 dest = i.operands - 1;
7772 nds = dest - 1;
7773
7774 /* There are 2 kinds of instructions:
7775 1. 5 operands: 4 register operands or 3 register operands
7776 plus 1 memory operand plus one Imm4 operand, VexXDS, and
7777 VexW0 or VexW1. The destination must be either XMM, YMM or
7778 ZMM register.
7779 2. 4 operands: 4 register operands or 3 register operands
7780 plus 1 memory operand, with VexXDS. */
7781 gas_assert ((i.reg_operands == 4
7782 || (i.reg_operands == 3 && i.mem_operands == 1))
7783 && i.tm.opcode_modifier.vexvvvv == VEXXDS
7784 && i.tm.opcode_modifier.vexw
7785 && i.tm.operand_types[dest].bitfield.class == RegSIMD);
7786
7787 /* If VexW1 is set, the first non-immediate operand is the source and
7788 the second non-immediate one is encoded in the immediate operand. */
7789 if (i.tm.opcode_modifier.vexw == VEXW1)
7790 {
7791 source = i.imm_operands;
7792 reg_slot = i.imm_operands + 1;
7793 }
7794 else
7795 {
7796 source = i.imm_operands + 1;
7797 reg_slot = i.imm_operands;
7798 }
7799
7800 if (i.imm_operands == 0)
7801 {
7802 /* When there is no immediate operand, generate an 8bit
7803 immediate operand to encode the first operand. */
7804 exp = &im_expressions[i.imm_operands++];
7805 i.op[i.operands].imms = exp;
7806 i.types[i.operands] = imm8;
7807 i.operands++;
7808
7809 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7810 exp->X_op = O_constant;
7811 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
7812 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7813 }
7814 else
7815 {
7816 gas_assert (i.imm_operands == 1);
7817 gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7818 gas_assert (!i.tm.opcode_modifier.immext);
7819
7820 /* Turn on Imm8 again so that output_imm will generate it. */
7821 i.types[0].bitfield.imm8 = 1;
7822
7823 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7824 i.op[0].imms->X_add_number
7825 |= register_number (i.op[reg_slot].regs) << 4;
7826 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7827 }
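/* Illustrative example: in a VEX 4-operand form such as AT&T
   "vblendvps %xmm4, %xmm3, %xmm2, %xmm1", the extra register
   (%xmm4 here) travels in bits 7:4 of the trailing imm8, which is
   why register_number () is shifted left by 4 above.  */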
7828
7829 gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
7830 i.vex.register_specifier = i.op[nds].regs;
7831 }
7832 else
7833 source = dest = 0;
7834
7835 /* i.reg_operands MUST be the number of real register operands;
7836 implicit registers do not count. If there are 3 register
7837 operands, it must be an instruction with VexNDS. For an
7838 instruction with VexNDD, the destination register is encoded
7839 in the VEX prefix. If there are 4 register operands, it must be
7840 an instruction with a VEX prefix and 3 sources. */
7841 if (i.mem_operands == 0
7842 && ((i.reg_operands == 2
7843 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7844 || (i.reg_operands == 3
7845 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7846 || (i.reg_operands == 4 && vex_3_sources)))
7847 {
7848 switch (i.operands)
7849 {
7850 case 2:
7851 source = 0;
7852 break;
7853 case 3:
7854 /* When there are 3 operands, one of them may be an immediate,
7855 which may be the first or the last operand. Otherwise,
7856 the first operand must be the shift count register (cl), or
7857 this is an instruction with VexNDS. */
7858 gas_assert (i.imm_operands == 1
7859 || (i.imm_operands == 0
7860 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
7861 || (i.types[0].bitfield.instance == RegC
7862 && i.types[0].bitfield.byte))));
7863 if (operand_type_check (i.types[0], imm)
7864 || (i.types[0].bitfield.instance == RegC
7865 && i.types[0].bitfield.byte))
7866 source = 1;
7867 else
7868 source = 0;
7869 break;
7870 case 4:
7871 /* When there are 4 operands, the first two must be 8bit
7872 immediate operands. The source operand will be the 3rd
7873 one.
7874
7875 For instructions with VexNDS, if the first operand is
7876 an imm8, the source operand is the 2nd one. If the last
7877 operand is imm8, the source operand is the first one. */
7878 gas_assert ((i.imm_operands == 2
7879 && i.types[0].bitfield.imm8
7880 && i.types[1].bitfield.imm8)
7881 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7882 && i.imm_operands == 1
7883 && (i.types[0].bitfield.imm8
7884 || i.types[i.operands - 1].bitfield.imm8
7885 || i.rounding)));
7886 if (i.imm_operands == 2)
7887 source = 2;
7888 else
7889 {
7890 if (i.types[0].bitfield.imm8)
7891 source = 1;
7892 else
7893 source = 0;
7894 }
7895 break;
7896 case 5:
7897 if (is_evex_encoding (&i.tm))
7898 {
7899 /* For EVEX instructions, when there are 5 operands, the
7900 first one must be an immediate operand. If the second one
7901 is an immediate operand, the source operand is the 3rd
7902 one. If the last one is an immediate operand, the source
7903 operand is the 2nd one. */
7904 gas_assert (i.imm_operands == 2
7905 && i.tm.opcode_modifier.sae
7906 && operand_type_check (i.types[0], imm));
7907 if (operand_type_check (i.types[1], imm))
7908 source = 2;
7909 else if (operand_type_check (i.types[4], imm))
7910 source = 1;
7911 else
7912 abort ();
7913 }
7914 break;
7915 default:
7916 abort ();
7917 }
7918
7919 if (!vex_3_sources)
7920 {
7921 dest = source + 1;
7922
7923 /* The RC/SAE operand could be between DEST and SRC. That happens
7924 when one operand is a GPR and the other one is an XMM/YMM/ZMM
7925 register. */
7926 if (i.rounding && i.rounding->operand == (int) dest)
7927 dest++;
7928
7929 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7930 {
7931 /* For instructions with VexNDS, the register-only source
7932 operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7933 register. It is encoded in VEX prefix. */
7934
7935 i386_operand_type op;
7936 unsigned int vvvv;
7937
7938 /* Swap two source operands if needed. */
7939 if (i.tm.opcode_modifier.swapsources)
7940 {
7941 vvvv = source;
7942 source = dest;
7943 }
7944 else
7945 vvvv = dest;
7946
7947 op = i.tm.operand_types[vvvv];
7948 if ((dest + 1) >= i.operands
7949 || ((op.bitfield.class != Reg
7950 || (!op.bitfield.dword && !op.bitfield.qword))
7951 && op.bitfield.class != RegSIMD
7952 && !operand_type_equal (&op, &regmask)))
7953 abort ();
7954 i.vex.register_specifier = i.op[vvvv].regs;
7955 dest++;
7956 }
7957 }
7958
7959 i.rm.mode = 3;
7960 /* One of the register operands will be encoded in the i.rm.reg
7961 field, the other in the combined i.rm.mode and i.rm.regmem
7962 fields. If no form of this instruction supports a memory
7963 destination operand, then we assume the source operand may
7964 sometimes be a memory operand and so we need to store the
7965 destination in the i.rm.reg field. */
7966 if (!i.tm.opcode_modifier.regmem
7967 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
7968 {
7969 i.rm.reg = i.op[dest].regs->reg_num;
7970 i.rm.regmem = i.op[source].regs->reg_num;
7971 set_rex_vrex (i.op[dest].regs, REX_R, i.tm.opcode_modifier.sse2avx);
7972 set_rex_vrex (i.op[source].regs, REX_B, FALSE);
7973 }
7974 else
7975 {
7976 i.rm.reg = i.op[source].regs->reg_num;
7977 i.rm.regmem = i.op[dest].regs->reg_num;
7978 set_rex_vrex (i.op[dest].regs, REX_B, i.tm.opcode_modifier.sse2avx);
7979 set_rex_vrex (i.op[source].regs, REX_R, FALSE);
7980 }
7981 if (flag_code != CODE_64BIT && (i.rex & REX_R))
7982 {
7983 if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
7984 abort ();
7985 i.rex &= ~REX_R;
7986 add_prefix (LOCK_PREFIX_OPCODE);
7987 }
7988 }
7989 else
7990 { /* If it's not 2 reg operands... */
7991 unsigned int mem;
7992
7993 if (i.mem_operands)
7994 {
7995 unsigned int fake_zero_displacement = 0;
7996 unsigned int op;
7997
7998 for (op = 0; op < i.operands; op++)
7999 if (i.flags[op] & Operand_Mem)
8000 break;
8001 gas_assert (op < i.operands);
8002
8003 if (i.tm.opcode_modifier.sib)
8004 {
8005 /* The index register of VSIB shouldn't be RegIZ. */
8006 if (i.tm.opcode_modifier.sib != SIBMEM
8007 && i.index_reg->reg_num == RegIZ)
8008 abort ();
8009
8010 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8011 if (!i.base_reg)
8012 {
8013 i.sib.base = NO_BASE_REGISTER;
8014 i.sib.scale = i.log2_scale_factor;
8015 i.types[op].bitfield.disp8 = 0;
8016 i.types[op].bitfield.disp16 = 0;
8017 i.types[op].bitfield.disp64 = 0;
8018 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
8019 {
8020 /* Must be 32 bit */
8021 i.types[op].bitfield.disp32 = 1;
8022 i.types[op].bitfield.disp32s = 0;
8023 }
8024 else
8025 {
8026 i.types[op].bitfield.disp32 = 0;
8027 i.types[op].bitfield.disp32s = 1;
8028 }
8029 }
8030
8031 /* Since the mandatory SIB always has an index register, the
8032 code logic remains unchanged. A non-mandatory SIB
8033 without an index register is allowed and will be handled
8034 later. */
8035 if (i.index_reg)
8036 {
8037 if (i.index_reg->reg_num == RegIZ)
8038 i.sib.index = NO_INDEX_REGISTER;
8039 else
8040 i.sib.index = i.index_reg->reg_num;
8041 set_rex_vrex (i.index_reg, REX_X, FALSE);
8042 }
8043 }
8044
8045 default_seg = &ds;
8046
8047 if (i.base_reg == 0)
8048 {
8049 i.rm.mode = 0;
8050 if (!i.disp_operands)
8051 fake_zero_displacement = 1;
8052 if (i.index_reg == 0)
8053 {
8054 i386_operand_type newdisp;
8055
8056 /* Check for both VSIB and the mandatory non-vector SIB. */
8057 gas_assert (!i.tm.opcode_modifier.sib
8058 || i.tm.opcode_modifier.sib == SIBMEM);
8059 /* Operand is just <disp> */
8060 if (flag_code == CODE_64BIT)
8061 {
8062 /* In 64-bit mode the plain 32-bit absolute addressing
8063 form is replaced by RIP-relative addressing, so
8064 absolute addressing must be encoded by one of the
8065 redundant SIB forms. */
8066 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8067 i.sib.base = NO_BASE_REGISTER;
8068 i.sib.index = NO_INDEX_REGISTER;
8069 newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
8070 }
8071 else if ((flag_code == CODE_16BIT)
8072 ^ (i.prefix[ADDR_PREFIX] != 0))
8073 {
8074 i.rm.regmem = NO_BASE_REGISTER_16;
8075 newdisp = disp16;
8076 }
8077 else
8078 {
8079 i.rm.regmem = NO_BASE_REGISTER;
8080 newdisp = disp32;
8081 }
8082 i.types[op] = operand_type_and_not (i.types[op], anydisp);
8083 i.types[op] = operand_type_or (i.types[op], newdisp);
8084 }
8085 else if (!i.tm.opcode_modifier.sib)
8086 {
8087 /* !i.base_reg && i.index_reg */
8088 if (i.index_reg->reg_num == RegIZ)
8089 i.sib.index = NO_INDEX_REGISTER;
8090 else
8091 i.sib.index = i.index_reg->reg_num;
8092 i.sib.base = NO_BASE_REGISTER;
8093 i.sib.scale = i.log2_scale_factor;
8094 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8095 i.types[op].bitfield.disp8 = 0;
8096 i.types[op].bitfield.disp16 = 0;
8097 i.types[op].bitfield.disp64 = 0;
8098 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
8099 {
8100 /* Must be 32 bit */
8101 i.types[op].bitfield.disp32 = 1;
8102 i.types[op].bitfield.disp32s = 0;
8103 }
8104 else
8105 {
8106 i.types[op].bitfield.disp32 = 0;
8107 i.types[op].bitfield.disp32s = 1;
8108 }
8109 if ((i.index_reg->reg_flags & RegRex) != 0)
8110 i.rex |= REX_X;
8111 }
8112 }
8113 /* RIP addressing for 64bit mode. */
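/* Illustrative example: "movq foo(%rip), %rax" encodes as mode 0,
   r/m 5 with a 4-byte displacement (48 8b 05 <disp32>); a bare
   "(%rip)" operand gets a fake zero displacement below, since this
   form always carries a disp32.  */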
8114 else if (i.base_reg->reg_num == RegIP)
8115 {
8116 gas_assert (!i.tm.opcode_modifier.sib);
8117 i.rm.regmem = NO_BASE_REGISTER;
8118 i.types[op].bitfield.disp8 = 0;
8119 i.types[op].bitfield.disp16 = 0;
8120 i.types[op].bitfield.disp32 = 0;
8121 i.types[op].bitfield.disp32s = 1;
8122 i.types[op].bitfield.disp64 = 0;
8123 i.flags[op] |= Operand_PCrel;
8124 if (! i.disp_operands)
8125 fake_zero_displacement = 1;
8126 }
8127 else if (i.base_reg->reg_type.bitfield.word)
8128 {
8129 gas_assert (!i.tm.opcode_modifier.sib);
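/* For reference, the 16-bit r/m encodings produced below are:
   0 (%bx,%si)  1 (%bx,%di)  2 (%bp,%si)  3 (%bp,%di)
   4 (%si)      5 (%di)      6 (%bp), or disp16 when mode is 0
   7 (%bx).  */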
8130 switch (i.base_reg->reg_num)
8131 {
8132 case 3: /* (%bx) */
8133 if (i.index_reg == 0)
8134 i.rm.regmem = 7;
8135 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
8136 i.rm.regmem = i.index_reg->reg_num - 6;
8137 break;
8138 case 5: /* (%bp) */
8139 default_seg = &ss;
8140 if (i.index_reg == 0)
8141 {
8142 i.rm.regmem = 6;
8143 if (operand_type_check (i.types[op], disp) == 0)
8144 {
8145 /* fake (%bp) into 0(%bp) */
8146 if (i.disp_encoding == disp_encoding_16bit)
8147 i.types[op].bitfield.disp16 = 1;
8148 else
8149 i.types[op].bitfield.disp8 = 1;
8150 fake_zero_displacement = 1;
8151 }
8152 }
8153 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
8154 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
8155 break;
8156 default: /* (%si) -> 4 or (%di) -> 5 */
8157 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
8158 }
8159 if (!fake_zero_displacement
8160 && !i.disp_operands
8161 && i.disp_encoding)
8162 {
8163 fake_zero_displacement = 1;
8164 if (i.disp_encoding == disp_encoding_8bit)
8165 i.types[op].bitfield.disp8 = 1;
8166 else
8167 i.types[op].bitfield.disp16 = 1;
8168 }
8169 i.rm.mode = mode_from_disp_size (i.types[op]);
8170 }
8171 else /* i.base_reg and 32/64 bit mode */
8172 {
8173 if (flag_code == CODE_64BIT
8174 && operand_type_check (i.types[op], disp))
8175 {
8176 i.types[op].bitfield.disp16 = 0;
8177 i.types[op].bitfield.disp64 = 0;
8178 if (i.prefix[ADDR_PREFIX] == 0)
8179 {
8180 i.types[op].bitfield.disp32 = 0;
8181 i.types[op].bitfield.disp32s = 1;
8182 }
8183 else
8184 {
8185 i.types[op].bitfield.disp32 = 1;
8186 i.types[op].bitfield.disp32s = 0;
8187 }
8188 }
8189
8190 if (!i.tm.opcode_modifier.sib)
8191 i.rm.regmem = i.base_reg->reg_num;
8192 if ((i.base_reg->reg_flags & RegRex) != 0)
8193 i.rex |= REX_B;
8194 i.sib.base = i.base_reg->reg_num;
8195 /* x86-64 ignores REX prefix bit here to avoid decoder
8196 complications. */
8197 if (!(i.base_reg->reg_flags & RegRex)
8198 && (i.base_reg->reg_num == EBP_REG_NUM
8199 || i.base_reg->reg_num == ESP_REG_NUM))
8200 default_seg = &ss;
8201 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
8202 {
8203 fake_zero_displacement = 1;
8204 if (i.disp_encoding == disp_encoding_32bit)
8205 i.types[op].bitfield.disp32 = 1;
8206 else
8207 i.types[op].bitfield.disp8 = 1;
8208 }
8209 i.sib.scale = i.log2_scale_factor;
8210 if (i.index_reg == 0)
8211 {
8212 /* Only check for VSIB. */
8213 gas_assert (i.tm.opcode_modifier.sib != VECSIB128
8214 && i.tm.opcode_modifier.sib != VECSIB256
8215 && i.tm.opcode_modifier.sib != VECSIB512);
8216
8217 /* <disp>(%esp) becomes two byte modrm with no index
8218 register. We've already stored the code for esp
8219 in i.rm.regmem, i.e. ESCAPE_TO_TWO_BYTE_ADDRESSING.
8220 Any base register besides %esp will not use the
8221 extra modrm byte. */
8222 i.sib.index = NO_INDEX_REGISTER;
8223 }
8224 else if (!i.tm.opcode_modifier.sib)
8225 {
8226 if (i.index_reg->reg_num == RegIZ)
8227 i.sib.index = NO_INDEX_REGISTER;
8228 else
8229 i.sib.index = i.index_reg->reg_num;
8230 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8231 if ((i.index_reg->reg_flags & RegRex) != 0)
8232 i.rex |= REX_X;
8233 }
8234
8235 if (i.disp_operands
8236 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
8237 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
8238 i.rm.mode = 0;
8239 else
8240 {
8241 if (!fake_zero_displacement
8242 && !i.disp_operands
8243 && i.disp_encoding)
8244 {
8245 fake_zero_displacement = 1;
8246 if (i.disp_encoding == disp_encoding_8bit)
8247 i.types[op].bitfield.disp8 = 1;
8248 else
8249 i.types[op].bitfield.disp32 = 1;
8250 }
8251 i.rm.mode = mode_from_disp_size (i.types[op]);
8252 }
8253 }
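/* Worked example (illustrative) for the path above: AT&T
   "movl 8(%ebx,%esi,4), %eax" yields ModRM = 0x44 (mode 1 = disp8,
   reg = %eax, r/m = 4 = SIB follows), SIB = 0xb3 (scale 2,
   index = %esi, base = %ebx) and a one-byte displacement, giving
   the bytes 8b 44 b3 08.  */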
8254
8255 if (fake_zero_displacement)
8256 {
8257 /* Fakes a zero displacement assuming that i.types[op]
8258 holds the correct displacement size. */
8259 expressionS *exp;
8260
8261 gas_assert (i.op[op].disps == 0);
8262 exp = &disp_expressions[i.disp_operands++];
8263 i.op[op].disps = exp;
8264 exp->X_op = O_constant;
8265 exp->X_add_number = 0;
8266 exp->X_add_symbol = (symbolS *) 0;
8267 exp->X_op_symbol = (symbolS *) 0;
8268 }
8269
8270 mem = op;
8271 }
8272 else
8273 mem = ~0;
8274
8275 if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
8276 {
8277 if (operand_type_check (i.types[0], imm))
8278 i.vex.register_specifier = NULL;
8279 else
8280 {
8281 /* VEX.vvvv encodes one of the sources when the first
8282 operand is not an immediate. */
8283 if (i.tm.opcode_modifier.vexw == VEXW0)
8284 i.vex.register_specifier = i.op[0].regs;
8285 else
8286 i.vex.register_specifier = i.op[1].regs;
8287 }
8288
8289 /* The destination is an XMM register encoded in the ModRM.reg
8290 field and the VEX.R bit. */
8291 i.rm.reg = i.op[2].regs->reg_num;
8292 if ((i.op[2].regs->reg_flags & RegRex) != 0)
8293 i.rex |= REX_R;
8294
8295 /* ModRM.rm and VEX.B encode the other source. */
8296 if (!i.mem_operands)
8297 {
8298 i.rm.mode = 3;
8299
8300 if (i.tm.opcode_modifier.vexw == VEXW0)
8301 i.rm.regmem = i.op[1].regs->reg_num;
8302 else
8303 i.rm.regmem = i.op[0].regs->reg_num;
8304
8305 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8306 i.rex |= REX_B;
8307 }
8308 }
8309 else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
8310 {
8311 i.vex.register_specifier = i.op[2].regs;
8312 if (!i.mem_operands)
8313 {
8314 i.rm.mode = 3;
8315 i.rm.regmem = i.op[1].regs->reg_num;
8316 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8317 i.rex |= REX_B;
8318 }
8319 }
8320 /* Fill in i.rm.reg or i.rm.regmem field with register operand
8321 (if any) based on i.tm.extension_opcode. Again, we must be
8322 careful to make sure that segment/control/debug/test/MMX
8323 registers are coded into the i.rm.reg field. */
8324 else if (i.reg_operands)
8325 {
8326 unsigned int op;
8327 unsigned int vex_reg = ~0;
8328
8329 for (op = 0; op < i.operands; op++)
8330 if (i.types[op].bitfield.class == Reg
8331 || i.types[op].bitfield.class == RegBND
8332 || i.types[op].bitfield.class == RegMask
8333 || i.types[op].bitfield.class == SReg
8334 || i.types[op].bitfield.class == RegCR
8335 || i.types[op].bitfield.class == RegDR
8336 || i.types[op].bitfield.class == RegTR
8337 || i.types[op].bitfield.class == RegSIMD
8338 || i.types[op].bitfield.class == RegMMX)
8339 break;
8340
8341 if (vex_3_sources)
8342 op = dest;
8343 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
8344 {
8345 /* For instructions with VexNDS, the register-only
8346 source operand is encoded in VEX prefix. */
8347 gas_assert (mem != (unsigned int) ~0);
8348
8349 if (op > mem)
8350 {
8351 vex_reg = op++;
8352 gas_assert (op < i.operands);
8353 }
8354 else
8355 {
8356 /* Check register-only source operand when two source
8357 operands are swapped. */
8358 if (!i.tm.operand_types[op].bitfield.baseindex
8359 && i.tm.operand_types[op + 1].bitfield.baseindex)
8360 {
8361 vex_reg = op;
8362 op += 2;
8363 gas_assert (mem == (vex_reg + 1)
8364 && op < i.operands);
8365 }
8366 else
8367 {
8368 vex_reg = op + 1;
8369 gas_assert (vex_reg < i.operands);
8370 }
8371 }
8372 }
8373 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
8374 {
8375 /* For instructions with VexNDD, the register destination
8376 is encoded in VEX prefix. */
8377 if (i.mem_operands == 0)
8378 {
8379 /* There is no memory operand. */
8380 gas_assert ((op + 2) == i.operands);
8381 vex_reg = op + 1;
8382 }
8383 else
8384 {
8385 /* There are only 2 non-immediate operands. */
8386 gas_assert (op < i.imm_operands + 2
8387 && i.operands == i.imm_operands + 2);
8388 vex_reg = i.imm_operands + 1;
8389 }
8390 }
8391 else
8392 gas_assert (op < i.operands);
8393
8394 if (vex_reg != (unsigned int) ~0)
8395 {
8396 i386_operand_type *type = &i.tm.operand_types[vex_reg];
8397
8398 if ((type->bitfield.class != Reg
8399 || (!type->bitfield.dword && !type->bitfield.qword))
8400 && type->bitfield.class != RegSIMD
8401 && !operand_type_equal (type, &regmask))
8402 abort ();
8403
8404 i.vex.register_specifier = i.op[vex_reg].regs;
8405 }
8406
8407 /* Don't set OP operand twice. */
8408 if (vex_reg != op)
8409 {
8410 /* If there is an extension opcode to put here, the
8411 register number must be put into the regmem field. */
8412 if (i.tm.extension_opcode != None)
8413 {
8414 i.rm.regmem = i.op[op].regs->reg_num;
8415 set_rex_vrex (i.op[op].regs, REX_B,
8416 i.tm.opcode_modifier.sse2avx);
8417 }
8418 else
8419 {
8420 i.rm.reg = i.op[op].regs->reg_num;
8421 set_rex_vrex (i.op[op].regs, REX_R,
8422 i.tm.opcode_modifier.sse2avx);
8423 }
8424 }
8425
8426 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
8427 must set it to 3 to indicate this is a register operand
8428 in the regmem field. */
8429 if (!i.mem_operands)
8430 i.rm.mode = 3;
8431 }
8432
8433 /* Fill in i.rm.reg field with extension opcode (if any). */
8434 if (i.tm.extension_opcode != None)
8435 i.rm.reg = i.tm.extension_opcode;
8436 }
8437 return default_seg;
8438 }
8439
8440 static INLINE void
8441 frag_opcode_byte (unsigned char byte)
8442 {
8443 if (now_seg != absolute_section)
8444 FRAG_APPEND_1_CHAR (byte);
8445 else
8446 ++abs_section_offset;
8447 }
8448
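/* Helper for the 0x66 operand-size prefix on branches: return CODE16
   when the prefix flips the displacement width, i.e. when REX.W is
   not in effect and the template supports a displacement of the
   other width.  Callers XOR the result into their code16 flag.  */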
8449 static unsigned int
8450 flip_code16 (unsigned int code16)
8451 {
8452 gas_assert (i.tm.operands == 1);
8453
8454 return !(i.prefix[REX_PREFIX] & REX_W)
8455 && (code16 ? i.tm.operand_types[0].bitfield.disp32
8456 || i.tm.operand_types[0].bitfield.disp32s
8457 : i.tm.operand_types[0].bitfield.disp16)
8458 ? CODE16 : 0;
8459 }
8460
8461 static void
8462 output_branch (void)
8463 {
8464 char *p;
8465 int size;
8466 int code16;
8467 int prefix;
8468 relax_substateT subtype;
8469 symbolS *sym;
8470 offsetT off;
8471
8472 if (now_seg == absolute_section)
8473 {
8474 as_bad (_("relaxable branches not supported in absolute section"));
8475 return;
8476 }
8477
8478 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
8479 size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
8480
8481 prefix = 0;
8482 if (i.prefix[DATA_PREFIX] != 0)
8483 {
8484 prefix = 1;
8485 i.prefixes -= 1;
8486 code16 ^= flip_code16 (code16);
8487 }
8488 /* Pentium4 branch hints. */
8489 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8490 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8491 {
8492 prefix++;
8493 i.prefixes--;
8494 }
8495 if (i.prefix[REX_PREFIX] != 0)
8496 {
8497 prefix++;
8498 i.prefixes--;
8499 }
8500
8501 /* BND prefixed jump. */
8502 if (i.prefix[BND_PREFIX] != 0)
8503 {
8504 prefix++;
8505 i.prefixes--;
8506 }
8507
8508 if (i.prefixes != 0)
8509 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8510
8511 /* It's always a symbol; end the frag & set up for relaxation.
8512 Make sure there is enough room in this frag for the largest
8513 instruction we may generate in md_convert_frag. This is 2
8514 bytes for the opcode and room for the prefix and largest
8515 displacement. */
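/* Illustrative example: in 32-bit code "jne target" starts out as
   the 2-byte 75 <disp8> form; if relaxation finds the target out of
   byte range, md_convert_frag rewrites it as the 6-byte
   0f 85 <disp32> form, hence the room reserved here for one extra
   opcode byte and a 4-byte displacement.  */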
8516 frag_grow (prefix + 2 + 4);
8517 /* Prefix and 1 opcode byte go in fr_fix. */
8518 p = frag_more (prefix + 1);
8519 if (i.prefix[DATA_PREFIX] != 0)
8520 *p++ = DATA_PREFIX_OPCODE;
8521 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
8522 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
8523 *p++ = i.prefix[SEG_PREFIX];
8524 if (i.prefix[BND_PREFIX] != 0)
8525 *p++ = BND_PREFIX_OPCODE;
8526 if (i.prefix[REX_PREFIX] != 0)
8527 *p++ = i.prefix[REX_PREFIX];
8528 *p = i.tm.base_opcode;
8529
8530 if ((unsigned char) *p == JUMP_PC_RELATIVE)
8531 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
8532 else if (cpu_arch_flags.bitfield.cpui386)
8533 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
8534 else
8535 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
8536 subtype |= code16;
8537
8538 sym = i.op[0].disps->X_add_symbol;
8539 off = i.op[0].disps->X_add_number;
8540
8541 if (i.op[0].disps->X_op != O_constant
8542 && i.op[0].disps->X_op != O_symbol)
8543 {
8544 /* Handle complex expressions. */
8545 sym = make_expr_symbol (i.op[0].disps);
8546 off = 0;
8547 }
8548
8549 /* 1 possible extra opcode + 4 byte displacement go in var part.
8550 Pass reloc in fr_var. */
8551 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
8552 }
8553
8554 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8555 /* Return TRUE iff PLT32 relocation should be used for branching to
8556 symbol S. */
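/* For example, on x86-64 ELF a "call foo" against an undefined or
   ordinary global foo gets R_X86_64_PLT32, while a call to a purely
   local symbol keeps the plain PC-relative relocation.  */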
8557
8558 static bfd_boolean
8559 need_plt32_p (symbolS *s)
8560 {
8561 /* PLT32 relocation is ELF only. */
8562 if (!IS_ELF)
8563 return FALSE;
8564
8565 #ifdef TE_SOLARIS
8566 /* Don't emit a PLT32 relocation on Solaris: neither the native
8567 linker nor krtld supports it. */
8568 return FALSE;
8569 #endif
8570
8571 /* Since there is no need to prepare for a PLT branch on x86-64,
8572 we can generate R_X86_64_PLT32 instead of R_X86_64_PC32, and it
8573 can then be used as a marker for 32-bit PC-relative branches. */
8574 if (!object_64bit)
8575 return FALSE;
8576
8577 /* Weak or undefined symbols need a PLT32 relocation. */
8578 if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
8579 return TRUE;
8580
8581 /* A non-global symbol doesn't need a PLT32 relocation. */
8582 if (! S_IS_EXTERNAL (s))
8583 return FALSE;
8584
8585 /* Other global symbols need a PLT32 relocation. NB: Symbols with
8586 non-default visibility are treated as normal global symbols
8587 so that the PLT32 relocation can be used as a marker for 32-bit
8588 PC-relative branches. This is useful for linker relaxation. */
8589 return TRUE;
8590 }
8591 #endif
8592
8593 static void
8594 output_jump (void)
8595 {
8596 char *p;
8597 int size;
8598 fixS *fixP;
8599 bfd_reloc_code_real_type jump_reloc = i.reloc[0];
8600
8601 if (i.tm.opcode_modifier.jump == JUMP_BYTE)
8602 {
8603 /* This is a loop or jecxz type instruction. */
8604 size = 1;
8605 if (i.prefix[ADDR_PREFIX] != 0)
8606 {
8607 frag_opcode_byte (ADDR_PREFIX_OPCODE);
8608 i.prefixes -= 1;
8609 }
8610 /* Pentium4 branch hints. */
8611 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8612 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8613 {
8614 frag_opcode_byte (i.prefix[SEG_PREFIX]);
8615 i.prefixes--;
8616 }
8617 }
8618 else
8619 {
8620 int code16;
8621
8622 code16 = 0;
8623 if (flag_code == CODE_16BIT)
8624 code16 = CODE16;
8625
8626 if (i.prefix[DATA_PREFIX] != 0)
8627 {
8628 frag_opcode_byte (DATA_PREFIX_OPCODE);
8629 i.prefixes -= 1;
8630 code16 ^= flip_code16 (code16);
8631 }
8632
8633 size = 4;
8634 if (code16)
8635 size = 2;
8636 }
8637
8638 /* BND prefixed jump. */
8639 if (i.prefix[BND_PREFIX] != 0)
8640 {
8641 frag_opcode_byte (i.prefix[BND_PREFIX]);
8642 i.prefixes -= 1;
8643 }
8644
8645 if (i.prefix[REX_PREFIX] != 0)
8646 {
8647 frag_opcode_byte (i.prefix[REX_PREFIX]);
8648 i.prefixes -= 1;
8649 }
8650
8651 if (i.prefixes != 0)
8652 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8653
8654 if (now_seg == absolute_section)
8655 {
8656 abs_section_offset += i.tm.opcode_length + size;
8657 return;
8658 }
8659
8660 p = frag_more (i.tm.opcode_length + size);
8661 switch (i.tm.opcode_length)
8662 {
8663 case 2:
8664 *p++ = i.tm.base_opcode >> 8;
8665 /* Fall through. */
8666 case 1:
8667 *p++ = i.tm.base_opcode;
8668 break;
8669 default:
8670 abort ();
8671 }
8672
8673 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8674 if (size == 4
8675 && jump_reloc == NO_RELOC
8676 && need_plt32_p (i.op[0].disps->X_add_symbol))
8677 jump_reloc = BFD_RELOC_X86_64_PLT32;
8678 #endif
8679
8680 jump_reloc = reloc (size, 1, 1, jump_reloc);
8681
8682 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8683 i.op[0].disps, 1, jump_reloc);
8684
8685 /* All jumps handled here are signed, but don't use a signed limit
8686 check for 32 and 16 bit jumps as we want to allow wrap around at
8687 4G and 64k respectively. */
8688 if (size == 1)
8689 fixP->fx_signed = 1;
8690 }
8691
8692 static void
8693 output_interseg_jump (void)
8694 {
8695 char *p;
8696 int size;
8697 int prefix;
8698 int code16;
8699
8700 code16 = 0;
8701 if (flag_code == CODE_16BIT)
8702 code16 = CODE16;
8703
8704 prefix = 0;
8705 if (i.prefix[DATA_PREFIX] != 0)
8706 {
8707 prefix = 1;
8708 i.prefixes -= 1;
8709 code16 ^= CODE16;
8710 }
8711
8712 gas_assert (!i.prefix[REX_PREFIX]);
8713
8714 size = 4;
8715 if (code16)
8716 size = 2;
8717
8718 if (i.prefixes != 0)
8719 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8720
8721 if (now_seg == absolute_section)
8722 {
8723 abs_section_offset += prefix + 1 + 2 + size;
8724 return;
8725 }
8726
8727 /* 1 opcode; 2 segment; offset */
8728 p = frag_more (prefix + 1 + 2 + size);
8729
8730 if (i.prefix[DATA_PREFIX] != 0)
8731 *p++ = DATA_PREFIX_OPCODE;
8732
8733 if (i.prefix[REX_PREFIX] != 0)
8734 *p++ = i.prefix[REX_PREFIX];
8735
8736 *p++ = i.tm.base_opcode;
8737 if (i.op[1].imms->X_op == O_constant)
8738 {
8739 offsetT n = i.op[1].imms->X_add_number;
8740
8741 if (size == 2
8742 && !fits_in_unsigned_word (n)
8743 && !fits_in_signed_word (n))
8744 {
8745 as_bad (_("16-bit jump out of range"));
8746 return;
8747 }
8748 md_number_to_chars (p, n, size);
8749 }
8750 else
8751 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8752 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
8753 if (i.op[0].imms->X_op != O_constant)
8754 as_bad (_("can't handle non absolute segment in `%s'"),
8755 i.tm.name);
8756 md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
8757 }
8758
8759 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8760 void
8761 x86_cleanup (void)
8762 {
8763 char *p;
8764 asection *seg = now_seg;
8765 subsegT subseg = now_subseg;
8766 asection *sec;
8767 unsigned int alignment, align_size_1;
8768 unsigned int isa_1_descsz, feature_2_descsz, descsz;
8769 unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8770 unsigned int padding;
8771
8772 if (!IS_ELF || !x86_used_note)
8773 return;
8774
8775 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8776
8777 /* The .note.gnu.property section layout:
8778
8779 Field Length Contents
8780 ---- ---- ----
8781 n_namsz 4 4
8782 n_descsz 4 The note descriptor size
8783 n_type 4 NT_GNU_PROPERTY_TYPE_0
8784 n_name 4 "GNU"
8785 n_desc n_descsz The program property array
8786 .... .... ....
8787 */
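/* Illustrative sizing, following the arithmetic below: for
   ELFCLASS64 each property (4-byte type + 4-byte size + 4-byte
   data = 12 bytes) is padded to 16, so n_descsz is 32 and the
   section occupies 16 (header) + 32 = 48 bytes; for ELFCLASS32 the
   4-byte alignment leaves 12-byte properties, giving n_descsz = 24
   and 40 bytes in total.  */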
8788
8789 /* Create the .note.gnu.property section. */
8790 sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
8791 bfd_set_section_flags (sec,
8792 (SEC_ALLOC
8793 | SEC_LOAD
8794 | SEC_DATA
8795 | SEC_HAS_CONTENTS
8796 | SEC_READONLY));
8797
8798 if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8799 {
8800 align_size_1 = 7;
8801 alignment = 3;
8802 }
8803 else
8804 {
8805 align_size_1 = 3;
8806 alignment = 2;
8807 }
8808
8809 bfd_set_section_alignment (sec, alignment);
8810 elf_section_type (sec) = SHT_NOTE;
8811
8812 /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8813 + 4-byte data */
8814 isa_1_descsz_raw = 4 + 4 + 4;
8815 /* Align GNU_PROPERTY_X86_ISA_1_USED. */
8816 isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8817
8818 feature_2_descsz_raw = isa_1_descsz;
8819 /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8820 + 4-byte data */
8821 feature_2_descsz_raw += 4 + 4 + 4;
8822 /* Align GNU_PROPERTY_X86_FEATURE_2_USED. */
8823 feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8824 & ~align_size_1);
8825
8826 descsz = feature_2_descsz;
8827 /* Section size: n_namsz + n_descsz + n_type + n_name + n_desc. */
8828 p = frag_more (4 + 4 + 4 + 4 + descsz);
8829
8830 /* Write n_namsz. */
8831 md_number_to_chars (p, (valueT) 4, 4);
8832
8833 /* Write n_descsz. */
8834 md_number_to_chars (p + 4, (valueT) descsz, 4);
8835
8836 /* Write n_type. */
8837 md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8838
8839 /* Write n_name. */
8840 memcpy (p + 4 * 3, "GNU", 4);
8841
8842 /* Write 4-byte type. */
8843 md_number_to_chars (p + 4 * 4,
8844 (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8845
8846 /* Write 4-byte data size. */
8847 md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8848
8849 /* Write 4-byte data. */
8850 md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8851
8852 /* Zero out the padding. */
8853 padding = isa_1_descsz - isa_1_descsz_raw;
8854 if (padding)
8855 memset (p + 4 * 7, 0, padding);
8856
8857 /* Write 4-byte type. */
8858 md_number_to_chars (p + isa_1_descsz + 4 * 4,
8859 (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8860
8861 /* Write 4-byte data size. */
8862 md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8863
8864 /* Write 4-byte data. */
8865 md_number_to_chars (p + isa_1_descsz + 4 * 6,
8866 (valueT) x86_feature_2_used, 4);
8867
8868 /* Zero out the padding. */
8869 padding = feature_2_descsz - feature_2_descsz_raw;
8870 if (padding)
8871 memset (p + isa_1_descsz + 4 * 7, 0, padding);
8872
8873 /* We probably can't restore the current segment, for there likely
8874 isn't one yet... */
8875 if (seg && subseg)
8876 subseg_set (seg, subseg);
8877 }
8878 #endif
8879
8880 static unsigned int
8881 encoding_length (const fragS *start_frag, offsetT start_off,
8882 const char *frag_now_ptr)
8883 {
8884 unsigned int len = 0;
8885
8886 if (start_frag != frag_now)
8887 {
8888 const fragS *fr = start_frag;
8889
8890 do {
8891 len += fr->fr_fix;
8892 fr = fr->fr_next;
8893 } while (fr && fr != frag_now);
8894 }
8895
8896 return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8897 }
8898
8899 /* Return 1 for test, and, cmp, add, sub, inc and dec, which may
8900 be macro-fused with conditional jumps.
8901 NB: If TEST/AND/CMP/ADD/SUB/INC/DEC uses a RIP-relative address,
8902 or has one of the following forms:
8903
8904 cmp m, imm
8905 add m, imm
8906 sub m, imm
8907 test m, imm
8908 and m, imm
8909 inc m
8910 dec m
8911
8912 it is not fusible. */
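/* For example, "cmp %eax, %ebx; jne target" remains fusible, while
   "cmpl $1, (%ecx); jne target" matches the "cmp m, imm" pattern
   above and is rejected.  */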
8913
8914 static int
8915 maybe_fused_with_jcc_p (enum mf_cmp_kind* mf_cmp_p)
8916 {
8917 /* No RIP address. */
8918 if (i.base_reg && i.base_reg->reg_num == RegIP)
8919 return 0;
8920
8921 /* No VEX/EVEX encoding. */
8922 if (is_any_vex_encoding (&i.tm))
8923 return 0;
8924
8925 /* add, sub without add/sub m, imm. */
8926 if (i.tm.base_opcode <= 5
8927 || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
8928 || ((i.tm.base_opcode | 3) == 0x83
8929 && (i.tm.extension_opcode == 0x5
8930 || i.tm.extension_opcode == 0x0)))
8931 {
8932 *mf_cmp_p = mf_cmp_alu_cmp;
8933 return !(i.mem_operands && i.imm_operands);
8934 }
8935
8936 /* and without and m, imm. */
8937 if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
8938 || ((i.tm.base_opcode | 3) == 0x83
8939 && i.tm.extension_opcode == 0x4))
8940 {
8941 *mf_cmp_p = mf_cmp_test_and;
8942 return !(i.mem_operands && i.imm_operands);
8943 }
8944
8945 /* test without test m imm. */
8946 if ((i.tm.base_opcode | 1) == 0x85
8947 || (i.tm.base_opcode | 1) == 0xa9
8948 || ((i.tm.base_opcode | 1) == 0xf7
8949 && i.tm.extension_opcode == 0))
8950 {
8951 *mf_cmp_p = mf_cmp_test_and;
8952 return !(i.mem_operands && i.imm_operands);
8953 }
8954
8955 /* cmp without cmp m, imm. */
8956 if ((i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
8957 || ((i.tm.base_opcode | 3) == 0x83
8958 && (i.tm.extension_opcode == 0x7)))
8959 {
8960 *mf_cmp_p = mf_cmp_alu_cmp;
8961 return !(i.mem_operands && i.imm_operands);
8962 }
8963
8964 /* inc, dec without inc/dec m. */
8965 if ((i.tm.cpu_flags.bitfield.cpuno64
8966 && (i.tm.base_opcode | 0xf) == 0x4f)
8967 || ((i.tm.base_opcode | 1) == 0xff
8968 && i.tm.extension_opcode <= 0x1))
8969 {
8970 *mf_cmp_p = mf_cmp_incdec;
8971 return !i.mem_operands;
8972 }
8973
8974 return 0;
8975 }
8976
8977 /* Return 1 if a FUSED_JCC_PADDING frag should be generated. */
8978
8979 static int
8980 add_fused_jcc_padding_frag_p (enum mf_cmp_kind* mf_cmp_p)
8981 {
8982 /* NB: This doesn't work with COND_JUMP86 without i386. */
8983 if (!align_branch_power
8984 || now_seg == absolute_section
8985 || !cpu_arch_flags.bitfield.cpui386
8986 || !(align_branch & align_branch_fused_bit))
8987 return 0;
8988
8989 if (maybe_fused_with_jcc_p (mf_cmp_p))
8990 {
8991 if (last_insn.kind == last_insn_other
8992 || last_insn.seg != now_seg)
8993 return 1;
8994 if (flag_debug)
8995 as_warn_where (last_insn.file, last_insn.line,
8996 _("`%s` skips -malign-branch-boundary on `%s`"),
8997 last_insn.name, i.tm.name);
8998 }
8999
9000 return 0;
9001 }
9002
9003 /* Return 1 if a BRANCH_PREFIX frag should be generated. */
9004
9005 static int
9006 add_branch_prefix_frag_p (void)
9007 {
9008 /* NB: This doesn't work with COND_JUMP86 without i386. Don't add a
9009 prefix to PadLock instructions since they include prefixes in the opcode. */
9010 if (!align_branch_power
9011 || !align_branch_prefix_size
9012 || now_seg == absolute_section
9013 || i.tm.cpu_flags.bitfield.cpupadlock
9014 || !cpu_arch_flags.bitfield.cpui386)
9015 return 0;
9016
9017 /* Don't add a prefix if the insn is itself a prefix, or if it has
9018 no operands, in which case a segment prefix may be special. */
9019 if (!i.operands || i.tm.opcode_modifier.isprefix)
9020 return 0;
9021
9022 if (last_insn.kind == last_insn_other
9023 || last_insn.seg != now_seg)
9024 return 1;
9025
9026 if (flag_debug)
9027 as_warn_where (last_insn.file, last_insn.line,
9028 _("`%s` skips -malign-branch-boundary on `%s`"),
9029 last_insn.name, i.tm.name);
9030
9031 return 0;
9032 }
9033
9034 /* Return 1 if a BRANCH_PADDING frag should be generated. */
9035
9036 static int
9037 add_branch_padding_frag_p (enum align_branch_kind *branch_p,
9038 enum mf_jcc_kind *mf_jcc_p)
9039 {
9040 int add_padding;
9041
9042 /* NB: This doesn't work with COND_JUMP86 without i386. */
9043 if (!align_branch_power
9044 || now_seg == absolute_section
9045 || !cpu_arch_flags.bitfield.cpui386)
9046 return 0;
9047
9048 add_padding = 0;
9049
9050 /* Check for jcc and direct jmp. */
9051 if (i.tm.opcode_modifier.jump == JUMP)
9052 {
9053 if (i.tm.base_opcode == JUMP_PC_RELATIVE)
9054 {
9055 *branch_p = align_branch_jmp;
9056 add_padding = align_branch & align_branch_jmp_bit;
9057 }
9058 else
9059 {
9060 /* Because J<cc> and JN<cc> share the same group in the
9061 macro-fusible table, ignore the lowest bit. */
9062 *mf_jcc_p = (i.tm.base_opcode & 0x0e) >> 1;
9063 *branch_p = align_branch_jcc;
9064 if ((align_branch & align_branch_jcc_bit))
9065 add_padding = 1;
9066 }
9067 }
9068 else if (is_any_vex_encoding (&i.tm))
9069 return 0;
9070 else if ((i.tm.base_opcode | 1) == 0xc3)
9071 {
9072 /* Near ret. */
9073 *branch_p = align_branch_ret;
9074 if ((align_branch & align_branch_ret_bit))
9075 add_padding = 1;
9076 }
9077 else
9078 {
9079 /* Check for indirect jmp, direct and indirect calls. */
9080 if (i.tm.base_opcode == 0xe8)
9081 {
9082 /* Direct call. */
9083 *branch_p = align_branch_call;
9084 if ((align_branch & align_branch_call_bit))
9085 add_padding = 1;
9086 }
9087 else if (i.tm.base_opcode == 0xff
9088 && (i.tm.extension_opcode == 2
9089 || i.tm.extension_opcode == 4))
9090 {
9091 /* Indirect call and jmp. */
9092 *branch_p = align_branch_indirect;
9093 if ((align_branch & align_branch_indirect_bit))
9094 add_padding = 1;
9095 }
9096
9097 if (add_padding
9098 && i.disp_operands
9099 && tls_get_addr
9100 && (i.op[0].disps->X_op == O_symbol
9101 || (i.op[0].disps->X_op == O_subtract
9102 && i.op[0].disps->X_op_symbol == GOT_symbol)))
9103 {
9104 symbolS *s = i.op[0].disps->X_add_symbol;
9105 /* No padding for calls to a global or undefined tls_get_addr. */
9106 if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
9107 && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
9108 return 0;
9109 }
9110 }
9111
9112 if (add_padding
9113 && last_insn.kind != last_insn_other
9114 && last_insn.seg == now_seg)
9115 {
9116 if (flag_debug)
9117 as_warn_where (last_insn.file, last_insn.line,
9118 _("`%s` skips -malign-branch-boundary on `%s`"),
9119 last_insn.name, i.tm.name);
9120 return 0;
9121 }
9122
9123 return add_padding;
9124 }
9125
9126 static void
9127 output_insn (void)
9128 {
9129 fragS *insn_start_frag;
9130 offsetT insn_start_off;
9131 fragS *fragP = NULL;
9132 enum align_branch_kind branch = align_branch_none;
9133 /* The initializer is arbitrary, just to avoid an uninitialized
9134 warning; the value is either assigned in add_branch_padding_frag_p
9135 or never used. */
9136 enum mf_jcc_kind mf_jcc = mf_jcc_jo;
9137
9138 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9139 if (IS_ELF && x86_used_note && now_seg != absolute_section)
9140 {
9141 if (i.tm.cpu_flags.bitfield.cpucmov)
9142 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_CMOV;
9143 if (i.tm.cpu_flags.bitfield.cpusse)
9144 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE;
9145 if (i.tm.cpu_flags.bitfield.cpusse2)
9146 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE2;
9147 if (i.tm.cpu_flags.bitfield.cpusse3)
9148 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE3;
9149 if (i.tm.cpu_flags.bitfield.cpussse3)
9150 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSSE3;
9151 if (i.tm.cpu_flags.bitfield.cpusse4_1)
9152 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_1;
9153 if (i.tm.cpu_flags.bitfield.cpusse4_2)
9154 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_2;
9155 if (i.tm.cpu_flags.bitfield.cpuavx)
9156 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX;
9157 if (i.tm.cpu_flags.bitfield.cpuavx2)
9158 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX2;
9159 if (i.tm.cpu_flags.bitfield.cpufma)
9160 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_FMA;
9161 if (i.tm.cpu_flags.bitfield.cpuavx512f)
9162 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512F;
9163 if (i.tm.cpu_flags.bitfield.cpuavx512cd)
9164 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512CD;
9165 if (i.tm.cpu_flags.bitfield.cpuavx512er)
9166 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512ER;
9167 if (i.tm.cpu_flags.bitfield.cpuavx512pf)
9168 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512PF;
9169 if (i.tm.cpu_flags.bitfield.cpuavx512vl)
9170 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512VL;
9171 if (i.tm.cpu_flags.bitfield.cpuavx512dq)
9172 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512DQ;
9173 if (i.tm.cpu_flags.bitfield.cpuavx512bw)
9174 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512BW;
9175 if (i.tm.cpu_flags.bitfield.cpuavx512_4fmaps)
9176 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4FMAPS;
9177 if (i.tm.cpu_flags.bitfield.cpuavx512_4vnniw)
9178 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4VNNIW;
9179 if (i.tm.cpu_flags.bitfield.cpuavx512_bitalg)
9180 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BITALG;
9181 if (i.tm.cpu_flags.bitfield.cpuavx512ifma)
9182 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_IFMA;
9183 if (i.tm.cpu_flags.bitfield.cpuavx512vbmi)
9184 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI;
9185 if (i.tm.cpu_flags.bitfield.cpuavx512_vbmi2)
9186 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI2;
9187 if (i.tm.cpu_flags.bitfield.cpuavx512_vnni)
9188 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VNNI;
9189 if (i.tm.cpu_flags.bitfield.cpuavx512_bf16)
9190 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BF16;
9191
9192 if (i.tm.cpu_flags.bitfield.cpu8087
9193 || i.tm.cpu_flags.bitfield.cpu287
9194 || i.tm.cpu_flags.bitfield.cpu387
9195 || i.tm.cpu_flags.bitfield.cpu687
9196 || i.tm.cpu_flags.bitfield.cpufisttp)
9197 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
9198 if ((i.xstate & xstate_mmx)
9199 || i.tm.base_opcode == 0xf77 /* emms */
9200 || i.tm.base_opcode == 0xf0e /* femms */)
9201 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
9202 if ((i.xstate & xstate_xmm))
9203 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
9204 if ((i.xstate & xstate_ymm) == xstate_ymm)
9205 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
9206 if ((i.xstate & xstate_zmm) == xstate_zmm)
9207 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
9208 if (i.tm.cpu_flags.bitfield.cpufxsr)
9209 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
9210 if (i.tm.cpu_flags.bitfield.cpuxsave)
9211 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
9212 if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
9213 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
9214 if (i.tm.cpu_flags.bitfield.cpuxsavec)
9215 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
9216
9217 if ((i.xstate & xstate_tmm) == xstate_tmm
9218 || i.tm.cpu_flags.bitfield.cpuamx_tile)
9219 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_TMM;
9220 }
9221 #endif
9222
9223 /* Tie dwarf2 debug info to the address at the start of the insn.
9224 We can't do this after the insn has been output as the current
9225 frag may have been closed off, e.g. by frag_var. */
9226 dwarf2_emit_insn (0);
9227
9228 insn_start_frag = frag_now;
9229 insn_start_off = frag_now_fix ();
9230
9231 if (add_branch_padding_frag_p (&branch, &mf_jcc))
9232 {
9233 char *p;
9234 /* Branch can be 8 bytes. Leave some room for prefixes. */
9235 unsigned int max_branch_padding_size = 14;
9236
9237 /* Align section to boundary. */
9238 record_alignment (now_seg, align_branch_power);
9239
9240 /* Make room for padding. */
9241 frag_grow (max_branch_padding_size);
9242
9243 /* Start of the padding. */
9244 p = frag_more (0);
9245
9246 fragP = frag_now;
9247
9248 frag_var (rs_machine_dependent, max_branch_padding_size, 0,
9249 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
9250 NULL, 0, p);
9251
9252 fragP->tc_frag_data.mf_type = mf_jcc;
9253 fragP->tc_frag_data.branch_type = branch;
9254 fragP->tc_frag_data.max_bytes = max_branch_padding_size;
9255 }
9256
9257 /* Output jumps. */
9258 if (i.tm.opcode_modifier.jump == JUMP)
9259 output_branch ();
9260 else if (i.tm.opcode_modifier.jump == JUMP_BYTE
9261 || i.tm.opcode_modifier.jump == JUMP_DWORD)
9262 output_jump ();
9263 else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
9264 output_interseg_jump ();
9265 else
9266 {
9267 /* Output normal instructions here. */
9268 char *p;
9269 unsigned char *q;
9270 unsigned int j;
9271 unsigned int prefix;
9272 enum mf_cmp_kind mf_cmp;
9273
9274 if (avoid_fence
9275 && (i.tm.base_opcode == 0xfaee8
9276 || i.tm.base_opcode == 0xfaef0
9277 || i.tm.base_opcode == 0xfaef8))
9278 {
9279 /* Encode lfence, mfence, and sfence as
9280 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
9281 if (now_seg != absolute_section)
9282 {
9283 offsetT val = 0x240483f0ULL;
9284
9285 p = frag_more (5);
9286 md_number_to_chars (p, val, 5);
9287 }
9288 else
9289 abs_section_offset += 5;
9290 return;
9291 }
9292
9293 /* Some processors fail on the LOCK prefix. This option makes the
9294 assembler ignore the LOCK prefix and serves as a workaround. */
9295 if (omit_lock_prefix)
9296 {
9297 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
9298 return;
9299 i.prefix[LOCK_PREFIX] = 0;
9300 }
9301
9302 if (branch)
9303 /* Skip if this is a branch. */
9304 ;
9305 else if (add_fused_jcc_padding_frag_p (&mf_cmp))
9306 {
9307 /* Make room for padding. */
9308 frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
9309 p = frag_more (0);
9310
9311 fragP = frag_now;
9312
9313 frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
9314 ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
9315 NULL, 0, p);
9316
9317 fragP->tc_frag_data.mf_type = mf_cmp;
9318 fragP->tc_frag_data.branch_type = align_branch_fused;
9319 fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
9320 }
9321 else if (add_branch_prefix_frag_p ())
9322 {
9323 unsigned int max_prefix_size = align_branch_prefix_size;
9324
9325 /* Make room for padding. */
9326 frag_grow (max_prefix_size);
9327 p = frag_more (0);
9328
9329 fragP = frag_now;
9330
9331 frag_var (rs_machine_dependent, max_prefix_size, 0,
9332 ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
9333 NULL, 0, p);
9334
9335 fragP->tc_frag_data.max_bytes = max_prefix_size;
9336 }
9337
9338 /* Since the VEX/EVEX prefix contains the implicit prefix, we
9339 don't need the explicit prefix. */
9340 if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
9341 {
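/* Illustrative example: for a 2-byte opcode with a mandatory 0x66
   prefix, the opcode table folds the prefix into base_opcode
   (0x66 in bits 16-23), so the length-2 case below peels it off
   and routes it through add_prefix () while the low two bytes
   remain the opcode proper.  */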
9342 switch (i.tm.opcode_length)
9343 {
9344 case 3:
9345 if (i.tm.base_opcode & 0xff000000)
9346 {
9347 prefix = (i.tm.base_opcode >> 24) & 0xff;
9348 if (!i.tm.cpu_flags.bitfield.cpupadlock
9349 || prefix != REPE_PREFIX_OPCODE
9350 || (i.prefix[REP_PREFIX] != REPE_PREFIX_OPCODE))
9351 add_prefix (prefix);
9352 }
9353 break;
9354 case 2:
9355 if ((i.tm.base_opcode & 0xff0000) != 0)
9356 {
9357 prefix = (i.tm.base_opcode >> 16) & 0xff;
9358 add_prefix (prefix);
9359 }
9360 break;
9361 case 1:
9362 break;
9363 case 0:
9364 /* Check for pseudo prefixes. */
9365 as_bad_where (insn_start_frag->fr_file,
9366 insn_start_frag->fr_line,
9367 _("pseudo prefix without instruction"));
9368 return;
9369 default:
9370 abort ();
9371 }
9372
9373 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
9374 /* For x32, add a dummy REX_OPCODE prefix for mov/add with
9375 R_X86_64_GOTTPOFF relocation so that linker can safely
9376 perform IE->LE optimization. A dummy REX_OPCODE prefix
9377 is also needed for lea with R_X86_64_GOTPC32_TLSDESC
9378 relocation for GDesc -> IE/LE optimization. */
9379 if (x86_elf_abi == X86_64_X32_ABI
9380 && i.operands == 2
9381 && (i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
9382 || i.reloc[0] == BFD_RELOC_X86_64_GOTPC32_TLSDESC)
9383 && i.prefix[REX_PREFIX] == 0)
9384 add_prefix (REX_OPCODE);
9385 #endif
9386
9387 /* The prefix bytes. */
9388 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
9389 if (*q)
9390 frag_opcode_byte (*q);
9391 }
9392 else
9393 {
9394 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
9395 if (*q)
9396 switch (j)
9397 {
9398 case SEG_PREFIX:
9399 case ADDR_PREFIX:
9400 frag_opcode_byte (*q);
9401 break;
9402 default:
9403 /* There should be no other prefixes for instructions
9404 with VEX prefix. */
9405 abort ();
9406 }
9407
9408 /* For EVEX instructions i.vrex should become 0 after
9409 build_evex_prefix. For VEX instructions the upper 16 registers
9410 aren't available, so VREX should be 0. */
9411 if (i.vrex)
9412 abort ();
9413 /* Now the VEX prefix. */
9414 if (now_seg != absolute_section)
9415 {
9416 p = frag_more (i.vex.length);
9417 for (j = 0; j < i.vex.length; j++)
9418 p[j] = i.vex.bytes[j];
9419 }
9420 else
9421 abs_section_offset += i.vex.length;
9422 }
9423
9424 /* Now the opcode; be careful about word order here! */
9425 if (now_seg == absolute_section)
9426 abs_section_offset += i.tm.opcode_length;
9427 else if (i.tm.opcode_length == 1)
9428 {
9429 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
9430 }
9431 else
9432 {
9433 switch (i.tm.opcode_length)
9434 {
9435 case 4:
9436 p = frag_more (4);
9437 *p++ = (i.tm.base_opcode >> 24) & 0xff;
9438 *p++ = (i.tm.base_opcode >> 16) & 0xff;
9439 break;
9440 case 3:
9441 p = frag_more (3);
9442 *p++ = (i.tm.base_opcode >> 16) & 0xff;
9443 break;
9444 case 2:
9445 p = frag_more (2);
9446 break;
9447 default:
9448 abort ();
9449 break;
9450 }
9451
9452 /* Put out high byte first: can't use md_number_to_chars! */
9453 *p++ = (i.tm.base_opcode >> 8) & 0xff;
9454 *p = i.tm.base_opcode & 0xff;
9455 }
9456
9457 /* Now the modrm byte and sib byte (if present). */
9458 if (i.tm.opcode_modifier.modrm)
9459 {
9460 frag_opcode_byte ((i.rm.regmem << 0)
9461 | (i.rm.reg << 3)
9462 | (i.rm.mode << 6));
9463 /* If i.rm.regmem == ESP (4)
9464 && i.rm.mode != (Register mode)
9465 && not 16 bit
9466 ==> need second modrm byte. */
9467 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
9468 && i.rm.mode != 3
9469 && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
9470 frag_opcode_byte ((i.sib.base << 0)
9471 | (i.sib.index << 3)
9472 | (i.sib.scale << 6));
9473 }
9474
9475 if (i.disp_operands)
9476 output_disp (insn_start_frag, insn_start_off);
9477
9478 if (i.imm_operands)
9479 output_imm (insn_start_frag, insn_start_off);
9480
9481 /*
9482 * frag_now_fix () returning plain abs_section_offset when we're in the
9483 * absolute section, and abs_section_offset not getting updated as data
9484 * gets added to the frag breaks the logic below.
9485 */
9486 if (now_seg != absolute_section)
9487 {
9488 j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
9489 if (j > 15)
9490 as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
9491 j);
9492 else if (fragP)
9493 {
9494 /* NB: Don't add prefix with GOTPC relocation since
9495 output_disp() above depends on the fixed encoding
9496 length. Can't add prefix with TLS relocation since
9497 it breaks TLS linker optimization. */
9498 unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
9499 /* Prefix count on the current instruction. */
9500 unsigned int count = i.vex.length;
9501 unsigned int k;
9502 for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
9503 /* REX byte is encoded in VEX/EVEX prefix. */
9504 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
9505 count++;
9506
9507 /* Count prefixes for extended opcode maps. */
9508 if (!i.vex.length)
9509 switch (i.tm.opcode_length)
9510 {
9511 case 3:
9512 if (((i.tm.base_opcode >> 16) & 0xff) == 0xf)
9513 {
9514 count++;
9515 switch ((i.tm.base_opcode >> 8) & 0xff)
9516 {
9517 case 0x38:
9518 case 0x3a:
9519 count++;
9520 break;
9521 default:
9522 break;
9523 }
9524 }
9525 break;
9526 case 2:
9527 if (((i.tm.base_opcode >> 8) & 0xff) == 0xf)
9528 count++;
9529 break;
9530 case 1:
9531 break;
9532 default:
9533 abort ();
9534 }
9535
9536 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
9537 == BRANCH_PREFIX)
9538 {
9539 /* Set the maximum prefix size in BRANCH_PREFIX
9540 frag. */
9541 if (fragP->tc_frag_data.max_bytes > max)
9542 fragP->tc_frag_data.max_bytes = max;
9543 if (fragP->tc_frag_data.max_bytes > count)
9544 fragP->tc_frag_data.max_bytes -= count;
9545 else
9546 fragP->tc_frag_data.max_bytes = 0;
9547 }
9548 else
9549 {
9550 /* Remember the maximum prefix size in FUSED_JCC_PADDING
9551 frag. */
9552 unsigned int max_prefix_size;
9553 if (align_branch_prefix_size > max)
9554 max_prefix_size = max;
9555 else
9556 max_prefix_size = align_branch_prefix_size;
9557 if (max_prefix_size > count)
9558 fragP->tc_frag_data.max_prefix_length
9559 = max_prefix_size - count;
9560 }
9561
9562 /* Use existing segment prefix if possible. Use CS
9563 segment prefix in 64-bit mode. In 32-bit mode, use SS
9564 segment prefix with ESP/EBP base register and use DS
9565 segment prefix without ESP/EBP base register. */
9566 if (i.prefix[SEG_PREFIX])
9567 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
9568 else if (flag_code == CODE_64BIT)
9569 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
9570 else if (i.base_reg
9571 && (i.base_reg->reg_num == 4
9572 || i.base_reg->reg_num == 5))
9573 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
9574 else
9575 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
9576 }
9577 }
9578 }
9579
9580 /* NB: This doesn't work with COND_JUMP86 without i386. */
9581 if (align_branch_power
9582 && now_seg != absolute_section
9583 && cpu_arch_flags.bitfield.cpui386)
9584 {
9585 /* Terminate each frag so that we can add prefix and check for
9586 fused jcc. */
9587 frag_wane (frag_now);
9588 frag_new (0);
9589 }
9590
9591 #ifdef DEBUG386
9592 if (flag_debug)
9593 {
9594 pi ("" /*line*/, &i);
9595 }
9596 #endif /* DEBUG386 */
9597 }
9598
9599 /* Return the size of the displacement operand N. */
9600
9601 static int
9602 disp_size (unsigned int n)
9603 {
9604 int size = 4;
9605
9606 if (i.types[n].bitfield.disp64)
9607 size = 8;
9608 else if (i.types[n].bitfield.disp8)
9609 size = 1;
9610 else if (i.types[n].bitfield.disp16)
9611 size = 2;
9612 return size;
9613 }
9614
9615 /* Return the size of the immediate operand N. */
9616
9617 static int
9618 imm_size (unsigned int n)
9619 {
9620 int size = 4;
9621 if (i.types[n].bitfield.imm64)
9622 size = 8;
9623 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
9624 size = 1;
9625 else if (i.types[n].bitfield.imm16)
9626 size = 2;
9627 return size;
9628 }
9629
9630 static void
9631 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
9632 {
9633 char *p;
9634 unsigned int n;
9635
9636 for (n = 0; n < i.operands; n++)
9637 {
9638 if (operand_type_check (i.types[n], disp))
9639 {
9640 int size = disp_size (n);
9641
9642 if (now_seg == absolute_section)
9643 abs_section_offset += size;
9644 else if (i.op[n].disps->X_op == O_constant)
9645 {
9646 offsetT val = i.op[n].disps->X_add_number;
9647
9648 val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
9649 size);
9650 p = frag_more (size);
9651 md_number_to_chars (p, val, size);
9652 }
9653 else
9654 {
9655 enum bfd_reloc_code_real reloc_type;
9656 int sign = i.types[n].bitfield.disp32s;
9657 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
9658 fixS *fixP;
9659
9660 /* We can't have an 8-bit displacement here. */
9661 gas_assert (!i.types[n].bitfield.disp8);
9662
9663 /* The PC-relative address is computed relative
9664 to the instruction boundary, so if immediate
9665 fields follow, we need to adjust the value. */
9666 if (pcrel && i.imm_operands)
9667 {
9668 unsigned int n1;
9669 int sz = 0;
9670
9671 for (n1 = 0; n1 < i.operands; n1++)
9672 if (operand_type_check (i.types[n1], imm))
9673 {
9674 /* Only one immediate is allowed for a
9675 PC-relative address. */
9676 gas_assert (sz == 0);
9677 sz = imm_size (n1);
9678 i.op[n].disps->X_add_number -= sz;
9679 }
9680 /* We should have found the immediate. */
9681 gas_assert (sz != 0);
9682 }
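/* For example (an illustrative case): in "testl $0x12345678,
foo(%rip)" the 4-byte immediate follows the 4-byte displacement,
so 4 is subtracted from the addend here to keep the fixup
relative to the end of the instruction. */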
9683
9684 p = frag_more (size);
9685 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
9686 if (GOT_symbol
9687 && GOT_symbol == i.op[n].disps->X_add_symbol
9688 && (((reloc_type == BFD_RELOC_32
9689 || reloc_type == BFD_RELOC_X86_64_32S
9690 || (reloc_type == BFD_RELOC_64
9691 && object_64bit))
9692 && (i.op[n].disps->X_op == O_symbol
9693 || (i.op[n].disps->X_op == O_add
9694 && ((symbol_get_value_expression
9695 (i.op[n].disps->X_op_symbol)->X_op)
9696 == O_subtract))))
9697 || reloc_type == BFD_RELOC_32_PCREL))
9698 {
9699 if (!object_64bit)
9700 {
9701 reloc_type = BFD_RELOC_386_GOTPC;
9702 i.has_gotpc_tls_reloc = TRUE;
9703 i.op[n].imms->X_add_number +=
9704 encoding_length (insn_start_frag, insn_start_off, p);
9705 }
9706 else if (reloc_type == BFD_RELOC_64)
9707 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9708 else
9709 /* Don't do the adjustment for x86-64, as there
9710 the pcrel addressing is relative to the _next_
9711 insn, and that is taken care of in other code. */
9712 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9713 }
9714 else if (align_branch_power)
9715 {
9716 switch (reloc_type)
9717 {
9718 case BFD_RELOC_386_TLS_GD:
9719 case BFD_RELOC_386_TLS_LDM:
9720 case BFD_RELOC_386_TLS_IE:
9721 case BFD_RELOC_386_TLS_IE_32:
9722 case BFD_RELOC_386_TLS_GOTIE:
9723 case BFD_RELOC_386_TLS_GOTDESC:
9724 case BFD_RELOC_386_TLS_DESC_CALL:
9725 case BFD_RELOC_X86_64_TLSGD:
9726 case BFD_RELOC_X86_64_TLSLD:
9727 case BFD_RELOC_X86_64_GOTTPOFF:
9728 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9729 case BFD_RELOC_X86_64_TLSDESC_CALL:
9730 i.has_gotpc_tls_reloc = TRUE;
9731 default:
9732 break;
9733 }
9734 }
9735 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
9736 size, i.op[n].disps, pcrel,
9737 reloc_type);
9738 /* Check for "call/jmp *mem", "mov mem, %reg",
9739 "test %reg, mem" and "binop mem, %reg" where binop
9740 is one of adc, add, and, cmp, or, sbb, sub, xor
9741 instructions without data prefix. Always generate
9742 R_386_GOT32X for "sym*GOT" operand in 32-bit mode. */
9743 if (i.prefix[DATA_PREFIX] == 0
9744 && (generate_relax_relocations
9745 || (!object_64bit
9746 && i.rm.mode == 0
9747 && i.rm.regmem == 5))
9748 && (i.rm.mode == 2
9749 || (i.rm.mode == 0 && i.rm.regmem == 5))
9750 && !is_any_vex_encoding (&i.tm)
9751 && ((i.operands == 1
9752 && i.tm.base_opcode == 0xff
9753 && (i.rm.reg == 2 || i.rm.reg == 4))
9754 || (i.operands == 2
9755 && (i.tm.base_opcode == 0x8b
9756 || i.tm.base_opcode == 0x85
9757 || (i.tm.base_opcode & ~0x38) == 0x03))))
9758 {
9759 if (object_64bit)
9760 {
9761 fixP->fx_tcbit = i.rex != 0;
9762 if (i.base_reg
9763 && (i.base_reg->reg_num == RegIP))
9764 fixP->fx_tcbit2 = 1;
9765 }
9766 else
9767 fixP->fx_tcbit2 = 1;
9768 }
9769 }
9770 }
9771 }
9772 }
9773
9774 static void
9775 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
9776 {
9777 char *p;
9778 unsigned int n;
9779
9780 for (n = 0; n < i.operands; n++)
9781 {
9782 /* Skip the SAE/RC immediate operand in EVEX; it has already been handled. */
9783 if (i.rounding && (int) n == i.rounding->operand)
9784 continue;
9785
9786 if (operand_type_check (i.types[n], imm))
9787 {
9788 int size = imm_size (n);
9789
9790 if (now_seg == absolute_section)
9791 abs_section_offset += size;
9792 else if (i.op[n].imms->X_op == O_constant)
9793 {
9794 offsetT val;
9795
9796 val = offset_in_range (i.op[n].imms->X_add_number,
9797 size);
9798 p = frag_more (size);
9799 md_number_to_chars (p, val, size);
9800 }
9801 else
9802 {
9803 /* Not absolute_section.
9804 We need a fixup here; 8-bit non-absolute
9805 immediates are not supported, but we try to
9806 support the other sizes ... */
9807 enum bfd_reloc_code_real reloc_type;
9808 int sign;
9809
9810 if (i.types[n].bitfield.imm32s
9811 && (i.suffix == QWORD_MNEM_SUFFIX
9812 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
9813 sign = 1;
9814 else
9815 sign = 0;
9816
9817 p = frag_more (size);
9818 reloc_type = reloc (size, 0, sign, i.reloc[n]);
9819
9820 /* This is tough to explain. We end up with this one if we
9821 * have operands that look like
9822 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
9823 * obtain the absolute address of the GOT, and it is strongly
9824 * preferable from a performance point of view to avoid using
9825 * a runtime relocation for this. The actual sequence of
9826 * instructions often looks something like:
9827 *
9828 * call .L66
9829 * .L66:
9830 * popl %ebx
9831 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
9832 *
9833 * The call and pop essentially return the absolute address
9834 * of the label .L66 and store it in %ebx. The linker itself
9835 * will ultimately change the first operand of the addl so
9836 * that %ebx points to the GOT, but to keep things simple, the
9837 * .o file must have this operand set so that it generates not
9838 * the absolute address of .L66, but the absolute address of
9839 * itself. This allows the linker to simply treat a GOTPC
9840 * relocation as asking for a pcrel offset to the GOT to be
9841 * added in, and the addend of the relocation is stored in the
9842 * operand field for the instruction itself.
9843 *
9844 * Our job here is to fix the operand so that it would add
9845 * the correct offset so that %ebx would point to itself. The
9846 * thing that is tricky is that .-.L66 will point to the
9847 * beginning of the instruction, so we need to further modify
9848 * the operand so that it will point to itself. There are
9849 * other cases where you have something like:
9850 *
9851 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
9852 *
9853 * and here no correction would be required. Internally in
9854 * the assembler we treat operands of this form as not being
9855 * pcrel since the '.' is explicitly mentioned, and I wonder
9856 * whether it would simplify matters to do it this way. Who
9857 * knows. In earlier versions of the PIC patches, the
9858 * pcrel_adjust field was used to store the correction, but
9859 * since the expression is not pcrel, I felt it would be
9860 * confusing to do it this way. */
9861
9862 if ((reloc_type == BFD_RELOC_32
9863 || reloc_type == BFD_RELOC_X86_64_32S
9864 || reloc_type == BFD_RELOC_64)
9865 && GOT_symbol
9866 && GOT_symbol == i.op[n].imms->X_add_symbol
9867 && (i.op[n].imms->X_op == O_symbol
9868 || (i.op[n].imms->X_op == O_add
9869 && ((symbol_get_value_expression
9870 (i.op[n].imms->X_op_symbol)->X_op)
9871 == O_subtract))))
9872 {
9873 if (!object_64bit)
9874 reloc_type = BFD_RELOC_386_GOTPC;
9875 else if (size == 4)
9876 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9877 else if (size == 8)
9878 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9879 i.has_gotpc_tls_reloc = TRUE;
9880 i.op[n].imms->X_add_number +=
9881 encoding_length (insn_start_frag, insn_start_off, p);
9882 }
9883 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9884 i.op[n].imms, 0, reloc_type);
9885 }
9886 }
9887 }
9888 }
9889 \f
9890 /* x86_cons_fix_new is called via the expression parsing code when a
9891 reloc is needed. We use this hook to get the correct .got reloc. */
9892 static int cons_sign = -1;
9893
9894 void
9895 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
9896 expressionS *exp, bfd_reloc_code_real_type r)
9897 {
9898 r = reloc (len, 0, cons_sign, r);
9899
9900 #ifdef TE_PE
9901 if (exp->X_op == O_secrel)
9902 {
9903 exp->X_op = O_symbol;
9904 r = BFD_RELOC_32_SECREL;
9905 }
9906 #endif
9907
9908 fix_new_exp (frag, off, len, exp, 0, r);
9909 }
9910
9911 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
9912 purpose of the `.dc.a' internal pseudo-op. */
9913
9914 int
9915 x86_address_bytes (void)
9916 {
9917 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
9918 return 4;
9919 return stdoutput->arch_info->bits_per_address / 8;
9920 }
9921
9922 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
9923 || defined (LEX_AT)
9924 # define lex_got(reloc, adjust, types) NULL
9925 #else
9926 /* Parse operands of the form
9927 <symbol>@GOTOFF+<nnn>
9928 and similar .plt or .got references.
9929
9930 If we find one, set up the correct relocation in RELOC and copy the
9931 input string, minus the `@GOTOFF' into a malloc'd buffer for
9932 parsing by the calling routine. Return this buffer, and if ADJUST
9933 is non-null set it to the length of the string we removed from the
9934 input line. Otherwise return NULL. */
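/* For example (illustrative), given the input "foo@GOTOFF(%ebx)" in
32-bit mode, the returned buffer holds "foo (%ebx)", *REL is set to
BFD_RELOC_386_GOTOFF, and *ADJUST to 6 ("@GOTOFF" having been
replaced by a single blank). */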
9935 static char *
9936 lex_got (enum bfd_reloc_code_real *rel,
9937 int *adjust,
9938 i386_operand_type *types)
9939 {
9940 /* Some of the relocations depend on the size of the field to
9941 be relocated. But in our callers i386_immediate and i386_displacement
9942 we don't yet know the operand size (this will be set by insn
9943 matching). Hence we record the word32 relocation here,
9944 and adjust the reloc according to the real size in reloc(). */
9945 static const struct {
9946 const char *str;
9947 int len;
9948 const enum bfd_reloc_code_real rel[2];
9949 const i386_operand_type types64;
9950 } gotrel[] = {
9951 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9952 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
9953 BFD_RELOC_SIZE32 },
9954 OPERAND_TYPE_IMM32_64 },
9955 #endif
9956 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
9957 BFD_RELOC_X86_64_PLTOFF64 },
9958 OPERAND_TYPE_IMM64 },
9959 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
9960 BFD_RELOC_X86_64_PLT32 },
9961 OPERAND_TYPE_IMM32_32S_DISP32 },
9962 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
9963 BFD_RELOC_X86_64_GOTPLT64 },
9964 OPERAND_TYPE_IMM64_DISP64 },
9965 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
9966 BFD_RELOC_X86_64_GOTOFF64 },
9967 OPERAND_TYPE_IMM64_DISP64 },
9968 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
9969 BFD_RELOC_X86_64_GOTPCREL },
9970 OPERAND_TYPE_IMM32_32S_DISP32 },
9971 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
9972 BFD_RELOC_X86_64_TLSGD },
9973 OPERAND_TYPE_IMM32_32S_DISP32 },
9974 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
9975 _dummy_first_bfd_reloc_code_real },
9976 OPERAND_TYPE_NONE },
9977 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
9978 BFD_RELOC_X86_64_TLSLD },
9979 OPERAND_TYPE_IMM32_32S_DISP32 },
9980 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
9981 BFD_RELOC_X86_64_GOTTPOFF },
9982 OPERAND_TYPE_IMM32_32S_DISP32 },
9983 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
9984 BFD_RELOC_X86_64_TPOFF32 },
9985 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9986 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
9987 _dummy_first_bfd_reloc_code_real },
9988 OPERAND_TYPE_NONE },
9989 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
9990 BFD_RELOC_X86_64_DTPOFF32 },
9991 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9992 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
9993 _dummy_first_bfd_reloc_code_real },
9994 OPERAND_TYPE_NONE },
9995 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
9996 _dummy_first_bfd_reloc_code_real },
9997 OPERAND_TYPE_NONE },
9998 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
9999 BFD_RELOC_X86_64_GOT32 },
10000 OPERAND_TYPE_IMM32_32S_64_DISP32 },
10001 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
10002 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
10003 OPERAND_TYPE_IMM32_32S_DISP32 },
10004 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
10005 BFD_RELOC_X86_64_TLSDESC_CALL },
10006 OPERAND_TYPE_IMM32_32S_DISP32 },
10007 };
10008 char *cp;
10009 unsigned int j;
10010
10011 #if defined (OBJ_MAYBE_ELF)
10012 if (!IS_ELF)
10013 return NULL;
10014 #endif
10015
10016 for (cp = input_line_pointer; *cp != '@'; cp++)
10017 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
10018 return NULL;
10019
10020 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
10021 {
10022 int len = gotrel[j].len;
10023 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
10024 {
10025 if (gotrel[j].rel[object_64bit] != 0)
10026 {
10027 int first, second;
10028 char *tmpbuf, *past_reloc;
10029
10030 *rel = gotrel[j].rel[object_64bit];
10031
10032 if (types)
10033 {
10034 if (flag_code != CODE_64BIT)
10035 {
10036 types->bitfield.imm32 = 1;
10037 types->bitfield.disp32 = 1;
10038 }
10039 else
10040 *types = gotrel[j].types64;
10041 }
10042
10043 if (j != 0 && GOT_symbol == NULL)
10044 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
10045
10046 /* The length of the first part of our input line. */
10047 first = cp - input_line_pointer;
10048
10049 /* The second part goes from after the reloc token until
10050 (and including) an end_of_line char or comma. */
10051 past_reloc = cp + 1 + len;
10052 cp = past_reloc;
10053 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10054 ++cp;
10055 second = cp + 1 - past_reloc;
10056
10057 /* Allocate and copy string. The trailing NUL shouldn't
10058 be necessary, but be safe. */
10059 tmpbuf = XNEWVEC (char, first + second + 2);
10060 memcpy (tmpbuf, input_line_pointer, first);
10061 if (second != 0 && *past_reloc != ' ')
10062 /* Replace the relocation token with ' ', so that
10063 errors like foo@GOTOFF1 will be detected. */
10064 tmpbuf[first++] = ' ';
10065 else
10066 /* Increment length by 1 if the relocation token is
10067 removed. */
10068 len++;
10069 if (adjust)
10070 *adjust = len;
10071 memcpy (tmpbuf + first, past_reloc, second);
10072 tmpbuf[first + second] = '\0';
10073 return tmpbuf;
10074 }
10075
10076 as_bad (_("@%s reloc is not supported with %d-bit output format"),
10077 gotrel[j].str, 1 << (5 + object_64bit));
10078 return NULL;
10079 }
10080 }
10081
10082 /* Might be a symbol version string. Don't as_bad here. */
10083 return NULL;
10084 }
10085 #endif
10086
10087 #ifdef TE_PE
10088 #ifdef lex_got
10089 #undef lex_got
10090 #endif
10091 /* Parse operands of the form
10092 <symbol>@SECREL32+<nnn>
10093
10094 If we find one, set up the correct relocation in RELOC and copy the
10095 input string, minus the `@SECREL32' into a malloc'd buffer for
10096 parsing by the calling routine. Return this buffer, and if ADJUST
10097 is non-null set it to the length of the string we removed from the
10098 input line. Otherwise return NULL.
10099
10100 This function is copied from the ELF version above, adjusted for PE targets. */
10101
10102 static char *
10103 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
10104 int *adjust ATTRIBUTE_UNUSED,
10105 i386_operand_type *types)
10106 {
10107 static const struct
10108 {
10109 const char *str;
10110 int len;
10111 const enum bfd_reloc_code_real rel[2];
10112 const i386_operand_type types64;
10113 }
10114 gotrel[] =
10115 {
10116 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
10117 BFD_RELOC_32_SECREL },
10118 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
10119 };
10120
10121 char *cp;
10122 unsigned j;
10123
10124 for (cp = input_line_pointer; *cp != '@'; cp++)
10125 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
10126 return NULL;
10127
10128 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
10129 {
10130 int len = gotrel[j].len;
10131
10132 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
10133 {
10134 if (gotrel[j].rel[object_64bit] != 0)
10135 {
10136 int first, second;
10137 char *tmpbuf, *past_reloc;
10138
10139 *rel = gotrel[j].rel[object_64bit];
10140 if (adjust)
10141 *adjust = len;
10142
10143 if (types)
10144 {
10145 if (flag_code != CODE_64BIT)
10146 {
10147 types->bitfield.imm32 = 1;
10148 types->bitfield.disp32 = 1;
10149 }
10150 else
10151 *types = gotrel[j].types64;
10152 }
10153
10154 /* The length of the first part of our input line. */
10155 first = cp - input_line_pointer;
10156
10157 /* The second part goes from after the reloc token until
10158 (and including) an end_of_line char or comma. */
10159 past_reloc = cp + 1 + len;
10160 cp = past_reloc;
10161 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10162 ++cp;
10163 second = cp + 1 - past_reloc;
10164
10165 /* Allocate and copy string. The trailing NUL shouldn't
10166 be necessary, but be safe. */
10167 tmpbuf = XNEWVEC (char, first + second + 2);
10168 memcpy (tmpbuf, input_line_pointer, first);
10169 if (second != 0 && *past_reloc != ' ')
10170 /* Replace the relocation token with ' ', so that
10171 errors like foo@SECREL321 will be detected. */
10172 tmpbuf[first++] = ' ';
10173 memcpy (tmpbuf + first, past_reloc, second);
10174 tmpbuf[first + second] = '\0';
10175 return tmpbuf;
10176 }
10177
10178 as_bad (_("@%s reloc is not supported with %d-bit output format"),
10179 gotrel[j].str, 1 << (5 + object_64bit));
10180 return NULL;
10181 }
10182 }
10183
10184 /* Might be a symbol version string. Don't as_bad here. */
10185 return NULL;
10186 }
10187
10188 #endif /* TE_PE */
10189
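/* Parse an expression for a data directive such as ".long", handling
@-suffixed relocation operators (e.g. ".long foo@GOTOFF") via
lex_got. Returns the relocation type to use, or NO_RELOC. */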
10190 bfd_reloc_code_real_type
10191 x86_cons (expressionS *exp, int size)
10192 {
10193 bfd_reloc_code_real_type got_reloc = NO_RELOC;
10194
10195 intel_syntax = -intel_syntax;
10196
10197 exp->X_md = 0;
10198 if (size == 4 || (object_64bit && size == 8))
10199 {
10200 /* Handle @GOTOFF and the like in an expression. */
10201 char *save;
10202 char *gotfree_input_line;
10203 int adjust = 0;
10204
10205 save = input_line_pointer;
10206 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
10207 if (gotfree_input_line)
10208 input_line_pointer = gotfree_input_line;
10209
10210 expression (exp);
10211
10212 if (gotfree_input_line)
10213 {
10214 /* expression () has merrily parsed up to the end of line,
10215 or a comma - in the wrong buffer. Transfer how far
10216 input_line_pointer has moved to the right buffer. */
10217 input_line_pointer = (save
10218 + (input_line_pointer - gotfree_input_line)
10219 + adjust);
10220 free (gotfree_input_line);
10221 if (exp->X_op == O_constant
10222 || exp->X_op == O_absent
10223 || exp->X_op == O_illegal
10224 || exp->X_op == O_register
10225 || exp->X_op == O_big)
10226 {
10227 char c = *input_line_pointer;
10228 *input_line_pointer = 0;
10229 as_bad (_("missing or invalid expression `%s'"), save);
10230 *input_line_pointer = c;
10231 }
10232 else if ((got_reloc == BFD_RELOC_386_PLT32
10233 || got_reloc == BFD_RELOC_X86_64_PLT32)
10234 && exp->X_op != O_symbol)
10235 {
10236 char c = *input_line_pointer;
10237 *input_line_pointer = 0;
10238 as_bad (_("invalid PLT expression `%s'"), save);
10239 *input_line_pointer = c;
10240 }
10241 }
10242 }
10243 else
10244 expression (exp);
10245
10246 intel_syntax = -intel_syntax;
10247
10248 if (intel_syntax)
10249 i386_intel_simplify (exp);
10250
10251 return got_reloc;
10252 }
10253
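/* Like cons(), but mark the expression as signed in 64-bit mode so
that reloc() can pick a signed relocation; presumably wired to a
pseudo-op such as ".slong" elsewhere in this file. */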
10254 static void
10255 signed_cons (int size)
10256 {
10257 if (flag_code == CODE_64BIT)
10258 cons_sign = 1;
10259 cons (size);
10260 cons_sign = -1;
10261 }
10262
10263 #ifdef TE_PE
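/* Handler for the PE section-relative data directive (presumably
".secrel32"): emit each expression in the comma-separated list as a
32-bit section-relative value, e.g. ".secrel32 sym1, sym2". */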
10264 static void
10265 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
10266 {
10267 expressionS exp;
10268
10269 do
10270 {
10271 expression (&exp);
10272 if (exp.X_op == O_symbol)
10273 exp.X_op = O_secrel;
10274
10275 emit_expr (&exp, 4);
10276 }
10277 while (*input_line_pointer++ == ',');
10278
10279 input_line_pointer--;
10280 demand_empty_rest_of_line ();
10281 }
10282 #endif
10283
10284 /* Handle Vector operations. */
10285
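/* The AVX512 operand decorations parsed here include, for example:
{1to8}  embedded broadcast:  vaddpd (%rax){1to8}, %zmm1, %zmm2
{%k1}   write mask:          vmovaps %zmm0, %zmm1{%k1}
{z}     zeroing-masking:     vmovaps %zmm0, %zmm1{%k1}{z}  */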
10286 static char *
10287 check_VecOperations (char *op_string, char *op_end)
10288 {
10289 const reg_entry *mask;
10290 const char *saved;
10291 char *end_op;
10292
10293 while (*op_string
10294 && (op_end == NULL || op_string < op_end))
10295 {
10296 saved = op_string;
10297 if (*op_string == '{')
10298 {
10299 op_string++;
10300
10301 /* Check broadcasts. */
10302 if (strncmp (op_string, "1to", 3) == 0)
10303 {
10304 int bcst_type;
10305
10306 if (i.broadcast)
10307 goto duplicated_vec_op;
10308
10309 op_string += 3;
10310 if (*op_string == '8')
10311 bcst_type = 8;
10312 else if (*op_string == '4')
10313 bcst_type = 4;
10314 else if (*op_string == '2')
10315 bcst_type = 2;
10316 else if (*op_string == '1'
10317 && *(op_string+1) == '6')
10318 {
10319 bcst_type = 16;
10320 op_string++;
10321 }
10322 else
10323 {
10324 as_bad (_("Unsupported broadcast: `%s'"), saved);
10325 return NULL;
10326 }
10327 op_string++;
10328
10329 broadcast_op.type = bcst_type;
10330 broadcast_op.operand = this_operand;
10331 broadcast_op.bytes = 0;
10332 i.broadcast = &broadcast_op;
10333 }
10334 /* Check masking operation. */
10335 else if ((mask = parse_register (op_string, &end_op)) != NULL)
10336 {
10337 if (mask == &bad_reg)
10338 return NULL;
10339
10340 /* k0 can't be used for write mask. */
10341 if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
10342 {
10343 as_bad (_("`%s%s' can't be used for write mask"),
10344 register_prefix, mask->reg_name);
10345 return NULL;
10346 }
10347
10348 if (!i.mask)
10349 {
10350 mask_op.mask = mask;
10351 mask_op.zeroing = 0;
10352 mask_op.operand = this_operand;
10353 i.mask = &mask_op;
10354 }
10355 else
10356 {
10357 if (i.mask->mask)
10358 goto duplicated_vec_op;
10359
10360 i.mask->mask = mask;
10361
10362 /* Only "{z}" is allowed here. No need to check
10363 zeroing mask explicitly. */
10364 if (i.mask->operand != this_operand)
10365 {
10366 as_bad (_("invalid write mask `%s'"), saved);
10367 return NULL;
10368 }
10369 }
10370
10371 op_string = end_op;
10372 }
10373 /* Check zeroing-flag for masking operation. */
10374 else if (*op_string == 'z')
10375 {
10376 if (!i.mask)
10377 {
10378 mask_op.mask = NULL;
10379 mask_op.zeroing = 1;
10380 mask_op.operand = this_operand;
10381 i.mask = &mask_op;
10382 }
10383 else
10384 {
10385 if (i.mask->zeroing)
10386 {
10387 duplicated_vec_op:
10388 as_bad (_("duplicated `%s'"), saved);
10389 return NULL;
10390 }
10391
10392 i.mask->zeroing = 1;
10393
10394 /* Only "{%k}" is allowed here. No need to check mask
10395 register explicitly. */
10396 if (i.mask->operand != this_operand)
10397 {
10398 as_bad (_("invalid zeroing-masking `%s'"),
10399 saved);
10400 return NULL;
10401 }
10402 }
10403
10404 op_string++;
10405 }
10406 else
10407 goto unknown_vec_op;
10408
10409 if (*op_string != '}')
10410 {
10411 as_bad (_("missing `}' in `%s'"), saved);
10412 return NULL;
10413 }
10414 op_string++;
10415
10416 /* Strip whitespace since the addition of pseudo prefixes
10417 changed how the scrubber treats '{'. */
10418 if (is_space_char (*op_string))
10419 ++op_string;
10420
10421 continue;
10422 }
10423 unknown_vec_op:
10424 /* We don't know this one. */
10425 as_bad (_("unknown vector operation: `%s'"), saved);
10426 return NULL;
10427 }
10428
10429 if (i.mask && i.mask->zeroing && !i.mask->mask)
10430 {
10431 as_bad (_("zeroing-masking only allowed with write mask"));
10432 return NULL;
10433 }
10434
10435 return op_string;
10436 }
10437
10438 static int
10439 i386_immediate (char *imm_start)
10440 {
10441 char *save_input_line_pointer;
10442 char *gotfree_input_line;
10443 segT exp_seg = 0;
10444 expressionS *exp;
10445 i386_operand_type types;
10446
10447 operand_type_set (&types, ~0);
10448
10449 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
10450 {
10451 as_bad (_("at most %d immediate operands are allowed"),
10452 MAX_IMMEDIATE_OPERANDS);
10453 return 0;
10454 }
10455
10456 exp = &im_expressions[i.imm_operands++];
10457 i.op[this_operand].imms = exp;
10458
10459 if (is_space_char (*imm_start))
10460 ++imm_start;
10461
10462 save_input_line_pointer = input_line_pointer;
10463 input_line_pointer = imm_start;
10464
10465 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10466 if (gotfree_input_line)
10467 input_line_pointer = gotfree_input_line;
10468
10469 exp_seg = expression (exp);
10470
10471 SKIP_WHITESPACE ();
10472
10473 /* Handle vector operations. */
10474 if (*input_line_pointer == '{')
10475 {
10476 input_line_pointer = check_VecOperations (input_line_pointer,
10477 NULL);
10478 if (input_line_pointer == NULL)
10479 return 0;
10480 }
10481
10482 if (*input_line_pointer)
10483 as_bad (_("junk `%s' after expression"), input_line_pointer);
10484
10485 input_line_pointer = save_input_line_pointer;
10486 if (gotfree_input_line)
10487 {
10488 free (gotfree_input_line);
10489
10490 if (exp->X_op == O_constant || exp->X_op == O_register)
10491 exp->X_op = O_illegal;
10492 }
10493
10494 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
10495 }
10496
10497 static int
10498 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10499 i386_operand_type types, const char *imm_start)
10500 {
10501 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
10502 {
10503 if (imm_start)
10504 as_bad (_("missing or invalid immediate expression `%s'"),
10505 imm_start);
10506 return 0;
10507 }
10508 else if (exp->X_op == O_constant)
10509 {
10510 /* Size it properly later. */
10511 i.types[this_operand].bitfield.imm64 = 1;
10512 /* If not 64bit, sign extend val. */
10513 if (flag_code != CODE_64BIT
10514 && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
10515 exp->X_add_number
10516 = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
10517 }
10518 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10519 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
10520 && exp_seg != absolute_section
10521 && exp_seg != text_section
10522 && exp_seg != data_section
10523 && exp_seg != bss_section
10524 && exp_seg != undefined_section
10525 && !bfd_is_com_section (exp_seg))
10526 {
10527 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10528 return 0;
10529 }
10530 #endif
10531 else if (!intel_syntax && exp_seg == reg_section)
10532 {
10533 if (imm_start)
10534 as_bad (_("illegal immediate register operand %s"), imm_start);
10535 return 0;
10536 }
10537 else
10538 {
10539 /* This is an address. The size of the address will be
10540 determined later, depending on destination register,
10541 suffix, or the default for the section. */
10542 i.types[this_operand].bitfield.imm8 = 1;
10543 i.types[this_operand].bitfield.imm16 = 1;
10544 i.types[this_operand].bitfield.imm32 = 1;
10545 i.types[this_operand].bitfield.imm32s = 1;
10546 i.types[this_operand].bitfield.imm64 = 1;
10547 i.types[this_operand] = operand_type_and (i.types[this_operand],
10548 types);
10549 }
10550
10551 return 1;
10552 }
10553
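/* Parse the scale factor in a base/index memory operand, e.g. the "8"
in "(%rbx,%rcx,8)". Store log2 of the value in i.log2_scale_factor
and return a pointer past the parsed text, or NULL on error. */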
10554 static char *
10555 i386_scale (char *scale)
10556 {
10557 offsetT val;
10558 char *save = input_line_pointer;
10559
10560 input_line_pointer = scale;
10561 val = get_absolute_expression ();
10562
10563 switch (val)
10564 {
10565 case 1:
10566 i.log2_scale_factor = 0;
10567 break;
10568 case 2:
10569 i.log2_scale_factor = 1;
10570 break;
10571 case 4:
10572 i.log2_scale_factor = 2;
10573 break;
10574 case 8:
10575 i.log2_scale_factor = 3;
10576 break;
10577 default:
10578 {
10579 char sep = *input_line_pointer;
10580
10581 *input_line_pointer = '\0';
10582 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
10583 scale);
10584 *input_line_pointer = sep;
10585 input_line_pointer = save;
10586 return NULL;
10587 }
10588 }
10589 if (i.log2_scale_factor != 0 && i.index_reg == 0)
10590 {
10591 as_warn (_("scale factor of %d without an index register"),
10592 1 << i.log2_scale_factor);
10593 i.log2_scale_factor = 0;
10594 }
10595 scale = input_line_pointer;
10596 input_line_pointer = save;
10597 return scale;
10598 }
10599
10600 static int
10601 i386_displacement (char *disp_start, char *disp_end)
10602 {
10603 expressionS *exp;
10604 segT exp_seg = 0;
10605 char *save_input_line_pointer;
10606 char *gotfree_input_line;
10607 int override;
10608 i386_operand_type bigdisp, types = anydisp;
10609 int ret;
10610
10611 if (i.disp_operands == MAX_MEMORY_OPERANDS)
10612 {
10613 as_bad (_("at most %d displacement operands are allowed"),
10614 MAX_MEMORY_OPERANDS);
10615 return 0;
10616 }
10617
10618 operand_type_set (&bigdisp, 0);
10619 if (i.jumpabsolute
10620 || i.types[this_operand].bitfield.baseindex
10621 || (current_templates->start->opcode_modifier.jump != JUMP
10622 && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
10623 {
10624 i386_addressing_mode ();
10625 override = (i.prefix[ADDR_PREFIX] != 0);
10626 if (flag_code == CODE_64BIT)
10627 {
10628 if (!override)
10629 {
10630 bigdisp.bitfield.disp32s = 1;
10631 bigdisp.bitfield.disp64 = 1;
10632 }
10633 else
10634 bigdisp.bitfield.disp32 = 1;
10635 }
10636 else if ((flag_code == CODE_16BIT) ^ override)
10637 bigdisp.bitfield.disp16 = 1;
10638 else
10639 bigdisp.bitfield.disp32 = 1;
10640 }
10641 else
10642 {
10643 /* For PC-relative branches, the width of the displacement may be
10644 dependent upon data size, but is never dependent upon address size.
10645 Also make sure to not unintentionally match against a non-PC-relative
10646 branch template. */
10647 static templates aux_templates;
10648 const insn_template *t = current_templates->start;
10649 bfd_boolean has_intel64 = FALSE;
10650
10651 aux_templates.start = t;
10652 while (++t < current_templates->end)
10653 {
10654 if (t->opcode_modifier.jump
10655 != current_templates->start->opcode_modifier.jump)
10656 break;
10657 if ((t->opcode_modifier.isa64 >= INTEL64))
10658 has_intel64 = TRUE;
10659 }
10660 if (t < current_templates->end)
10661 {
10662 aux_templates.end = t;
10663 current_templates = &aux_templates;
10664 }
10665
10666 override = (i.prefix[DATA_PREFIX] != 0);
10667 if (flag_code == CODE_64BIT)
10668 {
10669 if ((override || i.suffix == WORD_MNEM_SUFFIX)
10670 && (!intel64 || !has_intel64))
10671 bigdisp.bitfield.disp16 = 1;
10672 else
10673 bigdisp.bitfield.disp32s = 1;
10674 }
10675 else
10676 {
10677 if (!override)
10678 override = (i.suffix == (flag_code != CODE_16BIT
10679 ? WORD_MNEM_SUFFIX
10680 : LONG_MNEM_SUFFIX));
10681 bigdisp.bitfield.disp32 = 1;
10682 if ((flag_code == CODE_16BIT) ^ override)
10683 {
10684 bigdisp.bitfield.disp32 = 0;
10685 bigdisp.bitfield.disp16 = 1;
10686 }
10687 }
10688 }
10689 i.types[this_operand] = operand_type_or (i.types[this_operand],
10690 bigdisp);
10691
10692 exp = &disp_expressions[i.disp_operands];
10693 i.op[this_operand].disps = exp;
10694 i.disp_operands++;
10695 save_input_line_pointer = input_line_pointer;
10696 input_line_pointer = disp_start;
10697 END_STRING_AND_SAVE (disp_end);
10698
10699 #ifndef GCC_ASM_O_HACK
10700 #define GCC_ASM_O_HACK 0
10701 #endif
10702 #if GCC_ASM_O_HACK
10703 END_STRING_AND_SAVE (disp_end + 1);
10704 if (i.types[this_operand].bitfield.baseIndex
10705 && displacement_string_end[-1] == '+')
10706 {
10707 /* This hack is to avoid a warning when using the "o"
10708 constraint within gcc asm statements.
10709 For instance:
10710
10711 #define _set_tssldt_desc(n,addr,limit,type) \
10712 __asm__ __volatile__ ( \
10713 "movw %w2,%0\n\t" \
10714 "movw %w1,2+%0\n\t" \
10715 "rorl $16,%1\n\t" \
10716 "movb %b1,4+%0\n\t" \
10717 "movb %4,5+%0\n\t" \
10718 "movb $0,6+%0\n\t" \
10719 "movb %h1,7+%0\n\t" \
10720 "rorl $16,%1" \
10721 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
10722
10723 This works great except that the output assembler ends
10724 up looking a bit weird if it turns out that there is
10725 no offset. You end up producing code that looks like:
10726
10727 #APP
10728 movw $235,(%eax)
10729 movw %dx,2+(%eax)
10730 rorl $16,%edx
10731 movb %dl,4+(%eax)
10732 movb $137,5+(%eax)
10733 movb $0,6+(%eax)
10734 movb %dh,7+(%eax)
10735 rorl $16,%edx
10736 #NO_APP
10737
10738 So here we provide the missing zero. */
10739
10740 *displacement_string_end = '0';
10741 }
10742 #endif
10743 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10744 if (gotfree_input_line)
10745 input_line_pointer = gotfree_input_line;
10746
10747 exp_seg = expression (exp);
10748
10749 SKIP_WHITESPACE ();
10750 if (*input_line_pointer)
10751 as_bad (_("junk `%s' after expression"), input_line_pointer);
10752 #if GCC_ASM_O_HACK
10753 RESTORE_END_STRING (disp_end + 1);
10754 #endif
10755 input_line_pointer = save_input_line_pointer;
10756 if (gotfree_input_line)
10757 {
10758 free (gotfree_input_line);
10759
10760 if (exp->X_op == O_constant || exp->X_op == O_register)
10761 exp->X_op = O_illegal;
10762 }
10763
10764 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
10765
10766 RESTORE_END_STRING (disp_end);
10767
10768 return ret;
10769 }
10770
10771 static int
10772 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10773 i386_operand_type types, const char *disp_start)
10774 {
10775 i386_operand_type bigdisp;
10776 int ret = 1;
10777
10778 /* We do this to make sure that the section symbol is in
10779 the symbol table. We will ultimately change the relocation
10780 to be relative to the beginning of the section. */
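/* E.g. a "sym@GOTOFF" displacement is rewritten below as the
expression "sym - _GLOBAL_OFFSET_TABLE_" with a plain 32-bit
relocation; later stages recognize the GOT symbol on the
subtrahend side. */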
10781 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
10782 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
10783 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10784 {
10785 if (exp->X_op != O_symbol)
10786 goto inv_disp;
10787
10788 if (S_IS_LOCAL (exp->X_add_symbol)
10789 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
10790 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
10791 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
10792 exp->X_op = O_subtract;
10793 exp->X_op_symbol = GOT_symbol;
10794 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
10795 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
10796 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10797 i.reloc[this_operand] = BFD_RELOC_64;
10798 else
10799 i.reloc[this_operand] = BFD_RELOC_32;
10800 }
10801
10802 else if (exp->X_op == O_absent
10803 || exp->X_op == O_illegal
10804 || exp->X_op == O_big)
10805 {
10806 inv_disp:
10807 as_bad (_("missing or invalid displacement expression `%s'"),
10808 disp_start);
10809 ret = 0;
10810 }
10811
10812 else if (flag_code == CODE_64BIT
10813 && !i.prefix[ADDR_PREFIX]
10814 && exp->X_op == O_constant)
10815 {
10816 /* Since the displacement is sign-extended to 64 bits, don't
10817 allow disp32, and turn off disp32s if it is out of range. */
10818 i.types[this_operand].bitfield.disp32 = 0;
10819 if (!fits_in_signed_long (exp->X_add_number))
10820 {
10821 i.types[this_operand].bitfield.disp32s = 0;
10822 if (i.types[this_operand].bitfield.baseindex)
10823 {
10824 as_bad (_("0x%lx out range of signed 32bit displacement"),
10825 (long) exp->X_add_number);
10826 ret = 0;
10827 }
10828 }
10829 }
10830
10831 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10832 else if (exp->X_op != O_constant
10833 && OUTPUT_FLAVOR == bfd_target_aout_flavour
10834 && exp_seg != absolute_section
10835 && exp_seg != text_section
10836 && exp_seg != data_section
10837 && exp_seg != bss_section
10838 && exp_seg != undefined_section
10839 && !bfd_is_com_section (exp_seg))
10840 {
10841 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10842 ret = 0;
10843 }
10844 #endif
10845
10846 if (current_templates->start->opcode_modifier.jump == JUMP_BYTE
10847 /* Constants get taken care of by optimize_disp(). */
10848 && exp->X_op != O_constant)
10849 i.types[this_operand].bitfield.disp8 = 1;
10850
10851 /* Check if this is a displacement only operand. */
10852 bigdisp = i.types[this_operand];
10853 bigdisp.bitfield.disp8 = 0;
10854 bigdisp.bitfield.disp16 = 0;
10855 bigdisp.bitfield.disp32 = 0;
10856 bigdisp.bitfield.disp32s = 0;
10857 bigdisp.bitfield.disp64 = 0;
10858 if (operand_type_all_zero (&bigdisp))
10859 i.types[this_operand] = operand_type_and (i.types[this_operand],
10860 types);
10861
10862 return ret;
10863 }
10864
10865 /* Return the active addressing mode, taking address override and
10866 registers forming the address into consideration. Update the
10867 address override prefix if necessary. */
10868
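/* For example (illustrative): in 64-bit mode "mov (%ebx), %eax" uses a
32-bit address register, so CODE_32BIT is returned and a 0x67
address-size prefix is inferred; in 32-bit mode "(%bp,%si)" likewise
infers 16-bit addressing. */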
10869 static enum flag_code
10870 i386_addressing_mode (void)
10871 {
10872 enum flag_code addr_mode;
10873
10874 if (i.prefix[ADDR_PREFIX])
10875 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
10876 else if (flag_code == CODE_16BIT
10877 && current_templates->start->cpu_flags.bitfield.cpumpx
10878 /* Avoid replacing the "16-bit addressing not allowed" diagnostic
10879 from md_assemble() by "is not a valid base/index expression"
10880 when there is a base and/or index. */
10881 && !i.types[this_operand].bitfield.baseindex)
10882 {
10883 /* MPX insn memory operands with neither base nor index must be forced
10884 to use 32-bit addressing in 16-bit mode. */
10885 addr_mode = CODE_32BIT;
10886 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10887 ++i.prefixes;
10888 gas_assert (!i.types[this_operand].bitfield.disp16);
10889 gas_assert (!i.types[this_operand].bitfield.disp32);
10890 }
10891 else
10892 {
10893 addr_mode = flag_code;
10894
10895 #if INFER_ADDR_PREFIX
10896 if (i.mem_operands == 0)
10897 {
10898 /* Infer address prefix from the first memory operand. */
10899 const reg_entry *addr_reg = i.base_reg;
10900
10901 if (addr_reg == NULL)
10902 addr_reg = i.index_reg;
10903
10904 if (addr_reg)
10905 {
10906 if (addr_reg->reg_type.bitfield.dword)
10907 addr_mode = CODE_32BIT;
10908 else if (flag_code != CODE_64BIT
10909 && addr_reg->reg_type.bitfield.word)
10910 addr_mode = CODE_16BIT;
10911
10912 if (addr_mode != flag_code)
10913 {
10914 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10915 i.prefixes += 1;
10916 /* Change the size of any displacement too. At most one
10917 of Disp16 or Disp32 is set.
10918 FIXME. There doesn't seem to be any real need for
10919 separate Disp16 and Disp32 flags. The same goes for
10920 Imm16 and Imm32. Removing them would probably clean
10921 up the code quite a lot. */
10922 if (flag_code != CODE_64BIT
10923 && (i.types[this_operand].bitfield.disp16
10924 || i.types[this_operand].bitfield.disp32))
10925 i.types[this_operand]
10926 = operand_type_xor (i.types[this_operand], disp16_32);
10927 }
10928 }
10929 }
10930 #endif
10931 }
10932
10933 return addr_mode;
10934 }
10935
10936 /* Make sure the memory operand we've been dealt is valid.
10937 Return 1 on success, 0 on a failure. */
10938
10939 static int
10940 i386_index_check (const char *operand_string)
10941 {
10942 const char *kind = "base/index";
10943 enum flag_code addr_mode = i386_addressing_mode ();
10944
10945 if (current_templates->start->opcode_modifier.isstring
10946 && !current_templates->start->cpu_flags.bitfield.cpupadlock
10947 && (current_templates->end[-1].opcode_modifier.isstring
10948 || i.mem_operands))
10949 {
10950 /* Memory operands of string insns are special in that they only allow
10951 a single register (rDI, rSI, or rBX) as their memory address. */
10952 const reg_entry *expected_reg;
10953 static const char *di_si[][2] =
10954 {
10955 { "esi", "edi" },
10956 { "si", "di" },
10957 { "rsi", "rdi" }
10958 };
10959 static const char *bx[] = { "ebx", "bx", "rbx" };
10960
10961 kind = "string address";
10962
10963 if (current_templates->start->opcode_modifier.repprefixok)
10964 {
10965 int es_op = current_templates->end[-1].opcode_modifier.isstring
10966 - IS_STRING_ES_OP0;
10967 int op = 0;
10968
10969 if (!current_templates->end[-1].operand_types[0].bitfield.baseindex
10970 || ((!i.mem_operands != !intel_syntax)
10971 && current_templates->end[-1].operand_types[1]
10972 .bitfield.baseindex))
10973 op = 1;
10974 expected_reg
10975 = (const reg_entry *) str_hash_find (reg_hash,
10976 di_si[addr_mode][op == es_op]);
10977 }
10978 else
10979 expected_reg
10980 = (const reg_entry *)str_hash_find (reg_hash, bx[addr_mode]);
10981
10982 if (i.base_reg != expected_reg
10983 || i.index_reg
10984 || operand_type_check (i.types[this_operand], disp))
10985 {
10986 /* The second memory operand must have the same size as
10987 the first one. */
10988 if (i.mem_operands
10989 && i.base_reg
10990 && !((addr_mode == CODE_64BIT
10991 && i.base_reg->reg_type.bitfield.qword)
10992 || (addr_mode == CODE_32BIT
10993 ? i.base_reg->reg_type.bitfield.dword
10994 : i.base_reg->reg_type.bitfield.word)))
10995 goto bad_address;
10996
10997 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
10998 operand_string,
10999 intel_syntax ? '[' : '(',
11000 register_prefix,
11001 expected_reg->reg_name,
11002 intel_syntax ? ']' : ')');
11003 return 1;
11004 }
11005 else
11006 return 1;
11007
11008 bad_address:
11009 as_bad (_("`%s' is not a valid %s expression"),
11010 operand_string, kind);
11011 return 0;
11012 }
11013 else
11014 {
11015 if (addr_mode != CODE_16BIT)
11016 {
11017 /* 32-bit/64-bit checks. */
11018 if (i.disp_encoding == disp_encoding_16bit)
11019 {
11020 bad_disp:
11021 as_bad (_("invalid `%s' prefix"),
11022 addr_mode == CODE_16BIT ? "{disp32}" : "{disp16}");
11023 return 0;
11024 }
11025
11026 if ((i.base_reg
11027 && ((addr_mode == CODE_64BIT
11028 ? !i.base_reg->reg_type.bitfield.qword
11029 : !i.base_reg->reg_type.bitfield.dword)
11030 || (i.index_reg && i.base_reg->reg_num == RegIP)
11031 || i.base_reg->reg_num == RegIZ))
11032 || (i.index_reg
11033 && !i.index_reg->reg_type.bitfield.xmmword
11034 && !i.index_reg->reg_type.bitfield.ymmword
11035 && !i.index_reg->reg_type.bitfield.zmmword
11036 && ((addr_mode == CODE_64BIT
11037 ? !i.index_reg->reg_type.bitfield.qword
11038 : !i.index_reg->reg_type.bitfield.dword)
11039 || !i.index_reg->reg_type.bitfield.baseindex)))
11040 goto bad_address;
11041
11042 /* bndmk, bndldx, bndstx and mandatory non-vector SIB have special restrictions. */
11043 if (current_templates->start->base_opcode == 0xf30f1b
11044 || (current_templates->start->base_opcode & ~1) == 0x0f1a
11045 || current_templates->start->opcode_modifier.sib == SIBMEM)
11046 {
11047 /* They cannot use RIP-relative addressing. */
11048 if (i.base_reg && i.base_reg->reg_num == RegIP)
11049 {
11050 as_bad (_("`%s' cannot be used here"), operand_string);
11051 return 0;
11052 }
11053
11054 /* bndldx and bndstx ignore their scale factor. */
11055 if ((current_templates->start->base_opcode & ~1) == 0x0f1a
11056 && i.log2_scale_factor)
11057 as_warn (_("register scaling is being ignored here"));
11058 }
11059 }
11060 else
11061 {
11062 /* 16-bit checks. */
11063 if (i.disp_encoding == disp_encoding_32bit)
11064 goto bad_disp;
11065
11066 if ((i.base_reg
11067 && (!i.base_reg->reg_type.bitfield.word
11068 || !i.base_reg->reg_type.bitfield.baseindex))
11069 || (i.index_reg
11070 && (!i.index_reg->reg_type.bitfield.word
11071 || !i.index_reg->reg_type.bitfield.baseindex
11072 || !(i.base_reg
11073 && i.base_reg->reg_num < 6
11074 && i.index_reg->reg_num >= 6
11075 && i.log2_scale_factor == 0))))
11076 goto bad_address;
11077 }
11078 }
11079 return 1;
11080 }
11081
11082 /* Handle vector immediates. */
11083
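/* These are the EVEX embedded-rounding / suppress-all-exceptions
pseudo-operands, e.g. the "{rn-sae}" in
vaddps {rn-sae}, %zmm0, %zmm1, %zmm2
They select bits of the EVEX prefix rather than encoding a real
immediate, but are parsed here as an imm8 operand placeholder. */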
11084 static int
11085 RC_SAE_immediate (const char *imm_start)
11086 {
11087 unsigned int match_found, j;
11088 const char *pstr = imm_start;
11089 expressionS *exp;
11090
11091 if (*pstr != '{')
11092 return 0;
11093
11094 pstr++;
11095 match_found = 0;
11096 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
11097 {
11098 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
11099 {
11100 if (!i.rounding)
11101 {
11102 rc_op.type = RC_NamesTable[j].type;
11103 rc_op.operand = this_operand;
11104 i.rounding = &rc_op;
11105 }
11106 else
11107 {
11108 as_bad (_("duplicated `%s'"), imm_start);
11109 return 0;
11110 }
11111 pstr += RC_NamesTable[j].len;
11112 match_found = 1;
11113 break;
11114 }
11115 }
11116 if (!match_found)
11117 return 0;
11118
11119 if (*pstr++ != '}')
11120 {
11121 as_bad (_("Missing '}': '%s'"), imm_start);
11122 return 0;
11123 }
11124 /* RC/SAE immediate string should contain nothing more. */
11125 if (*pstr != 0)
11126 {
11127 as_bad (_("Junk after '}': '%s'"), imm_start);
11128 return 0;
11129 }
11130
11131 exp = &im_expressions[i.imm_operands++];
11132 i.op[this_operand].imms = exp;
11133
11134 exp->X_op = O_constant;
11135 exp->X_add_number = 0;
11136 exp->X_add_symbol = (symbolS *) 0;
11137 exp->X_op_symbol = (symbolS *) 0;
11138
11139 i.types[this_operand].bitfield.imm8 = 1;
11140 return 1;
11141 }
11142
11143 /* Only string instructions can have a second memory operand, so
11144 reduce current_templates to just those if it contains any. */
11145 static int
11146 maybe_adjust_templates (void)
11147 {
11148 const insn_template *t;
11149
11150 gas_assert (i.mem_operands == 1);
11151
11152 for (t = current_templates->start; t < current_templates->end; ++t)
11153 if (t->opcode_modifier.isstring)
11154 break;
11155
11156 if (t < current_templates->end)
11157 {
11158 static templates aux_templates;
11159 bfd_boolean recheck;
11160
11161 aux_templates.start = t;
11162 for (; t < current_templates->end; ++t)
11163 if (!t->opcode_modifier.isstring)
11164 break;
11165 aux_templates.end = t;
11166
11167 /* Determine whether to re-check the first memory operand. */
11168 recheck = (aux_templates.start != current_templates->start
11169 || t != current_templates->end);
11170
11171 current_templates = &aux_templates;
11172
11173 if (recheck)
11174 {
11175 i.mem_operands = 0;
11176 if (i.memop1_string != NULL
11177 && i386_index_check (i.memop1_string) == 0)
11178 return 0;
11179 i.mem_operands = 1;
11180 }
11181 }
11182
11183 return 1;
11184 }
11185
11186 /* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
11187 on error. */
11188
11189 static int
11190 i386_att_operand (char *operand_string)
11191 {
11192 const reg_entry *r;
11193 char *end_op;
11194 char *op_string = operand_string;
11195
11196 if (is_space_char (*op_string))
11197 ++op_string;
11198
11199 /* We check for an absolute prefix (differentiating,
11200 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'). */
11201 if (*op_string == ABSOLUTE_PREFIX)
11202 {
11203 ++op_string;
11204 if (is_space_char (*op_string))
11205 ++op_string;
11206 i.jumpabsolute = TRUE;
11207 }
11208
11209 /* Check if operand is a register. */
11210 if ((r = parse_register (op_string, &end_op)) != NULL)
11211 {
11212 i386_operand_type temp;
11213
11214 if (r == &bad_reg)
11215 return 0;
11216
11217 /* Check for a segment override by searching for ':' after a
11218 segment register. */
11219 op_string = end_op;
11220 if (is_space_char (*op_string))
11221 ++op_string;
11222 if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
11223 {
11224 switch (r->reg_num)
11225 {
11226 case 0:
11227 i.seg[i.mem_operands] = &es;
11228 break;
11229 case 1:
11230 i.seg[i.mem_operands] = &cs;
11231 break;
11232 case 2:
11233 i.seg[i.mem_operands] = &ss;
11234 break;
11235 case 3:
11236 i.seg[i.mem_operands] = &ds;
11237 break;
11238 case 4:
11239 i.seg[i.mem_operands] = &fs;
11240 break;
11241 case 5:
11242 i.seg[i.mem_operands] = &gs;
11243 break;
11244 }
11245
11246 /* Skip the ':' and whitespace. */
11247 ++op_string;
11248 if (is_space_char (*op_string))
11249 ++op_string;
11250
11251 if (!is_digit_char (*op_string)
11252 && !is_identifier_char (*op_string)
11253 && *op_string != '('
11254 && *op_string != ABSOLUTE_PREFIX)
11255 {
11256 as_bad (_("bad memory operand `%s'"), op_string);
11257 return 0;
11258 }
11259 /* Handle case of %es:*foo. */
11260 if (*op_string == ABSOLUTE_PREFIX)
11261 {
11262 ++op_string;
11263 if (is_space_char (*op_string))
11264 ++op_string;
11265 i.jumpabsolute = TRUE;
11266 }
11267 goto do_memory_reference;
11268 }
11269
11270 /* Handle vector operations. */
11271 if (*op_string == '{')
11272 {
11273 op_string = check_VecOperations (op_string, NULL);
11274 if (op_string == NULL)
11275 return 0;
11276 }
11277
11278 if (*op_string)
11279 {
11280 as_bad (_("junk `%s' after register"), op_string);
11281 return 0;
11282 }
11283 temp = r->reg_type;
11284 temp.bitfield.baseindex = 0;
11285 i.types[this_operand] = operand_type_or (i.types[this_operand],
11286 temp);
11287 i.types[this_operand].bitfield.unspecified = 0;
11288 i.op[this_operand].regs = r;
11289 i.reg_operands++;
11290 }
11291 else if (*op_string == REGISTER_PREFIX)
11292 {
11293 as_bad (_("bad register name `%s'"), op_string);
11294 return 0;
11295 }
11296 else if (*op_string == IMMEDIATE_PREFIX)
11297 {
11298 ++op_string;
11299 if (i.jumpabsolute)
11300 {
11301 as_bad (_("immediate operand illegal with absolute jump"));
11302 return 0;
11303 }
11304 if (!i386_immediate (op_string))
11305 return 0;
11306 }
11307 else if (RC_SAE_immediate (operand_string))
11308 {
11309 /* If it is a RC or SAE immediate, do nothing. */
11310 ;
11311 }
11312 else if (is_digit_char (*op_string)
11313 || is_identifier_char (*op_string)
11314 || *op_string == '"'
11315 || *op_string == '(')
11316 {
11317 /* This is a memory reference of some sort. */
11318 char *base_string;
11319
11320 /* Start and end of displacement string expression (if found). */
11321 char *displacement_string_start;
11322 char *displacement_string_end;
11323 char *vop_start;
11324
11325 do_memory_reference:
11326 if (i.mem_operands == 1 && !maybe_adjust_templates ())
11327 return 0;
11328 if ((i.mem_operands == 1
11329 && !current_templates->start->opcode_modifier.isstring)
11330 || i.mem_operands == 2)
11331 {
11332 as_bad (_("too many memory references for `%s'"),
11333 current_templates->start->name);
11334 return 0;
11335 }
11336
11337 /* Check for base index form. We detect the base index form by
11338 looking for an ')' at the end of the operand, searching
11339 for the '(' matching it, and finding a REGISTER_PREFIX or ','
11340 after the '('. */
11341 base_string = op_string + strlen (op_string);
11342
11343 /* Handle vector operations. */
11344 vop_start = strchr (op_string, '{');
11345 if (vop_start && vop_start < base_string)
11346 {
11347 if (check_VecOperations (vop_start, base_string) == NULL)
11348 return 0;
11349 base_string = vop_start;
11350 }
11351
11352 --base_string;
11353 if (is_space_char (*base_string))
11354 --base_string;
11355
11356 /* If we only have a displacement, set up for it to be parsed later. */
11357 displacement_string_start = op_string;
11358 displacement_string_end = base_string + 1;
11359
11360 if (*base_string == ')')
11361 {
11362 char *temp_string;
11363 unsigned int parens_balanced = 1;
11364 /* We've already checked that the numbers of left & right ()'s
11365 are equal, so this loop will not be infinite. */
11366 do
11367 {
11368 base_string--;
11369 if (*base_string == ')')
11370 parens_balanced++;
11371 if (*base_string == '(')
11372 parens_balanced--;
11373 }
11374 while (parens_balanced);
11375
11376 temp_string = base_string;
11377
11378 /* Skip past '(' and whitespace. */
11379 ++base_string;
11380 if (is_space_char (*base_string))
11381 ++base_string;
11382
11383 if (*base_string == ','
11384 || ((i.base_reg = parse_register (base_string, &end_op))
11385 != NULL))
11386 {
11387 displacement_string_end = temp_string;
11388
11389 i.types[this_operand].bitfield.baseindex = 1;
11390
11391 if (i.base_reg)
11392 {
11393 if (i.base_reg == &bad_reg)
11394 return 0;
11395 base_string = end_op;
11396 if (is_space_char (*base_string))
11397 ++base_string;
11398 }
11399
11400 /* There may be an index reg or scale factor here. */
11401 if (*base_string == ',')
11402 {
11403 ++base_string;
11404 if (is_space_char (*base_string))
11405 ++base_string;
11406
11407 if ((i.index_reg = parse_register (base_string, &end_op))
11408 != NULL)
11409 {
11410 if (i.index_reg == &bad_reg)
11411 return 0;
11412 base_string = end_op;
11413 if (is_space_char (*base_string))
11414 ++base_string;
11415 if (*base_string == ',')
11416 {
11417 ++base_string;
11418 if (is_space_char (*base_string))
11419 ++base_string;
11420 }
11421 else if (*base_string != ')')
11422 {
11423 as_bad (_("expecting `,' or `)' "
11424 "after index register in `%s'"),
11425 operand_string);
11426 return 0;
11427 }
11428 }
11429 else if (*base_string == REGISTER_PREFIX)
11430 {
11431 end_op = strchr (base_string, ',');
11432 if (end_op)
11433 *end_op = '\0';
11434 as_bad (_("bad register name `%s'"), base_string);
11435 return 0;
11436 }
11437
11438 /* Check for scale factor. */
11439 if (*base_string != ')')
11440 {
11441 char *end_scale = i386_scale (base_string);
11442
11443 if (!end_scale)
11444 return 0;
11445
11446 base_string = end_scale;
11447 if (is_space_char (*base_string))
11448 ++base_string;
11449 if (*base_string != ')')
11450 {
11451 as_bad (_("expecting `)' "
11452 "after scale factor in `%s'"),
11453 operand_string);
11454 return 0;
11455 }
11456 }
11457 else if (!i.index_reg)
11458 {
11459 as_bad (_("expecting index register or scale factor "
11460 "after `,'; got '%c'"),
11461 *base_string);
11462 return 0;
11463 }
11464 }
11465 else if (*base_string != ')')
11466 {
11467 as_bad (_("expecting `,' or `)' "
11468 "after base register in `%s'"),
11469 operand_string);
11470 return 0;
11471 }
11472 }
11473 else if (*base_string == REGISTER_PREFIX)
11474 {
11475 end_op = strchr (base_string, ',');
11476 if (end_op)
11477 *end_op = '\0';
11478 as_bad (_("bad register name `%s'"), base_string);
11479 return 0;
11480 }
11481 }
11482
11483 /* If there's an expression beginning the operand, parse it,
11484 assuming displacement_string_start and
11485 displacement_string_end are meaningful. */
11486 if (displacement_string_start != displacement_string_end)
11487 {
11488 if (!i386_displacement (displacement_string_start,
11489 displacement_string_end))
11490 return 0;
11491 }
11492
11493 /* Special case for (%dx) when doing an input/output op. */
11494 if (i.base_reg
11495 && i.base_reg->reg_type.bitfield.instance == RegD
11496 && i.base_reg->reg_type.bitfield.word
11497 && i.index_reg == 0
11498 && i.log2_scale_factor == 0
11499 && i.seg[i.mem_operands] == 0
11500 && !operand_type_check (i.types[this_operand], disp))
11501 {
11502 i.types[this_operand] = i.base_reg->reg_type;
11503 return 1;
11504 }
11505
11506 if (i386_index_check (operand_string) == 0)
11507 return 0;
11508 i.flags[this_operand] |= Operand_Mem;
11509 if (i.mem_operands == 0)
11510 i.memop1_string = xstrdup (operand_string);
11511 i.mem_operands++;
11512 }
11513 else
11514 {
11515 /* It's not a memory operand; argh! */
11516 as_bad (_("invalid char %s beginning operand %d `%s'"),
11517 output_invalid (*op_string),
11518 this_operand + 1,
11519 op_string);
11520 return 0;
11521 }
11522 return 1; /* Normal return. */
11523 }
11524 \f
11525 /* Calculate the maximum variable size (i.e., excluding fr_fix)
11526 that an rs_machine_dependent frag may reach. */
11527
11528 unsigned int
11529 i386_frag_max_var (fragS *frag)
11530 {
11531 /* The only relaxable frags are for jumps.
11532 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
11533 gas_assert (frag->fr_type == rs_machine_dependent);
11534 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
11535 }
11536
11537 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11538 static int
11539 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
11540 {
11541 /* STT_GNU_IFUNC symbol must go through PLT. */
11542 if ((symbol_get_bfdsym (fr_symbol)->flags
11543 & BSF_GNU_INDIRECT_FUNCTION) != 0)
11544 return 0;
11545
11546 if (!S_IS_EXTERNAL (fr_symbol))
11547 /* Symbol may be weak or local. */
11548 return !S_IS_WEAK (fr_symbol);
11549
11550 /* Global symbols with non-default visibility can't be preempted. */
11551 if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
11552 return 1;
11553
11554 if (fr_var != NO_RELOC)
11555 switch ((enum bfd_reloc_code_real) fr_var)
11556 {
11557 case BFD_RELOC_386_PLT32:
11558 case BFD_RELOC_X86_64_PLT32:
11559 /* Symbol with PLT relocation may be preempted. */
11560 return 0;
11561 default:
11562 abort ();
11563 }
11564
11565 /* Global symbols with default visibility in a shared library may be
11566 preempted by another definition. */
11567 return !shared;
11568 }
11569 #endif
11570
11571 /* Table 3-2. Macro-Fusible Instructions in Haswell Microarchitecture
11572 Note: this also holds for Skylake and Cascade Lake.
11573 ---------------------------------------------------------------------
11574 | JCC | ADD/SUB/CMP | INC/DEC | TEST/AND |
11575 | ------ | ----------- | ------- | -------- |
11576 | Jo | N | N | Y |
11577 | Jno | N | N | Y |
11578 | Jc/Jb | Y | N | Y |
11579 | Jae/Jnb | Y | N | Y |
11580 | Je/Jz | Y | Y | Y |
11581 | Jne/Jnz | Y | Y | Y |
11582 | Jna/Jbe | Y | N | Y |
11583 | Ja/Jnbe | Y | N | Y |
11584 | Js | N | N | Y |
11585 | Jns | N | N | Y |
11586 | Jp/Jpe | N | N | Y |
11587 | Jnp/Jpo | N | N | Y |
11588 | Jl/Jnge | Y | Y | Y |
11589 | Jge/Jnl | Y | Y | Y |
11590 | Jle/Jng | Y | Y | Y |
11591 | Jg/Jnle | Y | Y | Y |
11592 --------------------------------------------------------------------- */
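/* For example, per the table above: "cmp %eax, %ebx; jne L" can
macro-fuse, while "dec %ecx; jb L" cannot. */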
11593 static int
11594 i386_macro_fusible_p (enum mf_cmp_kind mf_cmp, enum mf_jcc_kind mf_jcc)
11595 {
11596 if (mf_cmp == mf_cmp_alu_cmp)
11597 return ((mf_jcc >= mf_jcc_jc && mf_jcc <= mf_jcc_jna)
11598 || mf_jcc == mf_jcc_jl || mf_jcc == mf_jcc_jle);
11599 if (mf_cmp == mf_cmp_incdec)
11600 return (mf_jcc == mf_jcc_je || mf_jcc == mf_jcc_jl
11601 || mf_jcc == mf_jcc_jle);
11602 if (mf_cmp == mf_cmp_test_and)
11603 return 1;
11604 return 0;
11605 }
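/* Editor's note: a hedged example of reading the fusion table above;
   illustrative only, not compiled.  */
#if 0
  /* `cmp %eax, %ebx; jb label' is mf_cmp_alu_cmp + mf_jcc_jc: Y.  */
  gas_assert (i386_macro_fusible_p (mf_cmp_alu_cmp, mf_jcc_jc));
  /* `inc %eax; jb label' is mf_cmp_incdec + mf_jcc_jc: N.  */
  gas_assert (!i386_macro_fusible_p (mf_cmp_incdec, mf_jcc_jc));
#endif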
11606
11607 /* Return the next non-empty frag. */
11608
11609 static fragS *
11610 i386_next_non_empty_frag (fragS *fragP)
11611 {
11612 /* There may be a frag with a ".fill 0" when there is no room in
11613 the current frag for frag_grow in output_insn. */
11614 for (fragP = fragP->fr_next;
11615 (fragP != NULL
11616 && fragP->fr_type == rs_fill
11617 && fragP->fr_fix == 0);
11618 fragP = fragP->fr_next)
11619 ;
11620 return fragP;
11621 }
11622
11623 /* Return the next jcc frag after BRANCH_PADDING. */
11624
11625 static fragS *
11626 i386_next_fusible_jcc_frag (fragS *maybe_cmp_fragP, fragS *pad_fragP)
11627 {
11628 fragS *branch_fragP;
11629 if (!pad_fragP)
11630 return NULL;
11631
11632 if (pad_fragP->fr_type == rs_machine_dependent
11633 && (TYPE_FROM_RELAX_STATE (pad_fragP->fr_subtype)
11634 == BRANCH_PADDING))
11635 {
11636 branch_fragP = i386_next_non_empty_frag (pad_fragP);
11637 if (branch_fragP->fr_type != rs_machine_dependent)
11638 return NULL;
11639 if (TYPE_FROM_RELAX_STATE (branch_fragP->fr_subtype) == COND_JUMP
11640 && i386_macro_fusible_p (maybe_cmp_fragP->tc_frag_data.mf_type,
11641 pad_fragP->tc_frag_data.mf_type))
11642 return branch_fragP;
11643 }
11644
11645 return NULL;
11646 }
11647
11648 /* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags. */
11649
11650 static void
11651 i386_classify_machine_dependent_frag (fragS *fragP)
11652 {
11653 fragS *cmp_fragP;
11654 fragS *pad_fragP;
11655 fragS *branch_fragP;
11656 fragS *next_fragP;
11657 unsigned int max_prefix_length;
11658
11659 if (fragP->tc_frag_data.classified)
11660 return;
11661
11662 /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING. Convert
11663 FUSED_JCC_PADDING and merge BRANCH_PADDING. */
11664 for (next_fragP = fragP;
11665 next_fragP != NULL;
11666 next_fragP = next_fragP->fr_next)
11667 {
11668 next_fragP->tc_frag_data.classified = 1;
11669 if (next_fragP->fr_type == rs_machine_dependent)
11670 switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
11671 {
11672 case BRANCH_PADDING:
11673 /* The BRANCH_PADDING frag must be followed by a branch
11674 frag. */
11675 branch_fragP = i386_next_non_empty_frag (next_fragP);
11676 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11677 break;
11678 case FUSED_JCC_PADDING:
11679 /* Check if this is a fused jcc:
11680 FUSED_JCC_PADDING
11681 CMP like instruction
11682 BRANCH_PADDING
11683 COND_JUMP
11684 */
11685 cmp_fragP = i386_next_non_empty_frag (next_fragP);
11686 pad_fragP = i386_next_non_empty_frag (cmp_fragP);
11687 branch_fragP = i386_next_fusible_jcc_frag (next_fragP, pad_fragP);
11688 if (branch_fragP)
11689 {
11690 /* The BRANCH_PADDING frag is merged with the
11691 FUSED_JCC_PADDING frag. */
11692 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11693 /* CMP like instruction size. */
11694 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
11695 frag_wane (pad_fragP);
11696 /* Skip to branch_fragP. */
11697 next_fragP = branch_fragP;
11698 }
11699 else if (next_fragP->tc_frag_data.max_prefix_length)
11700 {
11701 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
11702 a fused jcc. */
11703 next_fragP->fr_subtype
11704 = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
11705 next_fragP->tc_frag_data.max_bytes
11706 = next_fragP->tc_frag_data.max_prefix_length;
11707 /* This will be updated in the BRANCH_PREFIX scan. */
11708 next_fragP->tc_frag_data.max_prefix_length = 0;
11709 }
11710 else
11711 frag_wane (next_fragP);
11712 break;
11713 }
11714 }
11715
11716 /* Stop if there is no BRANCH_PREFIX. */
11717 if (!align_branch_prefix_size)
11718 return;
11719
11720 /* Scan for BRANCH_PREFIX. */
11721 for (; fragP != NULL; fragP = fragP->fr_next)
11722 {
11723 if (fragP->fr_type != rs_machine_dependent
11724 || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11725 != BRANCH_PREFIX))
11726 continue;
11727
11728 /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
11729 COND_JUMP_PREFIX. */
11730 max_prefix_length = 0;
11731 for (next_fragP = fragP;
11732 next_fragP != NULL;
11733 next_fragP = next_fragP->fr_next)
11734 {
11735 if (next_fragP->fr_type == rs_fill)
11736 /* Skip rs_fill frags. */
11737 continue;
11738 else if (next_fragP->fr_type != rs_machine_dependent)
11739 /* Stop for all other frags. */
11740 break;
11741
11742 /* rs_machine_dependent frags. */
11743 if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11744 == BRANCH_PREFIX)
11745 {
11746 /* Count BRANCH_PREFIX frags. */
11747 if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
11748 {
11749 max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
11750 frag_wane (next_fragP);
11751 }
11752 else
11753 max_prefix_length
11754 += next_fragP->tc_frag_data.max_bytes;
11755 }
11756 else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11757 == BRANCH_PADDING)
11758 || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11759 == FUSED_JCC_PADDING))
11760 {
11761 /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING. */
11762 fragP->tc_frag_data.u.padding_fragP = next_fragP;
11763 break;
11764 }
11765 else
11766 /* Stop for other rs_machine_dependent frags. */
11767 break;
11768 }
11769
11770 fragP->tc_frag_data.max_prefix_length = max_prefix_length;
11771
11772 /* Skip to the next frag. */
11773 fragP = next_fragP;
11774 }
11775 }
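/* Editor's note: a sketch of the frag chains the classifier above
   recognizes (assuming, as elsewhere in this file, that padding frags
   directly precede the code they pad):

     FUSED_JCC_PADDING -> CMP-like insn -> BRANCH_PADDING -> COND_JUMP
       (the BRANCH_PADDING frag is merged into the FUSED_JCC_PADDING one)

     BRANCH_PREFIX ... BRANCH_PREFIX -> BRANCH_PADDING/FUSED_JCC_PADDING
       (prefix frags accumulate up to MAX_FUSED_JCC_PADDING_SIZE bytes)  */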
11776
11777 /* Compute padding size for
11778
11779 FUSED_JCC_PADDING
11780 CMP like instruction
11781 BRANCH_PADDING
11782 COND_JUMP/UNCOND_JUMP
11783
11784 or
11785
11786 BRANCH_PADDING
11787 COND_JUMP/UNCOND_JUMP
11788 */
11789
11790 static int
11791 i386_branch_padding_size (fragS *fragP, offsetT address)
11792 {
11793 unsigned int offset, size, padding_size;
11794 fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
11795
11796 /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag. */
11797 if (!address)
11798 address = fragP->fr_address;
11799 address += fragP->fr_fix;
11800
11801 /* CMP like instruction size. */
11802 size = fragP->tc_frag_data.cmp_size;
11803
11804 /* The base size of the branch frag. */
11805 size += branch_fragP->fr_fix;
11806
11807 /* Add opcode and displacement bytes for the rs_machine_dependent
11808 branch frag. */
11809 if (branch_fragP->fr_type == rs_machine_dependent)
11810 size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
11811
11812 /* Check if branch is within boundary and doesn't end at the last
11813 byte. */
11814 offset = address & ((1U << align_branch_power) - 1);
11815 if ((offset + size) >= (1U << align_branch_power))
11816 /* Padding needed to avoid crossing boundary. */
11817 padding_size = (1U << align_branch_power) - offset;
11818 else
11819 /* No padding needed. */
11820 padding_size = 0;
11821
11822 /* The return value may be saved in tc_frag_data.length, which is
11823 an unsigned byte. */
11824 if (!fits_in_unsigned_byte (padding_size))
11825 abort ();
11826
11827 return padding_size;
11828 }
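/* Editor's note: a worked example of the computation above, with
   made-up numbers; not compiled.  */
#if 0
  /* Assume align_branch_power == 5 (a 32-byte boundary) and a 6-byte
     fused cmp+jcc pair that would otherwise start at address 0x41c.  */
  offset = 0x41c & 31;                    /* 28 */
  size = 6;                               /* 4-byte cmp + 2-byte jcc */
  /* 28 + 6 >= 32, so the pair would cross (or end on) the boundary:
     pad with 32 - 28 = 4 bytes.  */
  padding_size = 32 - offset;             /* 4 */
#endif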
11829
11830 /* i386_generic_table_relax_frag()
11831
11832 Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
11833 grow/shrink padding to align branch frags. Hand others to
11834 relax_frag(). */
11835
11836 long
11837 i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
11838 {
11839 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11840 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11841 {
11842 long padding_size = i386_branch_padding_size (fragP, 0);
11843 long grow = padding_size - fragP->tc_frag_data.length;
11844
11845 /* When the BRANCH_PREFIX frag is used, the computed address
11846 must match the actual address and there should be no padding. */
11847 if (fragP->tc_frag_data.padding_address
11848 && (fragP->tc_frag_data.padding_address != fragP->fr_address
11849 || padding_size))
11850 abort ();
11851
11852 /* Update the padding size. */
11853 if (grow)
11854 fragP->tc_frag_data.length = padding_size;
11855
11856 return grow;
11857 }
11858 else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11859 {
11860 fragS *padding_fragP, *next_fragP;
11861 long padding_size, left_size, last_size;
11862
11863 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11864 if (!padding_fragP)
11865 /* Use the padding set by the leading BRANCH_PREFIX frag. */
11866 return (fragP->tc_frag_data.length
11867 - fragP->tc_frag_data.last_length);
11868
11869 /* Compute the relative address of the padding frag the very
11870 first time through, when the BRANCH_PREFIX frag sizes are all zero. */
11871 if (!fragP->tc_frag_data.padding_address)
11872 fragP->tc_frag_data.padding_address
11873 = padding_fragP->fr_address - (fragP->fr_address - stretch);
11874
11875 /* First update the last length from the previous iteration. */
11876 left_size = fragP->tc_frag_data.prefix_length;
11877 for (next_fragP = fragP;
11878 next_fragP != padding_fragP;
11879 next_fragP = next_fragP->fr_next)
11880 if (next_fragP->fr_type == rs_machine_dependent
11881 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11882 == BRANCH_PREFIX))
11883 {
11884 if (left_size)
11885 {
11886 int max = next_fragP->tc_frag_data.max_bytes;
11887 if (max)
11888 {
11889 int size;
11890 if (max > left_size)
11891 size = left_size;
11892 else
11893 size = max;
11894 left_size -= size;
11895 next_fragP->tc_frag_data.last_length = size;
11896 }
11897 }
11898 else
11899 next_fragP->tc_frag_data.last_length = 0;
11900 }
11901
11902 /* Check the padding size for the padding frag. */
11903 padding_size = i386_branch_padding_size
11904 (padding_fragP, (fragP->fr_address
11905 + fragP->tc_frag_data.padding_address));
11906
11907 last_size = fragP->tc_frag_data.prefix_length;
11908 /* Check if there is any change from the last iteration. */
11909 if (padding_size == last_size)
11910 {
11911 /* Update the expected address of the padding frag. */
11912 padding_fragP->tc_frag_data.padding_address
11913 = (fragP->fr_address + padding_size
11914 + fragP->tc_frag_data.padding_address);
11915 return 0;
11916 }
11917
11918 if (padding_size > fragP->tc_frag_data.max_prefix_length)
11919 {
11920 /* No padding if there is insufficient room. Clear the
11921 expected address of the padding frag. */
11922 padding_fragP->tc_frag_data.padding_address = 0;
11923 padding_size = 0;
11924 }
11925 else
11926 /* Store the expected address of the padding frag. */
11927 padding_fragP->tc_frag_data.padding_address
11928 = (fragP->fr_address + padding_size
11929 + fragP->tc_frag_data.padding_address);
11930
11931 fragP->tc_frag_data.prefix_length = padding_size;
11932
11933 /* Update the length for the current iteration. */
11934 left_size = padding_size;
11935 for (next_fragP = fragP;
11936 next_fragP != padding_fragP;
11937 next_fragP = next_fragP->fr_next)
11938 if (next_fragP->fr_type == rs_machine_dependent
11939 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11940 == BRANCH_PREFIX))
11941 {
11942 if (left_size)
11943 {
11944 int max = next_fragP->tc_frag_data.max_bytes;
11945 if (max)
11946 {
11947 int size;
11948 if (max > left_size)
11949 size = left_size;
11950 else
11951 size = max;
11952 left_size -= size;
11953 next_fragP->tc_frag_data.length = size;
11954 }
11955 }
11956 else
11957 next_fragP->tc_frag_data.length = 0;
11958 }
11959
11960 return (fragP->tc_frag_data.length
11961 - fragP->tc_frag_data.last_length);
11962 }
11963 return relax_frag (segment, fragP, stretch);
11964 }
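/* Editor's note: a small trace of the prefix distribution loops above,
   with made-up sizes.  Given three BRANCH_PREFIX frags whose max_bytes
   are 3, 3 and 3 and a computed padding_size of 5, the frags receive
   lengths 3, 2 and 0: each takes min (max_bytes, left_size) until
   left_size is exhausted.  */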
11965
11966 /* md_estimate_size_before_relax()
11967
11968 Called just before relax() for rs_machine_dependent frags. The x86
11969 assembler uses these frags to handle variable size jump
11970 instructions.
11971
11972 Any symbol that is now undefined will not become defined.
11973 Return the correct fr_subtype in the frag.
11974 Return the initial "guess for variable size of frag" to caller.
11975 The guess is actually the growth beyond the fixed part. Whatever
11976 we do to grow the fixed or variable part contributes to our
11977 returned value. */
11978
11979 int
11980 md_estimate_size_before_relax (fragS *fragP, segT segment)
11981 {
11982 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11983 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
11984 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11985 {
11986 i386_classify_machine_dependent_frag (fragP);
11987 return fragP->tc_frag_data.length;
11988 }
11989
11990 /* We've already got fragP->fr_subtype right; all we have to do is
11991 check for un-relaxable symbols. On an ELF system, we can't relax
11992 an externally visible symbol, because it may be overridden by a
11993 shared library. */
11994 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
11995 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11996 || (IS_ELF
11997 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
11998 fragP->fr_var))
11999 #endif
12000 #if defined (OBJ_COFF) && defined (TE_PE)
12001 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
12002 && S_IS_WEAK (fragP->fr_symbol))
12003 #endif
12004 )
12005 {
12006 /* Symbol is undefined in this segment, or we need to keep a
12007 reloc so that weak symbols can be overridden. */
12008 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
12009 enum bfd_reloc_code_real reloc_type;
12010 unsigned char *opcode;
12011 int old_fr_fix;
12012
12013 if (fragP->fr_var != NO_RELOC)
12014 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
12015 else if (size == 2)
12016 reloc_type = BFD_RELOC_16_PCREL;
12017 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12018 else if (need_plt32_p (fragP->fr_symbol))
12019 reloc_type = BFD_RELOC_X86_64_PLT32;
12020 #endif
12021 else
12022 reloc_type = BFD_RELOC_32_PCREL;
12023
12024 old_fr_fix = fragP->fr_fix;
12025 opcode = (unsigned char *) fragP->fr_opcode;
12026
12027 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
12028 {
12029 case UNCOND_JUMP:
12030 /* Make jmp (0xeb) a (d)word displacement jump. */
12031 opcode[0] = 0xe9;
12032 fragP->fr_fix += size;
12033 fix_new (fragP, old_fr_fix, size,
12034 fragP->fr_symbol,
12035 fragP->fr_offset, 1,
12036 reloc_type);
12037 break;
12038
12039 case COND_JUMP86:
12040 if (size == 2
12041 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
12042 {
12043 /* Negate the condition, and branch past an
12044 unconditional jump. */
12045 opcode[0] ^= 1;
12046 opcode[1] = 3;
12047 /* Insert an unconditional jump. */
12048 opcode[2] = 0xe9;
12049 /* We added two extra opcode bytes, and have a two byte
12050 offset. */
12051 fragP->fr_fix += 2 + 2;
12052 fix_new (fragP, old_fr_fix + 2, 2,
12053 fragP->fr_symbol,
12054 fragP->fr_offset, 1,
12055 reloc_type);
12056 break;
12057 }
12058 /* Fall through. */
12059
12060 case COND_JUMP:
12061 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
12062 {
12063 fixS *fixP;
12064
12065 fragP->fr_fix += 1;
12066 fixP = fix_new (fragP, old_fr_fix, 1,
12067 fragP->fr_symbol,
12068 fragP->fr_offset, 1,
12069 BFD_RELOC_8_PCREL);
12070 fixP->fx_signed = 1;
12071 break;
12072 }
12073
12074 /* This changes the byte-displacement jump 0x7N
12075 to the (d)word-displacement jump 0x0f,0x8N. */
12076 opcode[1] = opcode[0] + 0x10;
12077 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12078 /* We've added an opcode byte. */
12079 fragP->fr_fix += 1 + size;
12080 fix_new (fragP, old_fr_fix + 1, size,
12081 fragP->fr_symbol,
12082 fragP->fr_offset, 1,
12083 reloc_type);
12084 break;
12085
12086 default:
12087 BAD_CASE (fragP->fr_subtype);
12088 break;
12089 }
12090 frag_wane (fragP);
12091 return fragP->fr_fix - old_fr_fix;
12092 }
12093
12094 /* Guess size depending on current relax state. Initially the relax
12095 state will correspond to a short jump and we return 1, because
12096 the variable part of the frag (the branch offset) is one byte
12097 long. However, we can relax a section more than once and in that
12098 case we must either set fr_subtype back to the unrelaxed state,
12099 or return the value for the appropriate branch. */
12100 return md_relax_table[fragP->fr_subtype].rlx_length;
12101 }
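/* Editor's note: a byte-level trace of the COND_JUMP promotion above.
   `je .L1' with an unresolvable target starts as 74 xx (2 bytes);
   promotion rewrites it to 0F 84 xx xx xx xx (6 bytes: opcode[1] =
   0x74 + 0x10, opcode[0] = 0F) and emits a 4-byte PC-relative fixup
   (BFD_RELOC_32_PCREL, or PLT32 where needed).  */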
12102
12103 /* Called after relax() is finished.
12104
12105 In: Address of frag.
12106 fr_type == rs_machine_dependent.
12107 fr_subtype is what the address relaxed to.
12108
12109 Out: Any fixSs and constants are set up.
12110 Caller will turn frag into a ".space 0". */
12111
12112 void
12113 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
12114 fragS *fragP)
12115 {
12116 unsigned char *opcode;
12117 unsigned char *where_to_put_displacement = NULL;
12118 offsetT target_address;
12119 offsetT opcode_address;
12120 unsigned int extension = 0;
12121 offsetT displacement_from_opcode_start;
12122
12123 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12124 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
12125 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12126 {
12127 /* Generate nop padding. */
12128 unsigned int size = fragP->tc_frag_data.length;
12129 if (size)
12130 {
12131 if (size > fragP->tc_frag_data.max_bytes)
12132 abort ();
12133
12134 if (flag_debug)
12135 {
12136 const char *msg;
12137 const char *branch = "branch";
12138 const char *prefix = "";
12139 fragS *padding_fragP;
12140 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
12141 == BRANCH_PREFIX)
12142 {
12143 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
12144 switch (fragP->tc_frag_data.default_prefix)
12145 {
12146 default:
12147 abort ();
12148 break;
12149 case CS_PREFIX_OPCODE:
12150 prefix = " cs";
12151 break;
12152 case DS_PREFIX_OPCODE:
12153 prefix = " ds";
12154 break;
12155 case ES_PREFIX_OPCODE:
12156 prefix = " es";
12157 break;
12158 case FS_PREFIX_OPCODE:
12159 prefix = " fs";
12160 break;
12161 case GS_PREFIX_OPCODE:
12162 prefix = " gs";
12163 break;
12164 case SS_PREFIX_OPCODE:
12165 prefix = " ss";
12166 break;
12167 }
12168 if (padding_fragP)
12169 msg = _("%s:%u: add %d%s at 0x%llx to align "
12170 "%s within %d-byte boundary\n");
12171 else
12172 msg = _("%s:%u: add additional %d%s at 0x%llx to "
12173 "align %s within %d-byte boundary\n");
12174 }
12175 else
12176 {
12177 padding_fragP = fragP;
12178 msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
12179 "%s within %d-byte boundary\n");
12180 }
12181
12182 if (padding_fragP)
12183 switch (padding_fragP->tc_frag_data.branch_type)
12184 {
12185 case align_branch_jcc:
12186 branch = "jcc";
12187 break;
12188 case align_branch_fused:
12189 branch = "fused jcc";
12190 break;
12191 case align_branch_jmp:
12192 branch = "jmp";
12193 break;
12194 case align_branch_call:
12195 branch = "call";
12196 break;
12197 case align_branch_indirect:
12198 branch = "indirect branch";
12199 break;
12200 case align_branch_ret:
12201 branch = "ret";
12202 break;
12203 default:
12204 break;
12205 }
12206
12207 fprintf (stdout, msg,
12208 fragP->fr_file, fragP->fr_line, size, prefix,
12209 (long long) fragP->fr_address, branch,
12210 1 << align_branch_power);
12211 }
12212 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12213 memset (fragP->fr_opcode,
12214 fragP->tc_frag_data.default_prefix, size);
12215 else
12216 i386_generate_nops (fragP, (char *) fragP->fr_opcode,
12217 size, 0);
12218 fragP->fr_fix += size;
12219 }
12220 return;
12221 }
12222
12223 opcode = (unsigned char *) fragP->fr_opcode;
12224
12225 /* Address we want to reach in file space. */
12226 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
12227
12228 /* Address opcode resides at in file space. */
12229 opcode_address = fragP->fr_address + fragP->fr_fix;
12230
12231 /* Displacement from opcode start to fill into instruction. */
12232 displacement_from_opcode_start = target_address - opcode_address;
12233
12234 if ((fragP->fr_subtype & BIG) == 0)
12235 {
12236 /* Don't have to change opcode. */
12237 extension = 1; /* 1 opcode + 1 displacement */
12238 where_to_put_displacement = &opcode[1];
12239 }
12240 else
12241 {
12242 if (no_cond_jump_promotion
12243 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
12244 as_warn_where (fragP->fr_file, fragP->fr_line,
12245 _("long jump required"));
12246
12247 switch (fragP->fr_subtype)
12248 {
12249 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
12250 extension = 4; /* 1 opcode + 4 displacement */
12251 opcode[0] = 0xe9;
12252 where_to_put_displacement = &opcode[1];
12253 break;
12254
12255 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
12256 extension = 2; /* 1 opcode + 2 displacement */
12257 opcode[0] = 0xe9;
12258 where_to_put_displacement = &opcode[1];
12259 break;
12260
12261 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
12262 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
12263 extension = 5; /* 2 opcode + 4 displacement */
12264 opcode[1] = opcode[0] + 0x10;
12265 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12266 where_to_put_displacement = &opcode[2];
12267 break;
12268
12269 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
12270 extension = 3; /* 2 opcode + 2 displacement */
12271 opcode[1] = opcode[0] + 0x10;
12272 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12273 where_to_put_displacement = &opcode[2];
12274 break;
12275
12276 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
12277 extension = 4;
12278 opcode[0] ^= 1;
12279 opcode[1] = 3;
12280 opcode[2] = 0xe9;
12281 where_to_put_displacement = &opcode[3];
12282 break;
12283
12284 default:
12285 BAD_CASE (fragP->fr_subtype);
12286 break;
12287 }
12288 }
12289
12290 /* If the size is less than four we are sure that the operand fits,
12291 but if it's 4, then it could be that the displacement is larger
12292 than +/- 2GB. */
12293 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
12294 && object_64bit
12295 && ((addressT) (displacement_from_opcode_start - extension
12296 + ((addressT) 1 << 31))
12297 > (((addressT) 2 << 31) - 1)))
12298 {
12299 as_bad_where (fragP->fr_file, fragP->fr_line,
12300 _("jump target out of range"));
12301 /* Make us emit 0. */
12302 displacement_from_opcode_start = extension;
12303 }
12304 /* Now put displacement after opcode. */
12305 md_number_to_chars ((char *) where_to_put_displacement,
12306 (valueT) (displacement_from_opcode_start - extension),
12307 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
12308 fragP->fr_fix += extension;
12309 }
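/* Editor's note: a worked example of the displacement arithmetic
   above, with made-up addresses.  For a relaxed `jmp' with its E9
   opcode byte at 0x100 (so fr_address + fr_fix == 0x101) and a target
   of 0x180, displacement_from_opcode_start is 0x180 - 0x101 = 0x7f;
   with extension == 4 the stored rel32 is 0x7f - 4 = 0x7b, i.e. the
   target minus the end of the instruction (0x180 - 0x105), as the
   CPU expects.  */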
12310 \f
12311 /* Apply a fixup (fixP) to segment data, once it has been determined
12312 by our caller that we have all the info we need to fix it up.
12313
12314 Parameter valP is the pointer to the value of the bits.
12315
12316 On the 386, immediates, displacements, and data pointers are all in
12317 the same (little-endian) format, so we don't need to care about which
12318 we are handling. */
12319
12320 void
12321 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
12322 {
12323 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
12324 valueT value = *valP;
12325
12326 #if !defined (TE_Mach)
12327 if (fixP->fx_pcrel)
12328 {
12329 switch (fixP->fx_r_type)
12330 {
12331 default:
12332 break;
12333
12334 case BFD_RELOC_64:
12335 fixP->fx_r_type = BFD_RELOC_64_PCREL;
12336 break;
12337 case BFD_RELOC_32:
12338 case BFD_RELOC_X86_64_32S:
12339 fixP->fx_r_type = BFD_RELOC_32_PCREL;
12340 break;
12341 case BFD_RELOC_16:
12342 fixP->fx_r_type = BFD_RELOC_16_PCREL;
12343 break;
12344 case BFD_RELOC_8:
12345 fixP->fx_r_type = BFD_RELOC_8_PCREL;
12346 break;
12347 }
12348 }
12349
12350 if (fixP->fx_addsy != NULL
12351 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
12352 || fixP->fx_r_type == BFD_RELOC_64_PCREL
12353 || fixP->fx_r_type == BFD_RELOC_16_PCREL
12354 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
12355 && !use_rela_relocations)
12356 {
12357 /* This is a hack. There should be a better way to handle this.
12358 This covers for the fact that bfd_install_relocation will
12359 subtract the current location (for partial_inplace, PC relative
12360 relocations); see more below. */
12361 #ifndef OBJ_AOUT
12362 if (IS_ELF
12363 #ifdef TE_PE
12364 || OUTPUT_FLAVOR == bfd_target_coff_flavour
12365 #endif
12366 )
12367 value += fixP->fx_where + fixP->fx_frag->fr_address;
12368 #endif
12369 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12370 if (IS_ELF)
12371 {
12372 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
12373
12374 if ((sym_seg == seg
12375 || (symbol_section_p (fixP->fx_addsy)
12376 && sym_seg != absolute_section))
12377 && !generic_force_reloc (fixP))
12378 {
12379 /* Yes, we add the values in twice. This is because
12380 bfd_install_relocation subtracts them out again. I think
12381 bfd_install_relocation is broken, but I don't dare change
12382 it. FIXME. */
12383 value += fixP->fx_where + fixP->fx_frag->fr_address;
12384 }
12385 }
12386 #endif
12387 #if defined (OBJ_COFF) && defined (TE_PE)
12388 /* For some reason, the PE format does not store a
12389 section address offset for a PC relative symbol. */
12390 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
12391 || S_IS_WEAK (fixP->fx_addsy))
12392 value += md_pcrel_from (fixP);
12393 #endif
12394 }
12395 #if defined (OBJ_COFF) && defined (TE_PE)
12396 if (fixP->fx_addsy != NULL
12397 && S_IS_WEAK (fixP->fx_addsy)
12398 /* PR 16858: Do not modify weak function references. */
12399 && ! fixP->fx_pcrel)
12400 {
12401 #if !defined (TE_PEP)
12402 /* On x86 PE, weak function symbols are neither PC-relative
12403 nor do they set S_IS_FUNCTION. So the only reliable way
12404 to detect them is to check the flags of their containing
12405 section. */
12406 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
12407 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
12408 ;
12409 else
12410 #endif
12411 value -= S_GET_VALUE (fixP->fx_addsy);
12412 }
12413 #endif
12414
12415 /* Fix a few things - the dynamic linker expects certain values here,
12416 and we must not disappoint it. */
12417 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12418 if (IS_ELF && fixP->fx_addsy)
12419 switch (fixP->fx_r_type)
12420 {
12421 case BFD_RELOC_386_PLT32:
12422 case BFD_RELOC_X86_64_PLT32:
12423 /* Make the jump instruction point to the address of the operand.
12424 At runtime we merely add the offset to the actual PLT entry.
12425 NB: Subtract the offset size only for jump instructions. */
12426 if (fixP->fx_pcrel)
12427 value = -4;
12428 break;
12429
12430 case BFD_RELOC_386_TLS_GD:
12431 case BFD_RELOC_386_TLS_LDM:
12432 case BFD_RELOC_386_TLS_IE_32:
12433 case BFD_RELOC_386_TLS_IE:
12434 case BFD_RELOC_386_TLS_GOTIE:
12435 case BFD_RELOC_386_TLS_GOTDESC:
12436 case BFD_RELOC_X86_64_TLSGD:
12437 case BFD_RELOC_X86_64_TLSLD:
12438 case BFD_RELOC_X86_64_GOTTPOFF:
12439 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
12440 value = 0; /* Fully resolved at runtime. No addend. */
12441 /* Fallthrough */
12442 case BFD_RELOC_386_TLS_LE:
12443 case BFD_RELOC_386_TLS_LDO_32:
12444 case BFD_RELOC_386_TLS_LE_32:
12445 case BFD_RELOC_X86_64_DTPOFF32:
12446 case BFD_RELOC_X86_64_DTPOFF64:
12447 case BFD_RELOC_X86_64_TPOFF32:
12448 case BFD_RELOC_X86_64_TPOFF64:
12449 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12450 break;
12451
12452 case BFD_RELOC_386_TLS_DESC_CALL:
12453 case BFD_RELOC_X86_64_TLSDESC_CALL:
12454 value = 0; /* Fully resolved at runtime. No addend. */
12455 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12456 fixP->fx_done = 0;
12457 return;
12458
12459 case BFD_RELOC_VTABLE_INHERIT:
12460 case BFD_RELOC_VTABLE_ENTRY:
12461 fixP->fx_done = 0;
12462 return;
12463
12464 default:
12465 break;
12466 }
12467 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
12468 *valP = value;
12469 #endif /* !defined (TE_Mach) */
12470
12471 /* Are we finished with this relocation now? */
12472 if (fixP->fx_addsy == NULL)
12473 fixP->fx_done = 1;
12474 #if defined (OBJ_COFF) && defined (TE_PE)
12475 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
12476 {
12477 fixP->fx_done = 0;
12478 /* Remember value for tc_gen_reloc. */
12479 fixP->fx_addnumber = value;
12480 /* Clear out the frag for now. */
12481 value = 0;
12482 }
12483 #endif
12484 else if (use_rela_relocations)
12485 {
12486 fixP->fx_no_overflow = 1;
12487 /* Remember value for tc_gen_reloc. */
12488 fixP->fx_addnumber = value;
12489 value = 0;
12490 }
12491
12492 md_number_to_chars (p, value, fixP->fx_size);
12493 }
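/* Editor's note: e.g. for `call foo@PLT' the PLT32 case above stores
   the constant -4 in the 4-byte field, so that once the linker adds
   the distance to the PLT entry the result is relative to the end of
   the call instruction.  */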
12494 \f
12495 const char *
12496 md_atof (int type, char *litP, int *sizeP)
12497 {
12498 /* This outputs the LITTLENUMs in REVERSE order;
12499 in accord with the little-endian 386. */
12500 return ieee_md_atof (type, litP, sizeP, FALSE);
12501 }
12502 \f
12503 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
12504
12505 static char *
12506 output_invalid (int c)
12507 {
12508 if (ISPRINT (c))
12509 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12510 "'%c'", c);
12511 else
12512 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12513 "(0x%x)", (unsigned char) c);
12514 return output_invalid_buf;
12515 }
12516
12517 /* Verify that @r can be used in the current context. */
12518
12519 static bfd_boolean check_register (const reg_entry *r)
12520 {
12521 if (allow_pseudo_reg)
12522 return TRUE;
12523
12524 if (operand_type_all_zero (&r->reg_type))
12525 return FALSE;
12526
12527 if ((r->reg_type.bitfield.dword
12528 || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
12529 || r->reg_type.bitfield.class == RegCR
12530 || r->reg_type.bitfield.class == RegDR)
12531 && !cpu_arch_flags.bitfield.cpui386)
12532 return FALSE;
12533
12534 if (r->reg_type.bitfield.class == RegTR
12535 && (flag_code == CODE_64BIT
12536 || !cpu_arch_flags.bitfield.cpui386
12537 || cpu_arch_isa_flags.bitfield.cpui586
12538 || cpu_arch_isa_flags.bitfield.cpui686))
12539 return FALSE;
12540
12541 if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
12542 return FALSE;
12543
12544 if (!cpu_arch_flags.bitfield.cpuavx512f)
12545 {
12546 if (r->reg_type.bitfield.zmmword
12547 || r->reg_type.bitfield.class == RegMask)
12548 return FALSE;
12549
12550 if (!cpu_arch_flags.bitfield.cpuavx)
12551 {
12552 if (r->reg_type.bitfield.ymmword)
12553 return FALSE;
12554
12555 if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
12556 return FALSE;
12557 }
12558 }
12559
12560 if (r->reg_type.bitfield.tmmword
12561 && (!cpu_arch_flags.bitfield.cpuamx_tile
12562 || flag_code != CODE_64BIT))
12563 return FALSE;
12564
12565 if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
12566 return FALSE;
12567
12568 /* Don't allow the fake index register unless allow_index_reg is non-zero. */
12569 if (!allow_index_reg && r->reg_num == RegIZ)
12570 return FALSE;
12571
12572 /* Upper 16 vector registers are only available with VREX in 64bit
12573 mode, and require EVEX encoding. */
12574 if (r->reg_flags & RegVRex)
12575 {
12576 if (!cpu_arch_flags.bitfield.cpuavx512f
12577 || flag_code != CODE_64BIT)
12578 return FALSE;
12579
12580 if (i.vec_encoding == vex_encoding_default)
12581 i.vec_encoding = vex_encoding_evex;
12582 else if (i.vec_encoding != vex_encoding_evex)
12583 i.vec_encoding = vex_encoding_error;
12584 }
12585
12586 if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
12587 && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
12588 && flag_code != CODE_64BIT)
12589 return FALSE;
12590
12591 if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
12592 && !intel_syntax)
12593 return FALSE;
12594
12595 return TRUE;
12596 }
12597
12598 /* REG_STRING starts *before* REGISTER_PREFIX. */
12599
12600 static const reg_entry *
12601 parse_real_register (char *reg_string, char **end_op)
12602 {
12603 char *s = reg_string;
12604 char *p;
12605 char reg_name_given[MAX_REG_NAME_SIZE + 1];
12606 const reg_entry *r;
12607
12608 /* Skip possible REGISTER_PREFIX and possible whitespace. */
12609 if (*s == REGISTER_PREFIX)
12610 ++s;
12611
12612 if (is_space_char (*s))
12613 ++s;
12614
12615 p = reg_name_given;
12616 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
12617 {
12618 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
12619 return (const reg_entry *) NULL;
12620 s++;
12621 }
12622
12623 /* For naked regs, make sure that we are not dealing with an identifier.
12624 This prevents confusing an identifier like `eax_var' with register
12625 `eax'. */
12626 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
12627 return (const reg_entry *) NULL;
12628
12629 *end_op = s;
12630
12631 r = (const reg_entry *) str_hash_find (reg_hash, reg_name_given);
12632
12633 /* Handle floating point regs, allowing spaces in the (i) part. */
12634 if (r == i386_regtab /* %st is first entry of table */)
12635 {
12636 if (!cpu_arch_flags.bitfield.cpu8087
12637 && !cpu_arch_flags.bitfield.cpu287
12638 && !cpu_arch_flags.bitfield.cpu387
12639 && !allow_pseudo_reg)
12640 return (const reg_entry *) NULL;
12641
12642 if (is_space_char (*s))
12643 ++s;
12644 if (*s == '(')
12645 {
12646 ++s;
12647 if (is_space_char (*s))
12648 ++s;
12649 if (*s >= '0' && *s <= '7')
12650 {
12651 int fpr = *s - '0';
12652 ++s;
12653 if (is_space_char (*s))
12654 ++s;
12655 if (*s == ')')
12656 {
12657 *end_op = s + 1;
12658 r = (const reg_entry *) str_hash_find (reg_hash, "st(0)");
12659 know (r);
12660 return r + fpr;
12661 }
12662 }
12663 /* We have "%st(" then garbage. */
12664 return (const reg_entry *) NULL;
12665 }
12666 }
12667
12668 return r && check_register (r) ? r : NULL;
12669 }
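/* Editor's note: a sketch of the FP-register special case above;
   hypothetical call, not compiled.  */
#if 0
  char *end;
  /* Spaces are allowed inside the parentheses, so this resolves to
     the table entry for st(0) plus 2, with *end past the ')'.  */
  const reg_entry *r = parse_real_register ("%st ( 2 )", &end);
#endif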
12670
12671 /* REG_STRING starts *before* REGISTER_PREFIX. */
12672
12673 static const reg_entry *
12674 parse_register (char *reg_string, char **end_op)
12675 {
12676 const reg_entry *r;
12677
12678 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
12679 r = parse_real_register (reg_string, end_op);
12680 else
12681 r = NULL;
12682 if (!r)
12683 {
12684 char *save = input_line_pointer;
12685 char c;
12686 symbolS *symbolP;
12687
12688 input_line_pointer = reg_string;
12689 c = get_symbol_name (&reg_string);
12690 symbolP = symbol_find (reg_string);
12691 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
12692 {
12693 const expressionS *e = symbol_get_value_expression (symbolP);
12694
12695 know (e->X_op == O_register);
12696 know (e->X_add_number >= 0
12697 && (valueT) e->X_add_number < i386_regtab_size);
12698 r = i386_regtab + e->X_add_number;
12699 if (!check_register (r))
12700 {
12701 as_bad (_("register '%s%s' cannot be used here"),
12702 register_prefix, r->reg_name);
12703 r = &bad_reg;
12704 }
12705 *end_op = input_line_pointer;
12706 }
12707 *input_line_pointer = c;
12708 input_line_pointer = save;
12709 }
12710 return r;
12711 }
12712
12713 int
12714 i386_parse_name (char *name, expressionS *e, char *nextcharP)
12715 {
12716 const reg_entry *r;
12717 char *end = input_line_pointer;
12718
12719 *end = *nextcharP;
12720 r = parse_register (name, &input_line_pointer);
12721 if (r && end <= input_line_pointer)
12722 {
12723 *nextcharP = *input_line_pointer;
12724 *input_line_pointer = 0;
12725 if (r != &bad_reg)
12726 {
12727 e->X_op = O_register;
12728 e->X_add_number = r - i386_regtab;
12729 }
12730 else
12731 e->X_op = O_illegal;
12732 return 1;
12733 }
12734 input_line_pointer = end;
12735 *end = 0;
12736 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
12737 }
12738
12739 void
12740 md_operand (expressionS *e)
12741 {
12742 char *end;
12743 const reg_entry *r;
12744
12745 switch (*input_line_pointer)
12746 {
12747 case REGISTER_PREFIX:
12748 r = parse_real_register (input_line_pointer, &end);
12749 if (r)
12750 {
12751 e->X_op = O_register;
12752 e->X_add_number = r - i386_regtab;
12753 input_line_pointer = end;
12754 }
12755 break;
12756
12757 case '[':
12758 gas_assert (intel_syntax);
12759 end = input_line_pointer++;
12760 expression (e);
12761 if (*input_line_pointer == ']')
12762 {
12763 ++input_line_pointer;
12764 e->X_op_symbol = make_expr_symbol (e);
12765 e->X_add_symbol = NULL;
12766 e->X_add_number = 0;
12767 e->X_op = O_index;
12768 }
12769 else
12770 {
12771 e->X_op = O_absent;
12772 input_line_pointer = end;
12773 }
12774 break;
12775 }
12776 }
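/* Editor's note: the '[' case above is what lets an Intel-syntax
   operand such as `mov eax, [foo + 4]' parse: the bracketed
   expression is wrapped into an O_index expression symbol for the
   Intel-syntax operand code to consume later.  */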
12777
12778 \f
12779 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12780 const char *md_shortopts = "kVQ:sqnO::";
12781 #else
12782 const char *md_shortopts = "qnO::";
12783 #endif
12784
12785 #define OPTION_32 (OPTION_MD_BASE + 0)
12786 #define OPTION_64 (OPTION_MD_BASE + 1)
12787 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
12788 #define OPTION_MARCH (OPTION_MD_BASE + 3)
12789 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
12790 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
12791 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
12792 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
12793 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
12794 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
12795 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
12796 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
12797 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
12798 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
12799 #define OPTION_X32 (OPTION_MD_BASE + 14)
12800 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
12801 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
12802 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
12803 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
12804 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
12805 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
12806 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
12807 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
12808 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
12809 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
12810 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
12811 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
12812 #define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
12813 #define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
12814 #define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
12815 #define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
12816 #define OPTION_MLFENCE_AFTER_LOAD (OPTION_MD_BASE + 31)
12817 #define OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH (OPTION_MD_BASE + 32)
12818 #define OPTION_MLFENCE_BEFORE_RET (OPTION_MD_BASE + 33)
12819
12820 struct option md_longopts[] =
12821 {
12822 {"32", no_argument, NULL, OPTION_32},
12823 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12824 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12825 {"64", no_argument, NULL, OPTION_64},
12826 #endif
12827 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12828 {"x32", no_argument, NULL, OPTION_X32},
12829 {"mshared", no_argument, NULL, OPTION_MSHARED},
12830 {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
12831 #endif
12832 {"divide", no_argument, NULL, OPTION_DIVIDE},
12833 {"march", required_argument, NULL, OPTION_MARCH},
12834 {"mtune", required_argument, NULL, OPTION_MTUNE},
12835 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
12836 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
12837 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
12838 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
12839 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
12840 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
12841 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
12842 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
12843 {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
12844 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
12845 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
12846 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
12847 # if defined (TE_PE) || defined (TE_PEP)
12848 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
12849 #endif
12850 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
12851 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
12852 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
12853 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
12854 {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
12855 {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
12856 {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
12857 {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
12858 {"mlfence-after-load", required_argument, NULL, OPTION_MLFENCE_AFTER_LOAD},
12859 {"mlfence-before-indirect-branch", required_argument, NULL,
12860 OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH},
12861 {"mlfence-before-ret", required_argument, NULL, OPTION_MLFENCE_BEFORE_RET},
12862 {"mamd64", no_argument, NULL, OPTION_MAMD64},
12863 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
12864 {NULL, no_argument, NULL, 0}
12865 };
12866 size_t md_longopts_size = sizeof (md_longopts);
12867
12868 int
12869 md_parse_option (int c, const char *arg)
12870 {
12871 unsigned int j;
12872 char *arch, *next, *saved, *type;
12873
12874 switch (c)
12875 {
12876 case 'n':
12877 optimize_align_code = 0;
12878 break;
12879
12880 case 'q':
12881 quiet_warnings = 1;
12882 break;
12883
12884 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12885 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
12886 should be emitted or not. FIXME: Not implemented. */
12887 case 'Q':
12888 if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
12889 return 0;
12890 break;
12891
12892 /* -V: SVR4 argument to print version ID. */
12893 case 'V':
12894 print_version_id ();
12895 break;
12896
12897 /* -k: Ignore for FreeBSD compatibility. */
12898 case 'k':
12899 break;
12900
12901 case 's':
12902 /* -s: On i386 Solaris, this tells the native assembler to use
12903 .stab instead of .stab.excl. We always use .stab anyhow. */
12904 break;
12905
12906 case OPTION_MSHARED:
12907 shared = 1;
12908 break;
12909
12910 case OPTION_X86_USED_NOTE:
12911 if (strcasecmp (arg, "yes") == 0)
12912 x86_used_note = 1;
12913 else if (strcasecmp (arg, "no") == 0)
12914 x86_used_note = 0;
12915 else
12916 as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
12917 break;
12918
12919
12920 #endif
12921 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12922 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12923 case OPTION_64:
12924 {
12925 const char **list, **l;
12926
12927 list = bfd_target_list ();
12928 for (l = list; *l != NULL; l++)
12929 if (CONST_STRNEQ (*l, "elf64-x86-64")
12930 || strcmp (*l, "coff-x86-64") == 0
12931 || strcmp (*l, "pe-x86-64") == 0
12932 || strcmp (*l, "pei-x86-64") == 0
12933 || strcmp (*l, "mach-o-x86-64") == 0)
12934 {
12935 default_arch = "x86_64";
12936 break;
12937 }
12938 if (*l == NULL)
12939 as_fatal (_("no compiled in support for x86_64"));
12940 free (list);
12941 }
12942 break;
12943 #endif
12944
12945 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12946 case OPTION_X32:
12947 if (IS_ELF)
12948 {
12949 const char **list, **l;
12950
12951 list = bfd_target_list ();
12952 for (l = list; *l != NULL; l++)
12953 if (CONST_STRNEQ (*l, "elf32-x86-64"))
12954 {
12955 default_arch = "x86_64:32";
12956 break;
12957 }
12958 if (*l == NULL)
12959 as_fatal (_("no compiled in support for 32bit x86_64"));
12960 free (list);
12961 }
12962 else
12963 as_fatal (_("32bit x86_64 is only supported for ELF"));
12964 break;
12965 #endif
12966
12967 case OPTION_32:
12968 default_arch = "i386";
12969 break;
12970
12971 case OPTION_DIVIDE:
12972 #ifdef SVR4_COMMENT_CHARS
12973 {
12974 char *n, *t;
12975 const char *s;
12976
12977 n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
12978 t = n;
12979 for (s = i386_comment_chars; *s != '\0'; s++)
12980 if (*s != '/')
12981 *t++ = *s;
12982 *t = '\0';
12983 i386_comment_chars = n;
12984 }
12985 #endif
12986 break;
12987
12988 case OPTION_MARCH:
12989 saved = xstrdup (arg);
12990 arch = saved;
12991 /* Allow -march=+nosse. */
12992 if (*arch == '+')
12993 arch++;
12994 do
12995 {
12996 if (*arch == '.')
12997 as_fatal (_("invalid -march= option: `%s'"), arg);
12998 next = strchr (arch, '+');
12999 if (next)
13000 *next++ = '\0';
13001 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13002 {
13003 if (strcmp (arch, cpu_arch [j].name) == 0)
13004 {
13005 /* Processor. */
13006 if (! cpu_arch[j].flags.bitfield.cpui386)
13007 continue;
13008
13009 cpu_arch_name = cpu_arch[j].name;
13010 cpu_sub_arch_name = NULL;
13011 cpu_arch_flags = cpu_arch[j].flags;
13012 cpu_arch_isa = cpu_arch[j].type;
13013 cpu_arch_isa_flags = cpu_arch[j].flags;
13014 if (!cpu_arch_tune_set)
13015 {
13016 cpu_arch_tune = cpu_arch_isa;
13017 cpu_arch_tune_flags = cpu_arch_isa_flags;
13018 }
13019 break;
13020 }
13021 else if (*cpu_arch [j].name == '.'
13022 && strcmp (arch, cpu_arch [j].name + 1) == 0)
13023 {
13024 /* ISA extension. */
13025 i386_cpu_flags flags;
13026
13027 flags = cpu_flags_or (cpu_arch_flags,
13028 cpu_arch[j].flags);
13029
13030 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
13031 {
13032 if (cpu_sub_arch_name)
13033 {
13034 char *name = cpu_sub_arch_name;
13035 cpu_sub_arch_name = concat (name,
13036 cpu_arch[j].name,
13037 (const char *) NULL);
13038 free (name);
13039 }
13040 else
13041 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
13042 cpu_arch_flags = flags;
13043 cpu_arch_isa_flags = flags;
13044 }
13045 else
13046 cpu_arch_isa_flags
13047 = cpu_flags_or (cpu_arch_isa_flags,
13048 cpu_arch[j].flags);
13049 break;
13050 }
13051 }
13052
13053 if (j >= ARRAY_SIZE (cpu_arch))
13054 {
13055 /* Disable an ISA extension. */
13056 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
13057 if (strcmp (arch, cpu_noarch [j].name) == 0)
13058 {
13059 i386_cpu_flags flags;
13060
13061 flags = cpu_flags_and_not (cpu_arch_flags,
13062 cpu_noarch[j].flags);
13063 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
13064 {
13065 if (cpu_sub_arch_name)
13066 {
13067 char *name = cpu_sub_arch_name;
13068 cpu_sub_arch_name = concat (name, arch,
13069 (const char *) NULL);
13070 free (name);
13071 }
13072 else
13073 cpu_sub_arch_name = xstrdup (arch);
13074 cpu_arch_flags = flags;
13075 cpu_arch_isa_flags = flags;
13076 }
13077 break;
13078 }
13079
13080 if (j >= ARRAY_SIZE (cpu_noarch))
13081 j = ARRAY_SIZE (cpu_arch);
13082 }
13083
13084 if (j >= ARRAY_SIZE (cpu_arch))
13085 as_fatal (_("invalid -march= option: `%s'"), arg);
13086
13087 arch = next;
13088 }
13089 while (next != NULL);
13090 free (saved);
13091 break;
13092
13093 case OPTION_MTUNE:
13094 if (*arg == '.')
13095 as_fatal (_("invalid -mtune= option: `%s'"), arg);
13096 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13097 {
13098 if (strcmp (arg, cpu_arch [j].name) == 0)
13099 {
13100 cpu_arch_tune_set = 1;
13101 cpu_arch_tune = cpu_arch [j].type;
13102 cpu_arch_tune_flags = cpu_arch[j].flags;
13103 break;
13104 }
13105 }
13106 if (j >= ARRAY_SIZE (cpu_arch))
13107 as_fatal (_("invalid -mtune= option: `%s'"), arg);
13108 break;
13109
13110 case OPTION_MMNEMONIC:
13111 if (strcasecmp (arg, "att") == 0)
13112 intel_mnemonic = 0;
13113 else if (strcasecmp (arg, "intel") == 0)
13114 intel_mnemonic = 1;
13115 else
13116 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
13117 break;
13118
13119 case OPTION_MSYNTAX:
13120 if (strcasecmp (arg, "att") == 0)
13121 intel_syntax = 0;
13122 else if (strcasecmp (arg, "intel") == 0)
13123 intel_syntax = 1;
13124 else
13125 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
13126 break;
13127
13128 case OPTION_MINDEX_REG:
13129 allow_index_reg = 1;
13130 break;
13131
13132 case OPTION_MNAKED_REG:
13133 allow_naked_reg = 1;
13134 break;
13135
13136 case OPTION_MSSE2AVX:
13137 sse2avx = 1;
13138 break;
13139
13140 case OPTION_MSSE_CHECK:
13141 if (strcasecmp (arg, "error") == 0)
13142 sse_check = check_error;
13143 else if (strcasecmp (arg, "warning") == 0)
13144 sse_check = check_warning;
13145 else if (strcasecmp (arg, "none") == 0)
13146 sse_check = check_none;
13147 else
13148 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
13149 break;
13150
13151 case OPTION_MOPERAND_CHECK:
13152 if (strcasecmp (arg, "error") == 0)
13153 operand_check = check_error;
13154 else if (strcasecmp (arg, "warning") == 0)
13155 operand_check = check_warning;
13156 else if (strcasecmp (arg, "none") == 0)
13157 operand_check = check_none;
13158 else
13159 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
13160 break;
13161
13162 case OPTION_MAVXSCALAR:
13163 if (strcasecmp (arg, "128") == 0)
13164 avxscalar = vex128;
13165 else if (strcasecmp (arg, "256") == 0)
13166 avxscalar = vex256;
13167 else
13168 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
13169 break;
13170
13171 case OPTION_MVEXWIG:
13172 if (strcmp (arg, "0") == 0)
13173 vexwig = vexw0;
13174 else if (strcmp (arg, "1") == 0)
13175 vexwig = vexw1;
13176 else
13177 as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
13178 break;
13179
13180 case OPTION_MADD_BND_PREFIX:
13181 add_bnd_prefix = 1;
13182 break;
13183
13184 case OPTION_MEVEXLIG:
13185 if (strcmp (arg, "128") == 0)
13186 evexlig = evexl128;
13187 else if (strcmp (arg, "256") == 0)
13188 evexlig = evexl256;
13189 else if (strcmp (arg, "512") == 0)
13190 evexlig = evexl512;
13191 else
13192 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
13193 break;
13194
13195 case OPTION_MEVEXRCIG:
13196 if (strcmp (arg, "rne") == 0)
13197 evexrcig = rne;
13198 else if (strcmp (arg, "rd") == 0)
13199 evexrcig = rd;
13200 else if (strcmp (arg, "ru") == 0)
13201 evexrcig = ru;
13202 else if (strcmp (arg, "rz") == 0)
13203 evexrcig = rz;
13204 else
13205 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
13206 break;
13207
13208 case OPTION_MEVEXWIG:
13209 if (strcmp (arg, "0") == 0)
13210 evexwig = evexw0;
13211 else if (strcmp (arg, "1") == 0)
13212 evexwig = evexw1;
13213 else
13214 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
13215 break;
13216
13217 # if defined (TE_PE) || defined (TE_PEP)
13218 case OPTION_MBIG_OBJ:
13219 use_big_obj = 1;
13220 break;
13221 #endif
13222
13223 case OPTION_MOMIT_LOCK_PREFIX:
13224 if (strcasecmp (arg, "yes") == 0)
13225 omit_lock_prefix = 1;
13226 else if (strcasecmp (arg, "no") == 0)
13227 omit_lock_prefix = 0;
13228 else
13229 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
13230 break;
13231
13232 case OPTION_MFENCE_AS_LOCK_ADD:
13233 if (strcasecmp (arg, "yes") == 0)
13234 avoid_fence = 1;
13235 else if (strcasecmp (arg, "no") == 0)
13236 avoid_fence = 0;
13237 else
13238 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
13239 break;
13240
13241 case OPTION_MLFENCE_AFTER_LOAD:
13242 if (strcasecmp (arg, "yes") == 0)
13243 lfence_after_load = 1;
13244 else if (strcasecmp (arg, "no") == 0)
13245 lfence_after_load = 0;
13246 else
13247 as_fatal (_("invalid -mlfence-after-load= option: `%s'"), arg);
13248 break;
13249
13250 case OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH:
13251 if (strcasecmp (arg, "all") == 0)
13252 {
13253 lfence_before_indirect_branch = lfence_branch_all;
13254 if (lfence_before_ret == lfence_before_ret_none)
13255 lfence_before_ret = lfence_before_ret_shl;
13256 }
13257 else if (strcasecmp (arg, "memory") == 0)
13258 lfence_before_indirect_branch = lfence_branch_memory;
13259 else if (strcasecmp (arg, "register") == 0)
13260 lfence_before_indirect_branch = lfence_branch_register;
13261 else if (strcasecmp (arg, "none") == 0)
13262 lfence_before_indirect_branch = lfence_branch_none;
13263 else
13264 as_fatal (_("invalid -mlfence-before-indirect-branch= option: `%s'"),
13265 arg);
13266 break;
13267
13268 case OPTION_MLFENCE_BEFORE_RET:
13269 if (strcasecmp (arg, "or") == 0)
13270 lfence_before_ret = lfence_before_ret_or;
13271 else if (strcasecmp (arg, "not") == 0)
13272 lfence_before_ret = lfence_before_ret_not;
13273 else if (strcasecmp (arg, "shl") == 0 || strcasecmp (arg, "yes") == 0)
13274 lfence_before_ret = lfence_before_ret_shl;
13275 else if (strcasecmp (arg, "none") == 0)
13276 lfence_before_ret = lfence_before_ret_none;
13277 else
13278 as_fatal (_("invalid -mlfence-before-ret= option: `%s'"),
13279 arg);
13280 break;
13281
13282 case OPTION_MRELAX_RELOCATIONS:
13283 if (strcasecmp (arg, "yes") == 0)
13284 generate_relax_relocations = 1;
13285 else if (strcasecmp (arg, "no") == 0)
13286 generate_relax_relocations = 0;
13287 else
13288 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
13289 break;
13290
13291 case OPTION_MALIGN_BRANCH_BOUNDARY:
13292 {
13293 char *end;
13294 long int align = strtoul (arg, &end, 0);
13295 if (*end == '\0')
13296 {
13297 if (align == 0)
13298 {
13299 align_branch_power = 0;
13300 break;
13301 }
13302 else if (align >= 16)
13303 {
13304 int align_power;
13305 for (align_power = 0;
13306 (align & 1) == 0;
13307 align >>= 1, align_power++)
13308 continue;
13309 /* Limit alignment power to 31. */
13310 if (align == 1 && align_power < 32)
13311 {
13312 align_branch_power = align_power;
13313 break;
13314 }
13315 }
13316 }
13317 as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
13318 }
13319 break;
13320
13321 case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
13322 {
13323 char *end;
13324 int align = strtoul (arg, &end, 0);
13325 /* Some processors only support 5 prefixes. */
13326 if (*end == '\0' && align >= 0 && align < 6)
13327 {
13328 align_branch_prefix_size = align;
13329 break;
13330 }
13331 as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
13332 arg);
13333 }
13334 break;
13335
13336 case OPTION_MALIGN_BRANCH:
13337 align_branch = 0;
13338 saved = xstrdup (arg);
13339 type = saved;
13340 do
13341 {
13342 next = strchr (type, '+');
13343 if (next)
13344 *next++ = '\0';
13345 if (strcasecmp (type, "jcc") == 0)
13346 align_branch |= align_branch_jcc_bit;
13347 else if (strcasecmp (type, "fused") == 0)
13348 align_branch |= align_branch_fused_bit;
13349 else if (strcasecmp (type, "jmp") == 0)
13350 align_branch |= align_branch_jmp_bit;
13351 else if (strcasecmp (type, "call") == 0)
13352 align_branch |= align_branch_call_bit;
13353 else if (strcasecmp (type, "ret") == 0)
13354 align_branch |= align_branch_ret_bit;
13355 else if (strcasecmp (type, "indirect") == 0)
13356 align_branch |= align_branch_indirect_bit;
13357 else
13358 as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
13359 type = next;
13360 }
13361 while (next != NULL);
13362 free (saved);
13363 break;
13364
13365 case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
13366 align_branch_power = 5;
13367 align_branch_prefix_size = 5;
13368 align_branch = (align_branch_jcc_bit
13369 | align_branch_fused_bit
13370 | align_branch_jmp_bit);
13371 break;
13372
13373 case OPTION_MAMD64:
13374 isa64 = amd64;
13375 break;
13376
13377 case OPTION_MINTEL64:
13378 isa64 = intel64;
13379 break;
13380
13381 case 'O':
13382 if (arg == NULL)
13383 {
13384 optimize = 1;
13385 /* Turn off -Os. */
13386 optimize_for_space = 0;
13387 }
13388 else if (*arg == 's')
13389 {
13390 optimize_for_space = 1;
13391 /* Turn on all encoding optimizations. */
13392 optimize = INT_MAX;
13393 }
13394 else
13395 {
13396 optimize = atoi (arg);
13397 /* Turn off -Os. */
13398 optimize_for_space = 0;
13399 }
13400 break;
13401
13402 default:
13403 return 0;
13404 }
13405 return 1;
13406 }
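/* Editor's note: as handled above, the umbrella option
   -mbranches-within-32B-boundaries is equivalent to
   -malign-branch-boundary=32 -malign-branch-prefix-size=5
   -malign-branch=jcc+fused+jmp.  */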
13407
13408 #define MESSAGE_TEMPLATE \
13409 " "
13410
13411 static char *
13412 output_message (FILE *stream, char *p, char *message, char *start,
13413 int *left_p, const char *name, int len)
13414 {
13415 int size = sizeof (MESSAGE_TEMPLATE);
13416 int left = *left_p;
13417
13418 /* Reserve 2 spaces for ", " or ",\0" */
13419 left -= len + 2;
13420
13421 /* Check if there is any room. */
13422 if (left >= 0)
13423 {
13424 if (p != start)
13425 {
13426 *p++ = ',';
13427 *p++ = ' ';
13428 }
13429 p = mempcpy (p, name, len);
13430 }
13431 else
13432 {
13433 /* Output the current message now and start a new one. */
13434 *p++ = ',';
13435 *p = '\0';
13436 fprintf (stream, "%s\n", message);
13437 p = start;
13438 left = size - (start - message) - len - 2;
13439
13440 gas_assert (left >= 0);
13441
13442 p = mempcpy (p, name, len);
13443 }
13444
13445 *left_p = left;
13446 return p;
13447 }
13448
13449 static void
13450 show_arch (FILE *stream, int ext, int check)
13451 {
13452 static char message[] = MESSAGE_TEMPLATE;
13453 char *start = message + 27;
13454 char *p;
13455 int size = sizeof (MESSAGE_TEMPLATE);
13456 int left;
13457 const char *name;
13458 int len;
13459 unsigned int j;
13460
13461 p = start;
13462 left = size - (start - message);
13463 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13464 {
13465 /* Should it be skipped? */
13466 if (cpu_arch [j].skip)
13467 continue;
13468
13469 name = cpu_arch [j].name;
13470 len = cpu_arch [j].len;
13471 if (*name == '.')
13472 {
13473 /* It is an extension. Skip if we aren't asked to show it. */
13474 if (ext)
13475 {
13476 name++;
13477 len--;
13478 }
13479 else
13480 continue;
13481 }
13482 else if (ext)
13483 {
13484 /* It is a processor. Skip if we only show extensions. */
13485 continue;
13486 }
13487 else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
13488 {
13489 /* It is an impossible processor - skip. */
13490 continue;
13491 }
13492
13493 p = output_message (stream, p, message, start, &left, name, len);
13494 }
13495
13496 /* Display disabled extensions. */
13497 if (ext)
13498 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
13499 {
13500 name = cpu_noarch [j].name;
13501 len = cpu_noarch [j].len;
13502 p = output_message (stream, p, message, start, &left, name,
13503 len);
13504 }
13505
13506 *p = '\0';
13507 fprintf (stream, "%s\n", message);
13508 }
13509
13510 void
13511 md_show_usage (FILE *stream)
13512 {
13513 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13514 fprintf (stream, _("\
13515 -Qy, -Qn ignored\n\
13516 -V print assembler version number\n\
13517 -k ignored\n"));
13518 #endif
13519 fprintf (stream, _("\
13520 -n Do not optimize code alignment\n\
13521 -q quieten some warnings\n"));
13522 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13523 fprintf (stream, _("\
13524 -s ignored\n"));
13525 #endif
13526 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13527 || defined (TE_PE) || defined (TE_PEP))
13528 fprintf (stream, _("\
13529 --32/--64/--x32 generate 32bit/64bit/x32 code\n"));
13530 #endif
13531 #ifdef SVR4_COMMENT_CHARS
13532 fprintf (stream, _("\
13533 --divide do not treat `/' as a comment character\n"));
13534 #else
13535 fprintf (stream, _("\
13536 --divide ignored\n"));
13537 #endif
13538 fprintf (stream, _("\
13539 -march=CPU[,+EXTENSION...]\n\
13540 generate code for CPU and EXTENSION, CPU is one of:\n"));
13541 show_arch (stream, 0, 1);
13542 fprintf (stream, _("\
13543 EXTENSION is combination of:\n"));
13544 show_arch (stream, 1, 0);
13545 fprintf (stream, _("\
13546 -mtune=CPU optimize for CPU, CPU is one of:\n"));
13547 show_arch (stream, 0, 0);
13548 fprintf (stream, _("\
13549 -msse2avx encode SSE instructions with VEX prefix\n"));
13550 fprintf (stream, _("\
13551 -msse-check=[none|error|warning] (default: warning)\n\
13552 check SSE instructions\n"));
13553 fprintf (stream, _("\
13554 -moperand-check=[none|error|warning] (default: warning)\n\
13555 check operand combinations for validity\n"));
13556 fprintf (stream, _("\
13557 -mavxscalar=[128|256] (default: 128)\n\
13558 encode scalar AVX instructions with specific vector\n\
13559 length\n"));
13560 fprintf (stream, _("\
13561 -mvexwig=[0|1] (default: 0)\n\
13562 encode VEX instructions with specific VEX.W value\n\
13563 for VEX.W bit ignored instructions\n"));
13564 fprintf (stream, _("\
13565 -mevexlig=[128|256|512] (default: 128)\n\
13566 encode scalar EVEX instructions with specific vector\n\
13567 length\n"));
13568 fprintf (stream, _("\
13569 -mevexwig=[0|1] (default: 0)\n\
13570 encode EVEX instructions with specific EVEX.W value\n\
13571 for EVEX.W bit ignored instructions\n"));
13572 fprintf (stream, _("\
13573 -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
13574 encode EVEX instructions with specific EVEX.RC value\n\
13575 for SAE-only ignored instructions\n"));
13576 fprintf (stream, _("\
13577 -mmnemonic=[att|intel] "));
13578 if (SYSV386_COMPAT)
13579 fprintf (stream, _("(default: att)\n"));
13580 else
13581 fprintf (stream, _("(default: intel)\n"));
13582 fprintf (stream, _("\
13583 use AT&T/Intel mnemonic\n"));
13584 fprintf (stream, _("\
13585 -msyntax=[att|intel] (default: att)\n\
13586 use AT&T/Intel syntax\n"));
13587 fprintf (stream, _("\
13588 -mindex-reg support pseudo index registers\n"));
13589 fprintf (stream, _("\
13590 -mnaked-reg don't require `%%' prefix for registers\n"));
13591 fprintf (stream, _("\
13592 -madd-bnd-prefix add BND prefix for all valid branches\n"));
13593 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13594 fprintf (stream, _("\
13595 -mshared disable branch optimization for shared code\n"));
13596 fprintf (stream, _("\
13597 -mx86-used-note=[no|yes] "));
13598 if (DEFAULT_X86_USED_NOTE)
13599 fprintf (stream, _("(default: yes)\n"));
13600 else
13601 fprintf (stream, _("(default: no)\n"));
13602 fprintf (stream, _("\
13603 generate x86 used ISA and feature properties\n"));
13604 #endif
13605 #if defined (TE_PE) || defined (TE_PEP)
13606 fprintf (stream, _("\
13607 -mbig-obj generate big object files\n"));
13608 #endif
13609 fprintf (stream, _("\
13610 -momit-lock-prefix=[no|yes] (default: no)\n\
13611 strip all lock prefixes\n"));
13612 fprintf (stream, _("\
13613 -mfence-as-lock-add=[no|yes] (default: no)\n\
13614 encode lfence, mfence and sfence as\n\
13615 lock addl $0x0, (%%{re}sp)\n"));
13616 fprintf (stream, _("\
13617 -mrelax-relocations=[no|yes] "));
13618 if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
13619 fprintf (stream, _("(default: yes)\n"));
13620 else
13621 fprintf (stream, _("(default: no)\n"));
13622 fprintf (stream, _("\
13623 generate relax relocations\n"));
13624 fprintf (stream, _("\
13625 -malign-branch-boundary=NUM (default: 0)\n\
13626 align branches within NUM byte boundary\n"));
13627 fprintf (stream, _("\
13628 -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
13629 TYPE is combination of jcc, fused, jmp, call, ret,\n\
13630 indirect\n\
13631 specify types of branches to align\n"));
13632 fprintf (stream, _("\
13633 -malign-branch-prefix-size=NUM (default: 5)\n\
13634 align branches with NUM prefixes per instruction\n"));
13635 fprintf (stream, _("\
13636 -mbranches-within-32B-boundaries\n\
13637 align branches within 32 byte boundary\n"));
13638 fprintf (stream, _("\
13639 -mlfence-after-load=[no|yes] (default: no)\n\
13640 generate lfence after load\n"));
13641 fprintf (stream, _("\
13642 -mlfence-before-indirect-branch=[none|all|register|memory] (default: none)\n\
13643 generate lfence before indirect near branch\n"));
13644 fprintf (stream, _("\
13645 -mlfence-before-ret=[none|or|not|shl|yes] (default: none)\n\
13646 generate lfence before ret\n"));
13647 fprintf (stream, _("\
13648 -mamd64 accept only AMD64 ISA [default]\n"));
13649 fprintf (stream, _("\
13650 -mintel64 accept only Intel64 ISA\n"));
13651 }
13652
13653 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
13654 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13655 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
13656
13657 /* Pick the target format to use. */
13658
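/* default_arch is established by the --32/--64/--x32 options (or
   DEFAULT_ARCH); any suffix after "x86_64", e.g. one of the ":32"
   kind presumably set by --x32, selects the x32 ABI instead of the
   full 64-bit ABI.  */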
13659 const char *
13660 i386_target_format (void)
13661 {
13662 if (!strncmp (default_arch, "x86_64", 6))
13663 {
13664 update_code_flag (CODE_64BIT, 1);
13665 if (default_arch[6] == '\0')
13666 x86_elf_abi = X86_64_ABI;
13667 else
13668 x86_elf_abi = X86_64_X32_ABI;
13669 }
13670 else if (!strcmp (default_arch, "i386"))
13671 update_code_flag (CODE_32BIT, 1);
13672 else if (!strcmp (default_arch, "iamcu"))
13673 {
13674 update_code_flag (CODE_32BIT, 1);
13675 if (cpu_arch_isa == PROCESSOR_UNKNOWN)
13676 {
13677 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
13678 cpu_arch_name = "iamcu";
13679 cpu_sub_arch_name = NULL;
13680 cpu_arch_flags = iamcu_flags;
13681 cpu_arch_isa = PROCESSOR_IAMCU;
13682 cpu_arch_isa_flags = iamcu_flags;
13683 if (!cpu_arch_tune_set)
13684 {
13685 cpu_arch_tune = cpu_arch_isa;
13686 cpu_arch_tune_flags = cpu_arch_isa_flags;
13687 }
13688 }
13689 else if (cpu_arch_isa != PROCESSOR_IAMCU)
13690 as_fatal (_("Intel MCU doesn't support `%s' architecture"),
13691 cpu_arch_name);
13692 }
13693 else
13694 as_fatal (_("unknown architecture"));
13695
13696 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
13697 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13698 if (cpu_flags_all_zero (&cpu_arch_tune_flags))
13699 cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13700
13701 switch (OUTPUT_FLAVOR)
13702 {
13703 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
13704 case bfd_target_aout_flavour:
13705 return AOUT_TARGET_FORMAT;
13706 #endif
13707 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
13708 # if defined (TE_PE) || defined (TE_PEP)
13709 case bfd_target_coff_flavour:
13710 if (flag_code == CODE_64BIT)
13711 return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
13712 else
13713 return use_big_obj ? "pe-bigobj-i386" : "pe-i386";
13714 # elif defined (TE_GO32)
13715 case bfd_target_coff_flavour:
13716 return "coff-go32";
13717 # else
13718 case bfd_target_coff_flavour:
13719 return "coff-i386";
13720 # endif
13721 #endif
13722 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
13723 case bfd_target_elf_flavour:
13724 {
13725 const char *format;
13726
13727 switch (x86_elf_abi)
13728 {
13729 default:
13730 format = ELF_TARGET_FORMAT;
13731 #ifndef TE_SOLARIS
13732 tls_get_addr = "___tls_get_addr";
13733 #endif
13734 break;
13735 case X86_64_ABI:
13736 use_rela_relocations = 1;
13737 object_64bit = 1;
13738 #ifndef TE_SOLARIS
13739 tls_get_addr = "__tls_get_addr";
13740 #endif
13741 format = ELF_TARGET_FORMAT64;
13742 break;
13743 case X86_64_X32_ABI:
13744 use_rela_relocations = 1;
13745 object_64bit = 1;
13746 #ifndef TE_SOLARIS
13747 tls_get_addr = "__tls_get_addr";
13748 #endif
13749 disallow_64bit_reloc = 1;
13750 format = ELF_TARGET_FORMAT32;
13751 break;
13752 }
13753 if (cpu_arch_isa == PROCESSOR_L1OM)
13754 {
13755 if (x86_elf_abi != X86_64_ABI)
13756 as_fatal (_("Intel L1OM is 64bit only"));
13757 return ELF_TARGET_L1OM_FORMAT;
13758 }
13759 else if (cpu_arch_isa == PROCESSOR_K1OM)
13760 {
13761 if (x86_elf_abi != X86_64_ABI)
13762 as_fatal (_("Intel K1OM is 64bit only"));
13763 return ELF_TARGET_K1OM_FORMAT;
13764 }
13765 else if (cpu_arch_isa == PROCESSOR_IAMCU)
13766 {
13767 if (x86_elf_abi != I386_ABI)
13768 as_fatal (_("Intel MCU is 32bit only"));
13769 return ELF_TARGET_IAMCU_FORMAT;
13770 }
13771 else
13772 return format;
13773 }
13774 #endif
13775 #if defined (OBJ_MACH_O)
13776 case bfd_target_mach_o_flavour:
13777 if (flag_code == CODE_64BIT)
13778 {
13779 use_rela_relocations = 1;
13780 object_64bit = 1;
13781 return "mach-o-x86-64";
13782 }
13783 else
13784 return "mach-o-i386";
13785 #endif
13786 default:
13787 abort ();
13788 return NULL;
13789 }
13790 }
13791
13792 #endif /* OBJ_MAYBE_ more than one */
13793 \f
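/* _GLOBAL_OFFSET_TABLE_ is created lazily, the first time source
   code references it; the three leading character tests are merely a
   cheap filter so most symbol names never reach the full strcmp.  */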
13794 symbolS *
13795 md_undefined_symbol (char *name)
13796 {
13797 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
13798 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
13799 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
13800 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
13801 {
13802 if (!GOT_symbol)
13803 {
13804 if (symbol_find (name))
13805 as_bad (_("GOT already in symbol table"));
13806 GOT_symbol = symbol_new (name, undefined_section,
13807 &zero_address_frag, 0);
13808 }
13809 return GOT_symbol;
13810 }
13811 return 0;
13812 }
13813
13814 /* Round up a section size to the appropriate boundary. */
13815
13816 valueT
13817 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
13818 {
13819 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
13820 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
13821 {
13822 /* For a.out, force the section size to be aligned. If we don't do
13823 this, BFD will align it for us, but it will not write out the
13824 final bytes of the section. This may be a bug in BFD, but it is
13825 easier to fix it here since that is how the other a.out targets
13826 work. */
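/* A worked example: with align == 2, i.e. a 4 byte boundary, a size
   of 10 becomes (10 + 3) & -4 == 12; the negated power of two serves
   as the usual ~(boundary - 1) mask in two's complement.  */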
13827 int align;
13828
13829 align = bfd_section_alignment (segment);
13830 size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
13831 }
13832 #endif
13833
13834 return size;
13835 }
13836
13837 /* On the i386, PC-relative offsets are relative to the start of the
13838 next instruction. That is, the address of the offset, plus its
13839 size, since the offset is always the last part of the insn. */
13840
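/* E.g. a 4-byte displacement placed 1 byte into a frag at address
   0x100 gives 4 + 1 + 0x100 == 0x105, the address of the first byte
   after the instruction.  */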
13841 long
13842 md_pcrel_from (fixS *fixP)
13843 {
13844 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
13845 }
13846
13847 #ifndef I386COFF
13848
13849 static void
13850 s_bss (int ignore ATTRIBUTE_UNUSED)
13851 {
13852 int temp;
13853
13854 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13855 if (IS_ELF)
13856 obj_elf_section_change_hook ();
13857 #endif
13858 temp = get_absolute_expression ();
13859 subseg_set (bss_section, (subsegT) temp);
13860 demand_empty_rest_of_line ();
13861 }
13862
13863 #endif
13864
13865 /* Remember that a constant directive was the last thing emitted into a code section.  */
13866
13867 void
13868 i386_cons_align (int ignore ATTRIBUTE_UNUSED)
13869 {
13870 if (last_insn.kind != last_insn_directive
13871 && (bfd_section_flags (now_seg) & SEC_CODE))
13872 {
13873 last_insn.seg = now_seg;
13874 last_insn.kind = last_insn_directive;
13875 last_insn.name = "constant directive";
13876 last_insn.file = as_where (&last_insn.line);
13877 if (lfence_before_ret != lfence_before_ret_none)
13878 {
13879 if (lfence_before_indirect_branch != lfence_branch_none)
13880 as_warn (_("constant directive skips -mlfence-before-ret "
13881 "and -mlfence-before-indirect-branch"));
13882 else
13883 as_warn (_("constant directive skips -mlfence-before-ret"));
13884 }
13885 else if (lfence_before_indirect_branch != lfence_branch_none)
13886 as_warn (_("constant directive skips -mlfence-before-indirect-branch"));
13887 }
13888 }
13889
13890 void
13891 i386_validate_fix (fixS *fixp)
13892 {
13893 if (fixp->fx_subsy)
13894 {
13895 if (fixp->fx_subsy == GOT_symbol)
13896 {
13897 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
13898 {
13899 if (!object_64bit)
13900 abort ();
13901 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13902 if (fixp->fx_tcbit2)
13903 fixp->fx_r_type = (fixp->fx_tcbit
13904 ? BFD_RELOC_X86_64_REX_GOTPCRELX
13905 : BFD_RELOC_X86_64_GOTPCRELX);
13906 else
13907 #endif
13908 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
13909 }
13910 else
13911 {
13912 if (!object_64bit)
13913 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
13914 else
13915 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
13916 }
13917 fixp->fx_subsy = 0;
13918 }
13919 }
13920 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13921 else
13922 {
13923 /* NB: Commit 292676c1 resolved PLT32 relocs against local symbols
13924 to sections.  Since a PLT32 relocation must be against a symbol,
13925 turn such a PLT32 relocation into a PC32 relocation.  */
13926 if (fixp->fx_addsy
13927 && (fixp->fx_r_type == BFD_RELOC_386_PLT32
13928 || fixp->fx_r_type == BFD_RELOC_X86_64_PLT32)
13929 && symbol_section_p (fixp->fx_addsy))
13930 fixp->fx_r_type = BFD_RELOC_32_PCREL;
13931 if (!object_64bit)
13932 {
13933 if (fixp->fx_r_type == BFD_RELOC_386_GOT32
13934 && fixp->fx_tcbit2)
13935 fixp->fx_r_type = BFD_RELOC_386_GOT32X;
13936 }
13937 }
13938 #endif
13939 }
13940
13941 arelent *
13942 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
13943 {
13944 arelent *rel;
13945 bfd_reloc_code_real_type code;
13946
13947 switch (fixp->fx_r_type)
13948 {
13949 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13950 case BFD_RELOC_SIZE32:
13951 case BFD_RELOC_SIZE64:
13952 if (S_IS_DEFINED (fixp->fx_addsy)
13953 && !S_IS_EXTERNAL (fixp->fx_addsy))
13954 {
13955 /* Resolve size relocation against local symbol to size of
13956 the symbol plus addend. */
13957 valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
13958 if (fixp->fx_r_type == BFD_RELOC_SIZE32
13959 && !fits_in_unsigned_long (value))
13960 as_bad_where (fixp->fx_file, fixp->fx_line,
13961 _("symbol size computation overflow"));
13962 fixp->fx_addsy = NULL;
13963 fixp->fx_subsy = NULL;
13964 md_apply_fix (fixp, (valueT *) &value, NULL);
13965 return NULL;
13966 }
13967 #endif
13968 /* Fall through. */
13969
13970 case BFD_RELOC_X86_64_PLT32:
13971 case BFD_RELOC_X86_64_GOT32:
13972 case BFD_RELOC_X86_64_GOTPCREL:
13973 case BFD_RELOC_X86_64_GOTPCRELX:
13974 case BFD_RELOC_X86_64_REX_GOTPCRELX:
13975 case BFD_RELOC_386_PLT32:
13976 case BFD_RELOC_386_GOT32:
13977 case BFD_RELOC_386_GOT32X:
13978 case BFD_RELOC_386_GOTOFF:
13979 case BFD_RELOC_386_GOTPC:
13980 case BFD_RELOC_386_TLS_GD:
13981 case BFD_RELOC_386_TLS_LDM:
13982 case BFD_RELOC_386_TLS_LDO_32:
13983 case BFD_RELOC_386_TLS_IE_32:
13984 case BFD_RELOC_386_TLS_IE:
13985 case BFD_RELOC_386_TLS_GOTIE:
13986 case BFD_RELOC_386_TLS_LE_32:
13987 case BFD_RELOC_386_TLS_LE:
13988 case BFD_RELOC_386_TLS_GOTDESC:
13989 case BFD_RELOC_386_TLS_DESC_CALL:
13990 case BFD_RELOC_X86_64_TLSGD:
13991 case BFD_RELOC_X86_64_TLSLD:
13992 case BFD_RELOC_X86_64_DTPOFF32:
13993 case BFD_RELOC_X86_64_DTPOFF64:
13994 case BFD_RELOC_X86_64_GOTTPOFF:
13995 case BFD_RELOC_X86_64_TPOFF32:
13996 case BFD_RELOC_X86_64_TPOFF64:
13997 case BFD_RELOC_X86_64_GOTOFF64:
13998 case BFD_RELOC_X86_64_GOTPC32:
13999 case BFD_RELOC_X86_64_GOT64:
14000 case BFD_RELOC_X86_64_GOTPCREL64:
14001 case BFD_RELOC_X86_64_GOTPC64:
14002 case BFD_RELOC_X86_64_GOTPLT64:
14003 case BFD_RELOC_X86_64_PLTOFF64:
14004 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
14005 case BFD_RELOC_X86_64_TLSDESC_CALL:
14006 case BFD_RELOC_RVA:
14007 case BFD_RELOC_VTABLE_ENTRY:
14008 case BFD_RELOC_VTABLE_INHERIT:
14009 #ifdef TE_PE
14010 case BFD_RELOC_32_SECREL:
14011 #endif
14012 code = fixp->fx_r_type;
14013 break;
14014 case BFD_RELOC_X86_64_32S:
14015 if (!fixp->fx_pcrel)
14016 {
14017 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
14018 code = fixp->fx_r_type;
14019 break;
14020 }
14021 /* Fall through. */
14022 default:
14023 if (fixp->fx_pcrel)
14024 {
14025 switch (fixp->fx_size)
14026 {
14027 default:
14028 as_bad_where (fixp->fx_file, fixp->fx_line,
14029 _("can not do %d byte pc-relative relocation"),
14030 fixp->fx_size);
14031 code = BFD_RELOC_32_PCREL;
14032 break;
14033 case 1: code = BFD_RELOC_8_PCREL; break;
14034 case 2: code = BFD_RELOC_16_PCREL; break;
14035 case 4: code = BFD_RELOC_32_PCREL; break;
14036 #ifdef BFD64
14037 case 8: code = BFD_RELOC_64_PCREL; break;
14038 #endif
14039 }
14040 }
14041 else
14042 {
14043 switch (fixp->fx_size)
14044 {
14045 default:
14046 as_bad_where (fixp->fx_file, fixp->fx_line,
14047 _("can not do %d byte relocation"),
14048 fixp->fx_size);
14049 code = BFD_RELOC_32;
14050 break;
14051 case 1: code = BFD_RELOC_8; break;
14052 case 2: code = BFD_RELOC_16; break;
14053 case 4: code = BFD_RELOC_32; break;
14054 #ifdef BFD64
14055 case 8: code = BFD_RELOC_64; break;
14056 #endif
14057 }
14058 }
14059 break;
14060 }
14061
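/* A plain 32-bit reference to _GLOBAL_OFFSET_TABLE_ itself, as in
   the classic PIC prologue `addl $_GLOBAL_OFFSET_TABLE_, %ebx',
   really denotes the PC-relative distance to the GOT, so it is
   rewritten as a GOTPC-style relocation here.  */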
14062 if ((code == BFD_RELOC_32
14063 || code == BFD_RELOC_32_PCREL
14064 || code == BFD_RELOC_X86_64_32S)
14065 && GOT_symbol
14066 && fixp->fx_addsy == GOT_symbol)
14067 {
14068 if (!object_64bit)
14069 code = BFD_RELOC_386_GOTPC;
14070 else
14071 code = BFD_RELOC_X86_64_GOTPC32;
14072 }
14073 if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
14074 && GOT_symbol
14075 && fixp->fx_addsy == GOT_symbol)
14076 {
14077 code = BFD_RELOC_X86_64_GOTPC64;
14078 }
14079
14080 rel = XNEW (arelent);
14081 rel->sym_ptr_ptr = XNEW (asymbol *);
14082 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
14083
14084 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
14085
14086 if (!use_rela_relocations)
14087 {
14088 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
14089 vtable entry to be used in the relocation's section offset. */
14090 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
14091 rel->address = fixp->fx_offset;
14092 #if defined (OBJ_COFF) && defined (TE_PE)
14093 else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
14094 rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
14095 else
14096 #endif
14097 rel->addend = 0;
14098 }
14099 /* Use rela relocations in 64-bit mode.  */
14100 else
14101 {
14102 if (disallow_64bit_reloc)
14103 switch (code)
14104 {
14105 case BFD_RELOC_X86_64_DTPOFF64:
14106 case BFD_RELOC_X86_64_TPOFF64:
14107 case BFD_RELOC_64_PCREL:
14108 case BFD_RELOC_X86_64_GOTOFF64:
14109 case BFD_RELOC_X86_64_GOT64:
14110 case BFD_RELOC_X86_64_GOTPCREL64:
14111 case BFD_RELOC_X86_64_GOTPC64:
14112 case BFD_RELOC_X86_64_GOTPLT64:
14113 case BFD_RELOC_X86_64_PLTOFF64:
14114 as_bad_where (fixp->fx_file, fixp->fx_line,
14115 _("cannot represent relocation type %s in x32 mode"),
14116 bfd_get_reloc_code_name (code));
14117 break;
14118 default:
14119 break;
14120 }
14121
14122 if (!fixp->fx_pcrel)
14123 rel->addend = fixp->fx_offset;
14124 else
14125 switch (code)
14126 {
14127 case BFD_RELOC_X86_64_PLT32:
14128 case BFD_RELOC_X86_64_GOT32:
14129 case BFD_RELOC_X86_64_GOTPCREL:
14130 case BFD_RELOC_X86_64_GOTPCRELX:
14131 case BFD_RELOC_X86_64_REX_GOTPCRELX:
14132 case BFD_RELOC_X86_64_TLSGD:
14133 case BFD_RELOC_X86_64_TLSLD:
14134 case BFD_RELOC_X86_64_GOTTPOFF:
14135 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
14136 case BFD_RELOC_X86_64_TLSDESC_CALL:
14137 rel->addend = fixp->fx_offset - fixp->fx_size;
14138 break;
14139 default:
14140 rel->addend = (section->vma
14141 - fixp->fx_size
14142 + fixp->fx_addnumber
14143 + md_pcrel_from (fixp));
14144 break;
14145 }
14146 }
14147
14148 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
14149 if (rel->howto == NULL)
14150 {
14151 as_bad_where (fixp->fx_file, fixp->fx_line,
14152 _("cannot represent relocation type %s"),
14153 bfd_get_reloc_code_name (code));
14154 /* Set howto to a garbage value so that we can keep going. */
14155 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
14156 gas_assert (rel->howto != NULL);
14157 }
14158
14159 return rel;
14160 }
14161
14162 #include "tc-i386-intel.c"
14163
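/* Parse a register name, with or without the `%' prefix, into its
   DWARF register number; flag_code >> 1 selects the 32-bit or 64-bit
   column of dw2_regnum.  Per the psABI numbering this maps, for
   example, "esp" to 4 in 32-bit mode and "rsp" to 7 in 64-bit
   mode.  */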
14164 void
14165 tc_x86_parse_to_dw2regnum (expressionS *exp)
14166 {
14167 int saved_naked_reg;
14168 char saved_register_dot;
14169
14170 saved_naked_reg = allow_naked_reg;
14171 allow_naked_reg = 1;
14172 saved_register_dot = register_chars['.'];
14173 register_chars['.'] = '.';
14174 allow_pseudo_reg = 1;
14175 expression_and_evaluate (exp);
14176 allow_pseudo_reg = 0;
14177 register_chars['.'] = saved_register_dot;
14178 allow_naked_reg = saved_naked_reg;
14179
14180 if (exp->X_op == O_register && exp->X_add_number >= 0)
14181 {
14182 if ((addressT) exp->X_add_number < i386_regtab_size)
14183 {
14184 exp->X_op = O_constant;
14185 exp->X_add_number = i386_regtab[exp->X_add_number]
14186 .dw2_regnum[flag_code >> 1];
14187 }
14188 else
14189 exp->X_op = O_illegal;
14190 }
14191 }
14192
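/* Emit the CFI state in effect at function entry.  Since
   x86_cie_data_alignment is negative (presumably -4 or -8), this
   records the CFA as 4 or 8 bytes above the stack pointer with the
   return address stored just below the CFA: exactly the state right
   after a `call'.  The DWARF number of %esp/%rsp is computed once
   through tc_x86_parse_to_dw2regnum and cached in sp_regno.  */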
14193 void
14194 tc_x86_frame_initial_instructions (void)
14195 {
14196 static unsigned int sp_regno[2];
14197
14198 if (!sp_regno[flag_code >> 1])
14199 {
14200 char *saved_input = input_line_pointer;
14201 char sp[][4] = {"esp", "rsp"};
14202 expressionS exp;
14203
14204 input_line_pointer = sp[flag_code >> 1];
14205 tc_x86_parse_to_dw2regnum (&exp);
14206 gas_assert (exp.X_op == O_constant);
14207 sp_regno[flag_code >> 1] = exp.X_add_number;
14208 input_line_pointer = saved_input;
14209 }
14210
14211 cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
14212 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
14213 }
14214
14215 int
14216 x86_dwarf2_addr_size (void)
14217 {
14218 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
14219 if (x86_elf_abi == X86_64_X32_ABI)
14220 return 4;
14221 #endif
14222 return bfd_arch_bits_per_address (stdoutput) / 8;
14223 }
14224
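/* Recognize the target-specific section type, so that, for example,
   a directive along the lines of `.section .myframe,"a",@unwind'
   (".myframe" being an illustrative name) yields an
   SHT_X86_64_UNWIND section in 64-bit mode.  */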
14225 int
14226 i386_elf_section_type (const char *str, size_t len)
14227 {
14228 if (flag_code == CODE_64BIT
14229 && len == sizeof ("unwind") - 1
14230 && strncmp (str, "unwind", 6) == 0)
14231 return SHT_X86_64_UNWIND;
14232
14233 return -1;
14234 }
14235
14236 #ifdef TE_SOLARIS
14237 void
14238 i386_solaris_fix_up_eh_frame (segT sec)
14239 {
14240 if (flag_code == CODE_64BIT)
14241 elf_section_type (sec) = SHT_X86_64_UNWIND;
14242 }
14243 #endif
14244
14245 #ifdef TE_PE
14246 void
14247 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
14248 {
14249 expressionS exp;
14250
14251 exp.X_op = O_secrel;
14252 exp.X_add_symbol = symbol;
14253 exp.X_add_number = 0;
14254 emit_expr (&exp, size);
14255 }
14256 #endif
14257
14258 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14259 /* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
14260
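/* The extra `l' flag letter, e.g. in `.section .lrodata,"al"', marks
   a section SHF_X86_64_LARGE in 64-bit mode; in 32-bit mode the
   letter is rejected with the message below.  */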
14261 bfd_vma
14262 x86_64_section_letter (int letter, const char **ptr_msg)
14263 {
14264 if (flag_code == CODE_64BIT)
14265 {
14266 if (letter == 'l')
14267 return SHF_X86_64_LARGE;
14268
14269 *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
14270 }
14271 else
14272 *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
14273 return -1;
14274 }
14275
14276 bfd_vma
14277 x86_64_section_word (char *str, size_t len)
14278 {
14279 if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
14280 return SHF_X86_64_LARGE;
14281
14282 return -1;
14283 }
14284
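/* Implement .largecomm: like .comm, except that in 64-bit mode the
   symbol is placed in the large common section (locals in .lbss) by
   temporarily swapping elf_com_section_ptr and bss_section around
   the s_comm_internal call.  In 32-bit mode it degrades to a plain
   .comm with a warning.  */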
14285 static void
14286 handle_large_common (int small ATTRIBUTE_UNUSED)
14287 {
14288 if (flag_code != CODE_64BIT)
14289 {
14290 s_comm_internal (0, elf_common_parse);
14291 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
14292 }
14293 else
14294 {
14295 static segT lbss_section;
14296 asection *saved_com_section_ptr = elf_com_section_ptr;
14297 asection *saved_bss_section = bss_section;
14298
14299 if (lbss_section == NULL)
14300 {
14301 flagword applicable;
14302 segT seg = now_seg;
14303 subsegT subseg = now_subseg;
14304
14305 /* The .lbss section is for local .largecomm symbols. */
14306 lbss_section = subseg_new (".lbss", 0);
14307 applicable = bfd_applicable_section_flags (stdoutput);
14308 bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
14309 seg_info (lbss_section)->bss = 1;
14310
14311 subseg_set (seg, subseg);
14312 }
14313
14314 elf_com_section_ptr = &_bfd_elf_large_com_section;
14315 bss_section = lbss_section;
14316
14317 s_comm_internal (0, elf_common_parse);
14318
14319 elf_com_section_ptr = saved_com_section_ptr;
14320 bss_section = saved_bss_section;
14321 }
14322 }
14323 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */