/* tc-i386.c -- Assemble code for the Intel 80386
   Copyright (C) 1989-2021 Free Software Foundation, Inc.

   This file is part of GAS, the GNU Assembler.

   GAS is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 3, or (at your option)
   any later version.

   GAS is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with GAS; see the file COPYING.  If not, write to the Free
   Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
   02110-1301, USA.  */

/* Intel 80386 machine specific gas.
   Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
   x86_64 support by Jan Hubicka (jh@suse.cz)
   VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
   Bugs & suggestions are completely welcome.  This is free software.
   Please help us make it better.  */

#include "as.h"
#include "safe-ctype.h"
#include "subsegs.h"
#include "dwarf2dbg.h"
#include "dw2gencfi.h"
#include "elf/x86-64.h"
#include "opcodes/i386-init.h"

#ifdef HAVE_LIMITS_H
#include <limits.h>
#else
#ifdef HAVE_SYS_PARAM_H
#include <sys/param.h>
#endif
#ifndef INT_MAX
#define INT_MAX (int) (((unsigned) (-1)) >> 1)
#endif
#endif

#ifndef INFER_ADDR_PREFIX
#define INFER_ADDR_PREFIX 1
#endif

#ifndef DEFAULT_ARCH
#define DEFAULT_ARCH "i386"
#endif

#ifndef INLINE
#if __GNUC__ >= 2
#define INLINE __inline__
#else
#define INLINE
#endif
#endif

/* Prefixes will be emitted in the order defined below.
   WAIT_PREFIX must be the first prefix since FWAIT is really an
   instruction, and so must come before any prefixes.
   The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
   REP_PREFIX/HLE_PREFIX, LOCK_PREFIX.  */
#define WAIT_PREFIX	0
#define SEG_PREFIX	1
#define ADDR_PREFIX	2
#define DATA_PREFIX	3
#define REP_PREFIX	4
#define HLE_PREFIX	REP_PREFIX
#define BND_PREFIX	REP_PREFIX
#define LOCK_PREFIX	5
#define REX_PREFIX	6	/* must come last.  */
#define MAX_PREFIXES	7	/* max prefixes per opcode */
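
/* Illustrative sketch (not from the original source): for
   "lock addw %ax, %fs:(%eax)" assembled as 64-bit code, the prefix
   slots would hold roughly prefix[SEG_PREFIX] = 0x64 (%fs),
   prefix[ADDR_PREFIX] = 0x67, prefix[DATA_PREFIX] = 0x66 and
   prefix[LOCK_PREFIX] = 0xf0, and the bytes are then emitted in the
   slot order defined above.  */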

/* we define the syntax here (modulo base,index,scale syntax) */
#define REGISTER_PREFIX '%'
#define IMMEDIATE_PREFIX '$'
#define ABSOLUTE_PREFIX '*'

/* these are the instruction mnemonic suffixes in AT&T syntax or
   memory operand size in Intel syntax.  */
#define WORD_MNEM_SUFFIX  'w'
#define BYTE_MNEM_SUFFIX  'b'
#define SHORT_MNEM_SUFFIX 's'
#define LONG_MNEM_SUFFIX  'l'
#define QWORD_MNEM_SUFFIX 'q'
/* Intel Syntax.  Use a non-ascii letter since it never appears
   in instructions.  */
#define LONG_DOUBLE_MNEM_SUFFIX '\1'

#define END_OF_INSN '\0'

/* This matches the C -> StaticRounding alias in the opcode table.  */
#define commutative staticrounding

/*
  'templates' is for grouping together 'template' structures for opcodes
  of the same name.  This is only used for storing the insns in the grand
  ole hash table of insns.
  The templates themselves start at START and range up to (but not including)
  END.
  */
typedef struct
{
  const insn_template *start;
  const insn_template *end;
}
templates;

/* 386 operand encoding bytes:  see 386 book for details of this.  */
typedef struct
{
  unsigned int regmem;	/* codes register or memory operand */
  unsigned int reg;	/* codes register operand (or extended opcode) */
  unsigned int mode;	/* how to interpret regmem & reg */
}
modrm_byte;

/* x86-64 extension prefix.  */
typedef int rex_byte;

/* 386 opcode byte to code indirect addressing.  */
typedef struct
{
  unsigned base;
  unsigned index;
  unsigned scale;
}
sib_byte;

/* x86 arch names, types and features */
typedef struct
{
  const char *name;		/* arch name */
  unsigned int len;		/* arch string length */
  enum processor_type type;	/* arch type */
  i386_cpu_flags flags;		/* cpu feature flags */
  unsigned int skip;		/* show_arch should skip this. */
}
arch_entry;

/* Used to turn off indicated flags.  */
typedef struct
{
  const char *name;		/* arch name */
  unsigned int len;		/* arch string length */
  i386_cpu_flags flags;		/* cpu feature flags */
}
noarch_entry;

static void update_code_flag (int, int);
static void set_code_flag (int);
static void set_16bit_gcc_code_flag (int);
static void set_intel_syntax (int);
static void set_intel_mnemonic (int);
static void set_allow_index_reg (int);
static void set_check (int);
static void set_cpu_arch (int);
#ifdef TE_PE
static void pe_directive_secrel (int);
#endif
static void signed_cons (int);
static char *output_invalid (int c);
static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
				    const char *);
static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
				       const char *);
static int i386_att_operand (char *);
static int i386_intel_operand (char *, int);
static int i386_intel_simplify (expressionS *);
static int i386_intel_parse_name (const char *, expressionS *);
static const reg_entry *parse_register (char *, char **);
static char *parse_insn (char *, char *);
static char *parse_operands (char *, const char *);
static void swap_operands (void);
static void swap_2_operands (int, int);
static enum flag_code i386_addressing_mode (void);
static void optimize_imm (void);
static void optimize_disp (void);
static const insn_template *match_template (char);
static int check_string (void);
static int process_suffix (void);
static int check_byte_reg (void);
static int check_long_reg (void);
static int check_qword_reg (void);
static int check_word_reg (void);
static int finalize_imm (void);
static int process_operands (void);
static const seg_entry *build_modrm_byte (void);
static void output_insn (void);
static void output_imm (fragS *, offsetT);
static void output_disp (fragS *, offsetT);
#ifndef I386COFF
static void s_bss (int);
#endif
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
static void handle_large_common (int small ATTRIBUTE_UNUSED);

/* GNU_PROPERTY_X86_ISA_1_USED.  */
static unsigned int x86_isa_1_used;
/* GNU_PROPERTY_X86_FEATURE_2_USED.  */
static unsigned int x86_feature_2_used;
/* Generate x86 used ISA and feature properties.  */
static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
#endif

static const char *default_arch = DEFAULT_ARCH;

/* parse_register() returns this when a register alias cannot be used.  */
static const reg_entry bad_reg = { "<bad>", OPERAND_TYPE_NONE, 0, 0,
				   { Dw2Inval, Dw2Inval } };

/* This struct describes rounding control and SAE in the instruction.  */
struct RC_Operation
{
  enum rc_type
    {
      rne = 0,
      rd,
      ru,
      rz,
      saeonly
    } type;
  int operand;
};

static struct RC_Operation rc_op;

/* The struct describes masking, applied to OPERAND in the instruction.
   MASK is a pointer to the corresponding mask register.  ZEROING tells
   whether merging or zeroing mask is used.  */
struct Mask_Operation
{
  const reg_entry *mask;
  unsigned int zeroing;
  /* The operand where this operation is associated.  */
  int operand;
};

static struct Mask_Operation mask_op;

/* The struct describes broadcasting, applied to OPERAND.  TYPE encodes
   the broadcast factor.  */
struct Broadcast_Operation
{
  /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}.  */
  int type;

  /* Index of broadcasted operand.  */
  int operand;

  /* Number of bytes to broadcast.  */
  int bytes;
};
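
/* For instance (sketch, not from the original source): for the AT&T
   operand "(%rax){1to16}" of a vaddps to a ZMM register, the parser
   would record the {1to16} factor in TYPE, the memory operand's index
   in OPERAND, and the 4-byte element size in BYTES.  */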

static struct Broadcast_Operation broadcast_op;

/* VEX prefix.  */
typedef struct
{
  /* VEX prefix is either 2 byte or 3 byte.  EVEX is 4 byte.  */
  unsigned char bytes[4];
  unsigned int length;
  /* Destination or source register specifier.  */
  const reg_entry *register_specifier;
} vex_prefix;

/* 'md_assemble ()' gathers together information and puts it into an
   i386_insn.  */

union i386_op
{
  expressionS *disps;
  expressionS *imms;
  const reg_entry *regs;
};

enum i386_error
{
  operand_size_mismatch,
  operand_type_mismatch,
  register_type_mismatch,
  number_of_operands_mismatch,
  invalid_instruction_suffix,
  bad_imm4,
  unsupported_with_intel_mnemonic,
  unsupported_syntax,
  unsupported,
  invalid_sib_address,
  invalid_vsib_address,
  invalid_vector_register_set,
  invalid_tmm_register_set,
  unsupported_vector_index_register,
  unsupported_broadcast,
  broadcast_needed,
  unsupported_masking,
  mask_not_on_destination,
  no_default_mask,
  unsupported_rc_sae,
  rc_sae_operand_not_last_imm,
  invalid_register_operand,
};

struct _i386_insn
{
  /* TM holds the template for the insn we're currently assembling.  */
  insn_template tm;

  /* SUFFIX holds the instruction size suffix for byte, word, dword
     or qword, if given.  */
  char suffix;

  /* OPERANDS gives the number of given operands.  */
  unsigned int operands;

  /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
     of given register, displacement, memory operands and immediate
     operands.  */
  unsigned int reg_operands, disp_operands, mem_operands, imm_operands;

  /* TYPES [i] is the type (see above #defines) which tells us how to
     use OP[i] for the corresponding operand.  */
  i386_operand_type types[MAX_OPERANDS];

  /* Displacement expression, immediate expression, or register for each
     operand.  */
  union i386_op op[MAX_OPERANDS];

  /* Flags for operands.  */
  unsigned int flags[MAX_OPERANDS];
#define Operand_PCrel 1
#define Operand_Mem   2

  /* Relocation type for operand */
  enum bfd_reloc_code_real reloc[MAX_OPERANDS];

  /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
     the base index byte below.  */
  const reg_entry *base_reg;
  const reg_entry *index_reg;
  unsigned int log2_scale_factor;

  /* SEG gives the seg_entries of this insn.  They are zero unless
     explicit segment overrides are given.  */
  const seg_entry *seg[2];

  /* Copied first memory operand string, for re-checking.  */
  char *memop1_string;

  /* PREFIX holds all the given prefix opcodes (usually null).
     PREFIXES is the number of prefix opcodes.  */
  unsigned int prefixes;
  unsigned char prefix[MAX_PREFIXES];

  /* Register is in low 3 bits of opcode.  */
  bfd_boolean short_form;

  /* The operand to a branch insn indicates an absolute branch.  */
  bfd_boolean jumpabsolute;

  /* Extended states.  */
  enum
    {
      /* Use MMX state.  */
      xstate_mmx = 1 << 0,
      /* Use XMM state.  */
      xstate_xmm = 1 << 1,
      /* Use YMM state.  */
      xstate_ymm = 1 << 2 | xstate_xmm,
      /* Use ZMM state.  */
      xstate_zmm = 1 << 3 | xstate_ymm,
      /* Use TMM state.  */
      xstate_tmm = 1 << 4,
      /* Use MASK state.  */
      xstate_mask = 1 << 5
    } xstate;

  /* Has GOTPC or TLS relocation.  */
  bfd_boolean has_gotpc_tls_reloc;

  /* RM and SIB are the modrm byte and the sib byte where the
     addressing modes of this insn are encoded.  */
  modrm_byte rm;
  rex_byte rex;
  rex_byte vrex;
  sib_byte sib;
  vex_prefix vex;

  /* Masking attributes.  */
  struct Mask_Operation *mask;

  /* Rounding control and SAE attributes.  */
  struct RC_Operation *rounding;

  /* Broadcasting attributes.  */
  struct Broadcast_Operation *broadcast;

  /* Compressed disp8*N attribute.  */
  unsigned int memshift;

  /* Prefer load or store in encoding.  */
  enum
    {
      dir_encoding_default = 0,
      dir_encoding_load,
      dir_encoding_store,
      dir_encoding_swap
    } dir_encoding;

  /* Prefer 8bit, 16bit, 32bit displacement in encoding.  */
  enum
    {
      disp_encoding_default = 0,
      disp_encoding_8bit,
      disp_encoding_16bit,
      disp_encoding_32bit
    } disp_encoding;

  /* Prefer the REX byte in encoding.  */
  bfd_boolean rex_encoding;

  /* Disable instruction size optimization.  */
  bfd_boolean no_optimize;

  /* How to encode vector instructions.  */
  enum
    {
      vex_encoding_default = 0,
      vex_encoding_vex,
      vex_encoding_vex3,
      vex_encoding_evex,
      vex_encoding_error
    } vec_encoding;

  /* REP prefix.  */
  const char *rep_prefix;

  /* HLE prefix.  */
  const char *hle_prefix;

  /* Have BND prefix.  */
  const char *bnd_prefix;

  /* Have NOTRACK prefix.  */
  const char *notrack_prefix;

  /* Error message.  */
  enum i386_error error;
};

typedef struct _i386_insn i386_insn;

/* Link an RC type with its corresponding string, which will be looked
   for in the assembly input.  */
struct RC_name
{
  enum rc_type type;
  const char *name;
  unsigned int len;
};

static const struct RC_name RC_NamesTable[] =
{
  { rne, STRING_COMMA_LEN ("rn-sae") },
  { rd, STRING_COMMA_LEN ("rd-sae") },
  { ru, STRING_COMMA_LEN ("ru-sae") },
  { rz, STRING_COMMA_LEN ("rz-sae") },
  { saeonly, STRING_COMMA_LEN ("sae") },
};

/* List of chars besides those in app.c:symbol_chars that can start an
   operand.  Used to prevent the scrubber eating vital white-space.  */
const char extra_symbol_chars[] = "*%-([{}"
#ifdef LEX_AT
	"@"
#endif
#ifdef LEX_QM
	"?"
#endif
	;

#if ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
     && !defined (TE_GNU) \
     && !defined (TE_LINUX) \
     && !defined (TE_FreeBSD) \
     && !defined (TE_DragonFly) \
     && !defined (TE_NetBSD))
/* This array holds the chars that always start a comment.  If the
   pre-processor is disabled, these aren't very useful.  The option
   --divide will remove '/' from this list.  */
const char *i386_comment_chars = "#/";
#define SVR4_COMMENT_CHARS 1
#define PREFIX_SEPARATOR '\\'

#else
const char *i386_comment_chars = "#";
#define PREFIX_SEPARATOR '/'
#endif

/* This array holds the chars that only start a comment at the beginning of
   a line.  If the line seems to have the form '# 123 filename'
   .line and .file directives will appear in the pre-processed output.
   Note that input_file.c hand checks for '#' at the beginning of the
   first line of the input file.  This is because the compiler outputs
   #NO_APP at the beginning of its output.
   Also note that comments started like this one will always work if
   '/' isn't otherwise defined.  */
const char line_comment_chars[] = "#/";

const char line_separator_chars[] = ";";

/* Chars that can be used to separate mant from exp in floating point
   nums.  */
const char EXP_CHARS[] = "eE";

/* Chars that mean this number is a floating point constant
   As in 0f12.456
   or 0d1.2345e12.  */
const char FLT_CHARS[] = "fFdDxX";

/* Tables for lexical analysis.  */
static char mnemonic_chars[256];
static char register_chars[256];
static char operand_chars[256];
static char identifier_chars[256];
static char digit_chars[256];

/* Lexical macros.  */
#define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
#define is_operand_char(x) (operand_chars[(unsigned char) x])
#define is_register_char(x) (register_chars[(unsigned char) x])
#define is_space_char(x) ((x) == ' ')
#define is_identifier_char(x) (identifier_chars[(unsigned char) x])
#define is_digit_char(x) (digit_chars[(unsigned char) x])

/* All non-digit non-letter characters that may occur in an operand.  */
static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";

/* md_assemble() always leaves the strings it's passed unaltered.  To
   effect this we maintain a stack of saved characters that we've smashed
   with '\0's (indicating end of strings for various sub-fields of the
   assembler instruction).  */
static char save_stack[32];
static char *save_stack_p;
#define END_STRING_AND_SAVE(s) \
	do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
#define RESTORE_END_STRING(s) \
	do { *(s) = *--save_stack_p; } while (0)
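
/* Usage sketch (END_OF_FIELD is a hypothetical pointer into the insn
   string, not a name from this file):

     END_STRING_AND_SAVE (end_of_field);    saves *end_of_field, writes '\0'
     ...parse the now NUL-terminated sub-field...
     RESTORE_END_STRING (end_of_field);     puts the saved byte back

   Calls must nest properly, since save_stack is used as a LIFO stack
   of at most 32 saved characters.  */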

/* The instruction we're assembling.  */
static i386_insn i;

/* Possible templates for current insn.  */
static const templates *current_templates;

/* Per instruction expressionS buffers: max displacements & immediates.  */
static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];

/* Current operand we are working on.  */
static int this_operand = -1;

/* We support three different modes.  The FLAG_CODE variable is used to
   distinguish these.  */

enum flag_code {
	CODE_32BIT,
	CODE_16BIT,
	CODE_64BIT };

static enum flag_code flag_code;
static unsigned int object_64bit;
static unsigned int disallow_64bit_reloc;
static int use_rela_relocations = 0;
/* __tls_get_addr/___tls_get_addr symbol for TLS.  */
static const char *tls_get_addr;

#if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
     || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
     || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))

/* The ELF ABI to use.  */
enum x86_elf_abi
{
  I386_ABI,
  X86_64_ABI,
  X86_64_X32_ABI
};

static enum x86_elf_abi x86_elf_abi = I386_ABI;
#endif

#if defined (TE_PE) || defined (TE_PEP)
/* Use big object file format.  */
static int use_big_obj = 0;
#endif

#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
/* 1 if generating code for a shared library.  */
static int shared = 0;
#endif

/* 1 for intel syntax,
   0 if att syntax.  */
static int intel_syntax = 0;

static enum x86_64_isa
{
  amd64 = 1,	/* AMD64 ISA.  */
  intel64	/* Intel64 ISA.  */
} isa64;

/* 1 for intel mnemonic,
   0 if att mnemonic.  */
static int intel_mnemonic = !SYSV386_COMPAT;

/* 1 if pseudo registers are permitted.  */
static int allow_pseudo_reg = 0;

/* 1 if register prefix % not required.  */
static int allow_naked_reg = 0;

/* 1 if the assembler should add BND prefix for all control-transferring
   instructions supporting it, even if this prefix wasn't specified
   explicitly.  */
static int add_bnd_prefix = 0;

/* 1 if pseudo index register, eiz/riz, is allowed.  */
static int allow_index_reg = 0;

/* 1 if the assembler should ignore LOCK prefix, even if it was
   specified explicitly.  */
static int omit_lock_prefix = 0;

/* 1 if the assembler should encode lfence, mfence, and sfence as
   "lock addl $0, (%{re}sp)".  */
static int avoid_fence = 0;

/* 1 if lfence should be inserted after every load.  */
static int lfence_after_load = 0;

/* Non-zero if lfence should be inserted before indirect branch.  */
static enum lfence_before_indirect_branch_kind
  {
    lfence_branch_none = 0,
    lfence_branch_register,
    lfence_branch_memory,
    lfence_branch_all
  }
lfence_before_indirect_branch;

/* Non-zero if lfence should be inserted before ret.  */
static enum lfence_before_ret_kind
  {
    lfence_before_ret_none = 0,
    lfence_before_ret_not,
    lfence_before_ret_or,
    lfence_before_ret_shl
  }
lfence_before_ret;

/* Records whether the previous "instruction" was a .byte directive or
   a prefix.  */
static struct
  {
    segT seg;
    const char *file;
    const char *name;
    unsigned int line;
    enum last_insn_kind
      {
	last_insn_other = 0,
	last_insn_directive,
	last_insn_prefix
      } kind;
  } last_insn;

/* 1 if the assembler should generate relax relocations.  */

static int generate_relax_relocations
  = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;

static enum check_kind
  {
    check_none = 0,
    check_warning,
    check_error
  }
sse_check, operand_check = check_warning;

/* Non-zero if branches should be aligned within a power-of-2 boundary.  */
static int align_branch_power = 0;

/* Types of branches to align.  */
enum align_branch_kind
  {
    align_branch_none = 0,
    align_branch_jcc = 1,
    align_branch_fused = 2,
    align_branch_jmp = 3,
    align_branch_call = 4,
    align_branch_indirect = 5,
    align_branch_ret = 6
  };

/* Type bits of branches to align.  */
enum align_branch_bit
  {
    align_branch_jcc_bit = 1 << align_branch_jcc,
    align_branch_fused_bit = 1 << align_branch_fused,
    align_branch_jmp_bit = 1 << align_branch_jmp,
    align_branch_call_bit = 1 << align_branch_call,
    align_branch_indirect_bit = 1 << align_branch_indirect,
    align_branch_ret_bit = 1 << align_branch_ret
  };

static unsigned int align_branch = (align_branch_jcc_bit
				    | align_branch_fused_bit
				    | align_branch_jmp_bit);

/* Types of conditional jump used by macro-fusion.  */
enum mf_jcc_kind
  {
    mf_jcc_jo = 0,  /* base opcode 0x70  */
    mf_jcc_jc,      /* base opcode 0x72  */
    mf_jcc_je,      /* base opcode 0x74  */
    mf_jcc_jna,     /* base opcode 0x76  */
    mf_jcc_js,      /* base opcode 0x78  */
    mf_jcc_jp,      /* base opcode 0x7a  */
    mf_jcc_jl,      /* base opcode 0x7c  */
    mf_jcc_jle,     /* base opcode 0x7e  */
  };

/* Types of compare flag-modifying instructions used by macro-fusion.  */
enum mf_cmp_kind
  {
    mf_cmp_test_and,  /* test/cmp */
    mf_cmp_alu_cmp,   /* add/sub/cmp */
    mf_cmp_incdec     /* inc/dec */
  };

/* The maximum padding size for fused jcc.  A CMP-like instruction can
   be 9 bytes and a jcc can be 6 bytes.  Leave room just in case for
   prefixes.  */
#define MAX_FUSED_JCC_PADDING_SIZE 20

/* The maximum number of prefixes added for an instruction.  */
static unsigned int align_branch_prefix_size = 5;

/* Optimization:
   1. Clear the REX_W bit with register operand if possible.
   2. Above plus use 128bit vector instruction to clear the full vector
      register.
 */
static int optimize = 0;

/* Optimization:
   1. Clear the REX_W bit with register operand if possible.
   2. Above plus use 128bit vector instruction to clear the full vector
      register.
   3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
      "testb $imm7,%r8".
 */
static int optimize_for_space = 0;

/* Register prefix used for error message.  */
static const char *register_prefix = "%";

/* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
   leave, push, and pop instructions so that gcc has the same stack
   frame as in 32 bit mode.  */
static char stackop_size = '\0';

/* Non-zero to optimize code alignment.  */
int optimize_align_code = 1;

/* Non-zero to quieten some warnings.  */
static int quiet_warnings = 0;

/* CPU name.  */
static const char *cpu_arch_name = NULL;
static char *cpu_sub_arch_name = NULL;

/* CPU feature flags.  */
static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;

/* If we have selected a cpu we are generating instructions for.  */
static int cpu_arch_tune_set = 0;

/* Cpu we are generating instructions for.  */
enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;

/* CPU feature flags of cpu we are generating instructions for.  */
static i386_cpu_flags cpu_arch_tune_flags;

/* CPU instruction set architecture used.  */
enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;

/* CPU feature flags of instruction set architecture used.  */
i386_cpu_flags cpu_arch_isa_flags;

/* If set, conditional jumps are not automatically promoted to handle
   larger than a byte offset.  */
static unsigned int no_cond_jump_promotion = 0;

/* Encode SSE instructions with VEX prefix.  */
static unsigned int sse2avx;

/* Encode scalar AVX instructions with specific vector length.  */
static enum
  {
    vex128 = 0,
    vex256
  } avxscalar;

/* Encode VEX WIG instructions with specific vex.w.  */
static enum
  {
    vexw0 = 0,
    vexw1
  } vexwig;

/* Encode scalar EVEX LIG instructions with specific vector length.  */
static enum
  {
    evexl128 = 0,
    evexl256,
    evexl512
  } evexlig;

/* Encode EVEX WIG instructions with specific evex.w.  */
static enum
  {
    evexw0 = 0,
    evexw1
  } evexwig;

/* Value to encode in EVEX RC bits, for SAE-only instructions.  */
static enum rc_type evexrcig = rne;

/* Pre-defined "_GLOBAL_OFFSET_TABLE_".  */
static symbolS *GOT_symbol;

/* The dwarf2 return column, adjusted for 32 or 64 bit.  */
unsigned int x86_dwarf2_return_column;

/* The dwarf2 data alignment, adjusted for 32 or 64 bit.  */
int x86_cie_data_alignment;

/* Interface to relax_segment.
   There are 3 major relax states for 386 jump insns because the
   different types of jumps add different sizes to frags when we're
   figuring out what sort of jump to choose to reach a given label.

   BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
   branches which are handled by md_estimate_size_before_relax() and
   i386_generic_table_relax_frag().  */

/* Types.  */
#define UNCOND_JUMP 0
#define COND_JUMP 1
#define COND_JUMP86 2
#define BRANCH_PADDING 3
#define BRANCH_PREFIX 4
#define FUSED_JCC_PADDING 5

/* Sizes.  */
#define CODE16	1
#define SMALL	0
#define SMALL16 (SMALL | CODE16)
#define BIG	2
#define BIG16	(BIG | CODE16)

#ifndef INLINE
#ifdef __GNUC__
#define INLINE __inline__
#else
#define INLINE
#endif
#endif

#define ENCODE_RELAX_STATE(type, size) \
  ((relax_substateT) (((type) << 2) | (size)))
#define TYPE_FROM_RELAX_STATE(s) \
  ((s) >> 2)
#define DISP_SIZE_FROM_RELAX_STATE(s) \
    ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
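
/* Worked example (sketch): ENCODE_RELAX_STATE (COND_JUMP, BIG) yields
   (1 << 2) | 2 == 6, from which TYPE_FROM_RELAX_STATE recovers
   6 >> 2 == COND_JUMP and DISP_SIZE_FROM_RELAX_STATE recovers a 4-byte
   displacement, since (6 & 3) == BIG.  */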

/* This table is used by relax_frag to promote short jumps to long
   ones where necessary.  SMALL (short) jumps may be promoted to BIG
   (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long).  We
   don't allow a short jump in a 32 bit code segment to be promoted to
   a 16 bit offset jump because it's slower (requires data size
   prefix), and doesn't work, unless the destination is in the bottom
   64k of the code segment (The top 16 bits of eip are zeroed).  */

const relax_typeS md_relax_table[] =
{
  /* The fields are:
     1) most positive reach of this state,
     2) most negative reach of this state,
     3) how many bytes this mode will have in the variable part of the frag
     4) which index into the table to try if we can't fit into this one.  */

  /* UNCOND_JUMP states.  */
  {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
  {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
  /* dword jmp adds 4 bytes to frag:
     0 extra opcode bytes, 4 displacement bytes.  */
  {0, 0, 4, 0},
  /* word jmp adds 2 bytes to frag:
     0 extra opcode bytes, 2 displacement bytes.  */
  {0, 0, 2, 0},

  /* COND_JUMP states.  */
  {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
  {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
  /* dword conditionals add 5 bytes to frag:
     1 extra opcode byte, 4 displacement bytes.  */
  {0, 0, 5, 0},
  /* word conditionals add 3 bytes to frag:
     1 extra opcode byte, 2 displacement bytes.  */
  {0, 0, 3, 0},

  /* COND_JUMP86 states.  */
  {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
  {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
  /* dword conditionals add 5 bytes to frag:
     1 extra opcode byte, 4 displacement bytes.  */
  {0, 0, 5, 0},
  /* word conditionals add 4 bytes to frag:
     1 displacement byte and a 3 byte long branch insn.  */
  {0, 0, 4, 0}
};
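
/* Reading the table (illustrative sketch): a conditional jump starts
   in state ENCODE_RELAX_STATE (COND_JUMP, SMALL) == 4; that entry says
   a 1-byte displacement reaches at most +128/-127 bytes.  If the
   target is out of range, relax_frag follows field 4) to
   ENCODE_RELAX_STATE (COND_JUMP, BIG) == 6, the {0, 0, 5, 0} entry,
   growing the frag by the 5 bytes of the dword form.  */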

static const arch_entry cpu_arch[] =
{
  /* Do not replace the first two entries - i386_target_format()
     relies on them being there in this order.  */
  { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
    CPU_GENERIC32_FLAGS, 0 },
  { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
    CPU_GENERIC64_FLAGS, 0 },
  { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
    CPU_NONE_FLAGS, 0 },
  { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
    CPU_I186_FLAGS, 0 },
  { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
    CPU_I286_FLAGS, 0 },
  { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
    CPU_I386_FLAGS, 0 },
  { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
    CPU_I486_FLAGS, 0 },
  { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
    CPU_I586_FLAGS, 0 },
  { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
    CPU_I686_FLAGS, 0 },
  { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
    CPU_I586_FLAGS, 0 },
  { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
    CPU_PENTIUMPRO_FLAGS, 0 },
  { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
    CPU_P2_FLAGS, 0 },
  { STRING_COMMA_LEN ("pentiumiii"), PROCESSOR_PENTIUMPRO,
    CPU_P3_FLAGS, 0 },
  { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
    CPU_P4_FLAGS, 0 },
  { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
    CPU_CORE_FLAGS, 0 },
  { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
    CPU_NOCONA_FLAGS, 0 },
  { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
    CPU_CORE_FLAGS, 1 },
  { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
    CPU_CORE_FLAGS, 0 },
  { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
    CPU_CORE2_FLAGS, 1 },
  { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
    CPU_CORE2_FLAGS, 0 },
  { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
    CPU_COREI7_FLAGS, 0 },
  { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
    CPU_L1OM_FLAGS, 0 },
  { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
    CPU_K1OM_FLAGS, 0 },
  { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
    CPU_IAMCU_FLAGS, 0 },
  { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
    CPU_K6_FLAGS, 0 },
  { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
    CPU_K6_2_FLAGS, 0 },
  { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
    CPU_ATHLON_FLAGS, 0 },
  { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
    CPU_K8_FLAGS, 1 },
  { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
    CPU_K8_FLAGS, 0 },
  { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
    CPU_K8_FLAGS, 0 },
  { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
    CPU_AMDFAM10_FLAGS, 0 },
  { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
    CPU_BDVER1_FLAGS, 0 },
  { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
    CPU_BDVER2_FLAGS, 0 },
  { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
    CPU_BDVER3_FLAGS, 0 },
  { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
    CPU_BDVER4_FLAGS, 0 },
  { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
    CPU_ZNVER1_FLAGS, 0 },
  { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
    CPU_ZNVER2_FLAGS, 0 },
  { STRING_COMMA_LEN ("znver3"), PROCESSOR_ZNVER,
    CPU_ZNVER3_FLAGS, 0 },
  { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
    CPU_BTVER1_FLAGS, 0 },
  { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
    CPU_BTVER2_FLAGS, 0 },
  { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
    CPU_8087_FLAGS, 0 },
  { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
    CPU_287_FLAGS, 0 },
  { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
    CPU_387_FLAGS, 0 },
  { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
    CPU_687_FLAGS, 0 },
  { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
    CPU_CMOV_FLAGS, 0 },
  { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
    CPU_FXSR_FLAGS, 0 },
  { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
    CPU_MMX_FLAGS, 0 },
  { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
    CPU_SSE_FLAGS, 0 },
  { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
    CPU_SSE2_FLAGS, 0 },
  { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
    CPU_SSE3_FLAGS, 0 },
  { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
    CPU_SSE4A_FLAGS, 0 },
  { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
    CPU_SSSE3_FLAGS, 0 },
  { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
    CPU_SSE4_1_FLAGS, 0 },
  { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
    CPU_SSE4_2_FLAGS, 0 },
  { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
    CPU_SSE4_2_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
    CPU_AVX_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
    CPU_AVX2_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
    CPU_AVX512F_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
    CPU_AVX512CD_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
    CPU_AVX512ER_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
    CPU_AVX512PF_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
    CPU_AVX512DQ_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
    CPU_AVX512BW_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
    CPU_AVX512VL_FLAGS, 0 },
  { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
    CPU_VMX_FLAGS, 0 },
  { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
    CPU_VMFUNC_FLAGS, 0 },
  { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
    CPU_SMX_FLAGS, 0 },
  { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
    CPU_XSAVE_FLAGS, 0 },
  { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
    CPU_XSAVEOPT_FLAGS, 0 },
  { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
    CPU_XSAVEC_FLAGS, 0 },
  { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
    CPU_XSAVES_FLAGS, 0 },
  { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
    CPU_AES_FLAGS, 0 },
  { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
    CPU_PCLMUL_FLAGS, 0 },
  { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
    CPU_PCLMUL_FLAGS, 1 },
  { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
    CPU_FSGSBASE_FLAGS, 0 },
  { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
    CPU_RDRND_FLAGS, 0 },
  { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
    CPU_F16C_FLAGS, 0 },
  { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
    CPU_BMI2_FLAGS, 0 },
  { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
    CPU_FMA_FLAGS, 0 },
  { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
    CPU_FMA4_FLAGS, 0 },
  { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
    CPU_XOP_FLAGS, 0 },
  { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
    CPU_LWP_FLAGS, 0 },
  { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
    CPU_MOVBE_FLAGS, 0 },
  { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
    CPU_CX16_FLAGS, 0 },
  { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
    CPU_EPT_FLAGS, 0 },
  { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
    CPU_LZCNT_FLAGS, 0 },
  { STRING_COMMA_LEN (".popcnt"), PROCESSOR_UNKNOWN,
    CPU_POPCNT_FLAGS, 0 },
  { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
    CPU_HLE_FLAGS, 0 },
  { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
    CPU_RTM_FLAGS, 0 },
  { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
    CPU_INVPCID_FLAGS, 0 },
  { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
    CPU_CLFLUSH_FLAGS, 0 },
  { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
    CPU_NOP_FLAGS, 0 },
  { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
    CPU_SYSCALL_FLAGS, 0 },
  { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
    CPU_RDTSCP_FLAGS, 0 },
  { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
    CPU_3DNOW_FLAGS, 0 },
  { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
    CPU_3DNOWA_FLAGS, 0 },
  { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
    CPU_PADLOCK_FLAGS, 0 },
  { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
    CPU_SVME_FLAGS, 1 },
  { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
    CPU_SVME_FLAGS, 0 },
  { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
    CPU_SSE4A_FLAGS, 0 },
  { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
    CPU_ABM_FLAGS, 0 },
  { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
    CPU_BMI_FLAGS, 0 },
  { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
    CPU_TBM_FLAGS, 0 },
  { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
    CPU_ADX_FLAGS, 0 },
  { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
    CPU_RDSEED_FLAGS, 0 },
  { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
    CPU_PRFCHW_FLAGS, 0 },
  { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
    CPU_SMAP_FLAGS, 0 },
  { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
    CPU_MPX_FLAGS, 0 },
  { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
    CPU_SHA_FLAGS, 0 },
  { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
    CPU_CLFLUSHOPT_FLAGS, 0 },
  { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
    CPU_PREFETCHWT1_FLAGS, 0 },
  { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
    CPU_SE1_FLAGS, 0 },
  { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
    CPU_CLWB_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
    CPU_AVX512IFMA_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
    CPU_AVX512VBMI_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
    CPU_AVX512_4FMAPS_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
    CPU_AVX512_4VNNIW_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
    CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
    CPU_AVX512_VBMI2_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
    CPU_AVX512_VNNI_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
    CPU_AVX512_BITALG_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx_vnni"), PROCESSOR_UNKNOWN,
    CPU_AVX_VNNI_FLAGS, 0 },
  { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
    CPU_CLZERO_FLAGS, 0 },
  { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
    CPU_MWAITX_FLAGS, 0 },
  { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
    CPU_OSPKE_FLAGS, 0 },
  { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
    CPU_RDPID_FLAGS, 0 },
  { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
    CPU_PTWRITE_FLAGS, 0 },
  { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
    CPU_IBT_FLAGS, 0 },
  { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
    CPU_SHSTK_FLAGS, 0 },
  { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
    CPU_GFNI_FLAGS, 0 },
  { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
    CPU_VAES_FLAGS, 0 },
  { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
    CPU_VPCLMULQDQ_FLAGS, 0 },
  { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
    CPU_WBNOINVD_FLAGS, 0 },
  { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
    CPU_PCONFIG_FLAGS, 0 },
  { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
    CPU_WAITPKG_FLAGS, 0 },
  { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
    CPU_CLDEMOTE_FLAGS, 0 },
  { STRING_COMMA_LEN (".amx_int8"), PROCESSOR_UNKNOWN,
    CPU_AMX_INT8_FLAGS, 0 },
  { STRING_COMMA_LEN (".amx_bf16"), PROCESSOR_UNKNOWN,
    CPU_AMX_BF16_FLAGS, 0 },
  { STRING_COMMA_LEN (".amx_tile"), PROCESSOR_UNKNOWN,
    CPU_AMX_TILE_FLAGS, 0 },
  { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
    CPU_MOVDIRI_FLAGS, 0 },
  { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
    CPU_MOVDIR64B_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
    CPU_AVX512_BF16_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
    CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
  { STRING_COMMA_LEN (".tdx"), PROCESSOR_UNKNOWN,
    CPU_TDX_FLAGS, 0 },
  { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
    CPU_ENQCMD_FLAGS, 0 },
  { STRING_COMMA_LEN (".serialize"), PROCESSOR_UNKNOWN,
    CPU_SERIALIZE_FLAGS, 0 },
  { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
    CPU_RDPRU_FLAGS, 0 },
  { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
    CPU_MCOMMIT_FLAGS, 0 },
  { STRING_COMMA_LEN (".sev_es"), PROCESSOR_UNKNOWN,
    CPU_SEV_ES_FLAGS, 0 },
  { STRING_COMMA_LEN (".tsxldtrk"), PROCESSOR_UNKNOWN,
    CPU_TSXLDTRK_FLAGS, 0 },
  { STRING_COMMA_LEN (".kl"), PROCESSOR_UNKNOWN,
    CPU_KL_FLAGS, 0 },
  { STRING_COMMA_LEN (".widekl"), PROCESSOR_UNKNOWN,
    CPU_WIDEKL_FLAGS, 0 },
  { STRING_COMMA_LEN (".uintr"), PROCESSOR_UNKNOWN,
    CPU_UINTR_FLAGS, 0 },
  { STRING_COMMA_LEN (".hreset"), PROCESSOR_UNKNOWN,
    CPU_HRESET_FLAGS, 0 },
};

static const noarch_entry cpu_noarch[] =
{
  { STRING_COMMA_LEN ("no87"), CPU_ANY_X87_FLAGS },
  { STRING_COMMA_LEN ("no287"), CPU_ANY_287_FLAGS },
  { STRING_COMMA_LEN ("no387"), CPU_ANY_387_FLAGS },
  { STRING_COMMA_LEN ("no687"), CPU_ANY_687_FLAGS },
  { STRING_COMMA_LEN ("nocmov"), CPU_ANY_CMOV_FLAGS },
  { STRING_COMMA_LEN ("nofxsr"), CPU_ANY_FXSR_FLAGS },
  { STRING_COMMA_LEN ("nommx"), CPU_ANY_MMX_FLAGS },
  { STRING_COMMA_LEN ("nosse"), CPU_ANY_SSE_FLAGS },
  { STRING_COMMA_LEN ("nosse2"), CPU_ANY_SSE2_FLAGS },
  { STRING_COMMA_LEN ("nosse3"), CPU_ANY_SSE3_FLAGS },
  { STRING_COMMA_LEN ("nosse4a"), CPU_ANY_SSE4A_FLAGS },
  { STRING_COMMA_LEN ("nossse3"), CPU_ANY_SSSE3_FLAGS },
  { STRING_COMMA_LEN ("nosse4.1"), CPU_ANY_SSE4_1_FLAGS },
  { STRING_COMMA_LEN ("nosse4.2"), CPU_ANY_SSE4_2_FLAGS },
  { STRING_COMMA_LEN ("nosse4"), CPU_ANY_SSE4_1_FLAGS },
  { STRING_COMMA_LEN ("noavx"), CPU_ANY_AVX_FLAGS },
  { STRING_COMMA_LEN ("noavx2"), CPU_ANY_AVX2_FLAGS },
  { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
  { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
  { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
  { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
  { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
  { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
  { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
  { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
  { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
  { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
  { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
  { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
  { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
  { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
  { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
  { STRING_COMMA_LEN ("noavx_vnni"), CPU_ANY_AVX_VNNI_FLAGS },
  { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
  { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
  { STRING_COMMA_LEN ("noamx_int8"), CPU_ANY_AMX_INT8_FLAGS },
  { STRING_COMMA_LEN ("noamx_bf16"), CPU_ANY_AMX_BF16_FLAGS },
  { STRING_COMMA_LEN ("noamx_tile"), CPU_ANY_AMX_TILE_FLAGS },
  { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
  { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
  { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
  { STRING_COMMA_LEN ("noavx512_vp2intersect"),
    CPU_ANY_AVX512_VP2INTERSECT_FLAGS },
  { STRING_COMMA_LEN ("notdx"), CPU_ANY_TDX_FLAGS },
  { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
  { STRING_COMMA_LEN ("noserialize"), CPU_ANY_SERIALIZE_FLAGS },
  { STRING_COMMA_LEN ("notsxldtrk"), CPU_ANY_TSXLDTRK_FLAGS },
  { STRING_COMMA_LEN ("nokl"), CPU_ANY_KL_FLAGS },
  { STRING_COMMA_LEN ("nowidekl"), CPU_ANY_WIDEKL_FLAGS },
  { STRING_COMMA_LEN ("nouintr"), CPU_ANY_UINTR_FLAGS },
  { STRING_COMMA_LEN ("nohreset"), CPU_ANY_HRESET_FLAGS },
};

#ifdef I386COFF
/* Like s_lcomm_internal in gas/read.c but the alignment string
   is allowed to be optional.  */

static symbolS *
pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
{
  addressT align = 0;

  SKIP_WHITESPACE ();

  if (needs_align
      && *input_line_pointer == ',')
    {
      align = parse_align (needs_align - 1);

      if (align == (addressT) -1)
	return NULL;
    }
  else
    {
      if (size >= 8)
	align = 3;
      else if (size >= 4)
	align = 2;
      else if (size >= 2)
	align = 1;
      else
	align = 0;
    }

  bss_alloc (symbolP, size, align);
  return symbolP;
}

static void
pe_lcomm (int needs_align)
{
  s_comm_internal (needs_align * 2, pe_lcomm_internal);
}
#endif

const pseudo_typeS md_pseudo_table[] =
{
#if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
  {"align", s_align_bytes, 0},
#else
  {"align", s_align_ptwo, 0},
#endif
  {"arch", set_cpu_arch, 0},
#ifndef I386COFF
  {"bss", s_bss, 0},
#else
  {"lcomm", pe_lcomm, 1},
#endif
  {"ffloat", float_cons, 'f'},
  {"dfloat", float_cons, 'd'},
  {"tfloat", float_cons, 'x'},
  {"value", cons, 2},
  {"slong", signed_cons, 4},
  {"noopt", s_ignore, 0},
  {"optim", s_ignore, 0},
  {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
  {"code16", set_code_flag, CODE_16BIT},
  {"code32", set_code_flag, CODE_32BIT},
#ifdef BFD64
  {"code64", set_code_flag, CODE_64BIT},
#endif
  {"intel_syntax", set_intel_syntax, 1},
  {"att_syntax", set_intel_syntax, 0},
  {"intel_mnemonic", set_intel_mnemonic, 1},
  {"att_mnemonic", set_intel_mnemonic, 0},
  {"allow_index_reg", set_allow_index_reg, 1},
  {"disallow_index_reg", set_allow_index_reg, 0},
  {"sse_check", set_check, 0},
  {"operand_check", set_check, 1},
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
  {"largecomm", handle_large_common, 0},
#else
  {"file", dwarf2_directive_file, 0},
  {"loc", dwarf2_directive_loc, 0},
  {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
#endif
#ifdef TE_PE
  {"secrel32", pe_directive_secrel, 0},
#endif
  {0, 0, 0}
};

/* For interface with expression ().  */
extern char *input_line_pointer;

/* Hash table for instruction mnemonic lookup.  */
static htab_t op_hash;

/* Hash table for register lookup.  */
static htab_t reg_hash;
\f
/* Various efficient no-op patterns for aligning code labels.
   Note: Don't try to assemble the instructions in the comments.
   0L and 0w are not legal.  */
static const unsigned char f32_1[] =
  {0x90};				/* nop			*/
static const unsigned char f32_2[] =
  {0x66,0x90};				/* xchg %ax,%ax		*/
static const unsigned char f32_3[] =
  {0x8d,0x76,0x00};			/* leal 0(%esi),%esi	*/
static const unsigned char f32_4[] =
  {0x8d,0x74,0x26,0x00};		/* leal 0(%esi,1),%esi	*/
static const unsigned char f32_6[] =
  {0x8d,0xb6,0x00,0x00,0x00,0x00};	/* leal 0L(%esi),%esi	*/
static const unsigned char f32_7[] =
  {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00};	/* leal 0L(%esi,1),%esi	*/
static const unsigned char f16_3[] =
  {0x8d,0x74,0x00};			/* lea 0(%si),%si	*/
static const unsigned char f16_4[] =
  {0x8d,0xb4,0x00,0x00};		/* lea 0W(%si),%si	*/
static const unsigned char jump_disp8[] =
  {0xeb};				/* jmp disp8		*/
static const unsigned char jump32_disp32[] =
  {0xe9};				/* jmp disp32		*/
static const unsigned char jump16_disp32[] =
  {0x66,0xe9};				/* jmp disp32		*/
/* 32-bit NOPs patterns.  */
static const unsigned char *const f32_patt[] = {
  f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
};
/* 16-bit NOPs patterns.  */
static const unsigned char *const f16_patt[] = {
  f32_1, f32_2, f16_3, f16_4
};
/* nopl (%[re]ax) */
static const unsigned char alt_3[] =
  {0x0f,0x1f,0x00};
/* nopl 0(%[re]ax) */
static const unsigned char alt_4[] =
  {0x0f,0x1f,0x40,0x00};
/* nopl 0(%[re]ax,%[re]ax,1) */
static const unsigned char alt_5[] =
  {0x0f,0x1f,0x44,0x00,0x00};
/* nopw 0(%[re]ax,%[re]ax,1) */
static const unsigned char alt_6[] =
  {0x66,0x0f,0x1f,0x44,0x00,0x00};
/* nopl 0L(%[re]ax) */
static const unsigned char alt_7[] =
  {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
/* nopl 0L(%[re]ax,%[re]ax,1) */
static const unsigned char alt_8[] =
  {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
/* nopw 0L(%[re]ax,%[re]ax,1) */
static const unsigned char alt_9[] =
  {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
/* nopw %cs:0L(%[re]ax,%[re]ax,1) */
static const unsigned char alt_10[] =
  {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
/* data16 nopw %cs:0L(%eax,%eax,1) */
static const unsigned char alt_11[] =
  {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
/* 32-bit and 64-bit NOPs patterns.  */
static const unsigned char *const alt_patt[] = {
  f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
  alt_9, alt_10, alt_11
};
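
/* Example (sketch): a 4-byte fill taken from alt_patt ends up using
   alt_patt[4 - 1], i.e. the single 4-byte instruction "nopl 0(%[re]ax)"
   (0f 1f 40 00), rather than four 1-byte 0x90 NOPs.  */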

/* Generate COUNT bytes of NOPs to WHERE from PATT with the maximum
   size of a single NOP instruction MAX_SINGLE_NOP_SIZE.  */

static void
i386_output_nops (char *where, const unsigned char *const *patt,
		  int count, int max_single_nop_size)

{
  /* Place the longer NOP first.  */
  int last;
  int offset;
  const unsigned char *nops;

  if (max_single_nop_size < 1)
    {
      as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
		max_single_nop_size);
      return;
    }

  nops = patt[max_single_nop_size - 1];

  /* Use the smaller one if the requested one isn't available.  */
  if (nops == NULL)
    {
      max_single_nop_size--;
      nops = patt[max_single_nop_size - 1];
    }

  last = count % max_single_nop_size;

  count -= last;
  for (offset = 0; offset < count; offset += max_single_nop_size)
    memcpy (where + offset, nops, max_single_nop_size);

  if (last)
    {
      nops = patt[last - 1];
      if (nops == NULL)
	{
	  /* Use the smaller one plus one-byte NOP if the needed one
	     isn't available.  */
	  last--;
	  nops = patt[last - 1];
	  memcpy (where + offset, nops, last);
	  where[offset + last] = *patt[0];
	}
      else
	memcpy (where + offset, nops, last);
    }
}
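
/* Worked example (sketch): with f32_patt and count == 9,
   max_single_nop_size == 7, the loop emits one 7-byte NOP (f32_7) and
   the remainder of 2 bytes is covered by f32_patt[2 - 1], the 2-byte
   "xchg %ax,%ax"; a remainder of 5 would instead fall back to
   f32_patt[4 - 1] plus a single 0x90, since f32_patt[5 - 1] is NULL.  */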

static INLINE int
fits_in_imm7 (offsetT num)
{
  return (num & 0x7f) == num;
}

static INLINE int
fits_in_imm31 (offsetT num)
{
  return (num & 0x7fffffff) == num;
}
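
/* Note (illustrative): these are non-negative range checks, e.g.
   fits_in_imm7 (127) is true but fits_in_imm7 (-1) is false, since
   masking a negative offsetT clears its sign bits and the equality
   comparison then fails.  */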
1535
1536 /* Genenerate COUNT bytes of NOPs to WHERE with the maximum size of a
1537 single NOP instruction LIMIT. */
1538
1539 void
1540 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1541 {
1542 const unsigned char *const *patt = NULL;
1543 int max_single_nop_size;
1544 /* Maximum number of NOPs before switching to jump over NOPs. */
1545 int max_number_of_nops;
1546
1547 switch (fragP->fr_type)
1548 {
1549 case rs_fill_nop:
1550 case rs_align_code:
1551 break;
1552 case rs_machine_dependent:
1553 /* Allow NOP padding for jumps and calls. */
1554 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
1555 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
1556 break;
1557 /* Fall through. */
1558 default:
1559 return;
1560 }
1561
1562 /* We need to decide which NOP sequence to use for 32bit and
1563 64bit. When -mtune= is used:
1564
1565 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1566 PROCESSOR_GENERIC32, f32_patt will be used.
1567 2. For the rest, alt_patt will be used.
1568
1569 When -mtune= isn't used, alt_patt will be used if
1570 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
1571 be used.
1572
1573 When -march= or .arch is used, we can't use anything beyond
1574 cpu_arch_isa_flags. */
1575
1576 if (flag_code == CODE_16BIT)
1577 {
1578 patt = f16_patt;
1579 max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1580 /* Limit number of NOPs to 2 in 16-bit mode. */
1581 max_number_of_nops = 2;
1582 }
1583 else
1584 {
1585 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1586 {
1587 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1588 switch (cpu_arch_tune)
1589 {
1590 case PROCESSOR_UNKNOWN:
1591 /* We use cpu_arch_isa_flags to check if we SHOULD
1592 optimize with nops. */
1593 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1594 patt = alt_patt;
1595 else
1596 patt = f32_patt;
1597 break;
1598 case PROCESSOR_PENTIUM4:
1599 case PROCESSOR_NOCONA:
1600 case PROCESSOR_CORE:
1601 case PROCESSOR_CORE2:
1602 case PROCESSOR_COREI7:
1603 case PROCESSOR_L1OM:
1604 case PROCESSOR_K1OM:
1605 case PROCESSOR_GENERIC64:
1606 case PROCESSOR_K6:
1607 case PROCESSOR_ATHLON:
1608 case PROCESSOR_K8:
1609 case PROCESSOR_AMDFAM10:
1610 case PROCESSOR_BD:
1611 case PROCESSOR_ZNVER:
1612 case PROCESSOR_BT:
1613 patt = alt_patt;
1614 break;
1615 case PROCESSOR_I386:
1616 case PROCESSOR_I486:
1617 case PROCESSOR_PENTIUM:
1618 case PROCESSOR_PENTIUMPRO:
1619 case PROCESSOR_IAMCU:
1620 case PROCESSOR_GENERIC32:
1621 patt = f32_patt;
1622 break;
1623 }
1624 }
1625 else
1626 {
1627 switch (fragP->tc_frag_data.tune)
1628 {
1629 case PROCESSOR_UNKNOWN:
1630 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1631 PROCESSOR_UNKNOWN. */
1632 abort ();
1633 break;
1634
1635 case PROCESSOR_I386:
1636 case PROCESSOR_I486:
1637 case PROCESSOR_PENTIUM:
1638 case PROCESSOR_IAMCU:
1639 case PROCESSOR_K6:
1640 case PROCESSOR_ATHLON:
1641 case PROCESSOR_K8:
1642 case PROCESSOR_AMDFAM10:
1643 case PROCESSOR_BD:
1644 case PROCESSOR_ZNVER:
1645 case PROCESSOR_BT:
1646 case PROCESSOR_GENERIC32:
1647 /* We use cpu_arch_isa_flags to check if we CAN optimize
1648 with nops. */
1649 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1650 patt = alt_patt;
1651 else
1652 patt = f32_patt;
1653 break;
1654 case PROCESSOR_PENTIUMPRO:
1655 case PROCESSOR_PENTIUM4:
1656 case PROCESSOR_NOCONA:
1657 case PROCESSOR_CORE:
1658 case PROCESSOR_CORE2:
1659 case PROCESSOR_COREI7:
1660 case PROCESSOR_L1OM:
1661 case PROCESSOR_K1OM:
1662 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1663 patt = alt_patt;
1664 else
1665 patt = f32_patt;
1666 break;
1667 case PROCESSOR_GENERIC64:
1668 patt = alt_patt;
1669 break;
1670 }
1671 }
1672
1673 if (patt == f32_patt)
1674 {
1675 max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1676 /* Limit number of NOPs to 2 for older processors. */
1677 max_number_of_nops = 2;
1678 }
1679 else
1680 {
1681 max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1682 /* Limit number of NOPs to 7 for newer processors. */
1683 max_number_of_nops = 7;
1684 }
1685 }
1686
1687 if (limit == 0)
1688 limit = max_single_nop_size;
1689
1690 if (fragP->fr_type == rs_fill_nop)
1691 {
1692 /* Output NOPs for .nop directive. */
1693 if (limit > max_single_nop_size)
1694 {
1695 as_bad_where (fragP->fr_file, fragP->fr_line,
1696 _("invalid single nop size: %d "
1697 "(expect within [0, %d])"),
1698 limit, max_single_nop_size);
1699 return;
1700 }
1701 }
1702 else if (fragP->fr_type != rs_machine_dependent)
1703 fragP->fr_var = count;
1704
1705 if ((count / max_single_nop_size) > max_number_of_nops)
1706 {
1707 /* Generate jump over NOPs. */
1708 offsetT disp = count - 2;
1709 if (fits_in_imm7 (disp))
1710 {
1711 /* Use "jmp disp8" if possible. */
1712 count = disp;
1713 where[0] = jump_disp8[0];
1714 where[1] = count;
1715 where += 2;
1716 }
1717 else
1718 {
1719 unsigned int size_of_jump;
1720
1721 if (flag_code == CODE_16BIT)
1722 {
1723 where[0] = jump16_disp32[0];
1724 where[1] = jump16_disp32[1];
1725 size_of_jump = 2;
1726 }
1727 else
1728 {
1729 where[0] = jump32_disp32[0];
1730 size_of_jump = 1;
1731 }
1732
1733 count -= size_of_jump + 4;
1734 if (!fits_in_imm31 (count))
1735 {
1736 as_bad_where (fragP->fr_file, fragP->fr_line,
1737 _("jump over nop padding out of range"));
1738 return;
1739 }
1740
1741 md_number_to_chars (where + size_of_jump, count, 4);
1742 where += size_of_jump + 4;
1743 }
1744 }
1745
1746 /* Generate multiple NOPs. */
1747 i386_output_nops (where, patt, count, limit);
1748 }
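/* Worked example of the jump-over-NOPs path above, assuming 32-bit code
   and a requested padding of 100 bytes that exceeds max_number_of_nops
   single NOPs: disp = 100 - 2 = 98 fits in imm7, so a short jump (the
   jump_disp8 opcode, 0xEB) is emitted first:

       EB 62                    jmp  .+0x62  (over the padding)
       <98 bytes of NOPs>

   Execution skips the padding with one cheap branch instead of stepping
   through dozens of NOPs; displacements beyond 127 fall back to the
   rel32 jump form handled in the else branch.  */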
1749
1750 static INLINE int
1751 operand_type_all_zero (const union i386_operand_type *x)
1752 {
1753 switch (ARRAY_SIZE(x->array))
1754 {
1755 case 3:
1756 if (x->array[2])
1757 return 0;
1758 /* Fall through. */
1759 case 2:
1760 if (x->array[1])
1761 return 0;
1762 /* Fall through. */
1763 case 1:
1764 return !x->array[0];
1765 default:
1766 abort ();
1767 }
1768 }
1769
1770 static INLINE void
1771 operand_type_set (union i386_operand_type *x, unsigned int v)
1772 {
1773 switch (ARRAY_SIZE(x->array))
1774 {
1775 case 3:
1776 x->array[2] = v;
1777 /* Fall through. */
1778 case 2:
1779 x->array[1] = v;
1780 /* Fall through. */
1781 case 1:
1782 x->array[0] = v;
1784 break;
1785 default:
1786 abort ();
1787 }
1788
1789 x->bitfield.class = ClassNone;
1790 x->bitfield.instance = InstanceNone;
1791 }
1792
1793 static INLINE int
1794 operand_type_equal (const union i386_operand_type *x,
1795 const union i386_operand_type *y)
1796 {
1797 switch (ARRAY_SIZE(x->array))
1798 {
1799 case 3:
1800 if (x->array[2] != y->array[2])
1801 return 0;
1802 /* Fall through. */
1803 case 2:
1804 if (x->array[1] != y->array[1])
1805 return 0;
1806 /* Fall through. */
1807 case 1:
1808 return x->array[0] == y->array[0];
1810 default:
1811 abort ();
1812 }
1813 }
1814
1815 static INLINE int
1816 cpu_flags_all_zero (const union i386_cpu_flags *x)
1817 {
1818 switch (ARRAY_SIZE(x->array))
1819 {
1820 case 4:
1821 if (x->array[3])
1822 return 0;
1823 /* Fall through. */
1824 case 3:
1825 if (x->array[2])
1826 return 0;
1827 /* Fall through. */
1828 case 2:
1829 if (x->array[1])
1830 return 0;
1831 /* Fall through. */
1832 case 1:
1833 return !x->array[0];
1834 default:
1835 abort ();
1836 }
1837 }
1838
1839 static INLINE int
1840 cpu_flags_equal (const union i386_cpu_flags *x,
1841 const union i386_cpu_flags *y)
1842 {
1843 switch (ARRAY_SIZE(x->array))
1844 {
1845 case 4:
1846 if (x->array[3] != y->array[3])
1847 return 0;
1848 /* Fall through. */
1849 case 3:
1850 if (x->array[2] != y->array[2])
1851 return 0;
1852 /* Fall through. */
1853 case 2:
1854 if (x->array[1] != y->array[1])
1855 return 0;
1856 /* Fall through. */
1857 case 1:
1858 return x->array[0] == y->array[0];
1860 default:
1861 abort ();
1862 }
1863 }
1864
1865 static INLINE int
1866 cpu_flags_check_cpu64 (i386_cpu_flags f)
1867 {
1868 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1869 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1870 }
1871
1872 static INLINE i386_cpu_flags
1873 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1874 {
1875 switch (ARRAY_SIZE (x.array))
1876 {
1877 case 4:
1878 x.array [3] &= y.array [3];
1879 /* Fall through. */
1880 case 3:
1881 x.array [2] &= y.array [2];
1882 /* Fall through. */
1883 case 2:
1884 x.array [1] &= y.array [1];
1885 /* Fall through. */
1886 case 1:
1887 x.array [0] &= y.array [0];
1888 break;
1889 default:
1890 abort ();
1891 }
1892 return x;
1893 }
1894
1895 static INLINE i386_cpu_flags
1896 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1897 {
1898 switch (ARRAY_SIZE (x.array))
1899 {
1900 case 4:
1901 x.array [3] |= y.array [3];
1902 /* Fall through. */
1903 case 3:
1904 x.array [2] |= y.array [2];
1905 /* Fall through. */
1906 case 2:
1907 x.array [1] |= y.array [1];
1908 /* Fall through. */
1909 case 1:
1910 x.array [0] |= y.array [0];
1911 break;
1912 default:
1913 abort ();
1914 }
1915 return x;
1916 }
1917
1918 static INLINE i386_cpu_flags
1919 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1920 {
1921 switch (ARRAY_SIZE (x.array))
1922 {
1923 case 4:
1924 x.array [3] &= ~y.array [3];
1925 /* Fall through. */
1926 case 3:
1927 x.array [2] &= ~y.array [2];
1928 /* Fall through. */
1929 case 2:
1930 x.array [1] &= ~y.array [1];
1931 /* Fall through. */
1932 case 1:
1933 x.array [0] &= ~y.array [0];
1934 break;
1935 default:
1936 abort ();
1937 }
1938 return x;
1939 }
1940
1941 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
1942
1943 #define CPU_FLAGS_ARCH_MATCH 0x1
1944 #define CPU_FLAGS_64BIT_MATCH 0x2
1945
1946 #define CPU_FLAGS_PERFECT_MATCH \
1947 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1948
1949 /* Return CPU flags match bits. */
1950
1951 static int
1952 cpu_flags_match (const insn_template *t)
1953 {
1954 i386_cpu_flags x = t->cpu_flags;
1955 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1956
1957 x.bitfield.cpu64 = 0;
1958 x.bitfield.cpuno64 = 0;
1959
1960 if (cpu_flags_all_zero (&x))
1961 {
1962 /* This instruction is available on all archs. */
1963 match |= CPU_FLAGS_ARCH_MATCH;
1964 }
1965 else
1966 {
1967 /* This instruction is available only on some archs. */
1968 i386_cpu_flags cpu = cpu_arch_flags;
1969
1970 /* AVX512VL is not a standalone feature - match it and then strip it. */
1971 if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1972 return match;
1973 x.bitfield.cpuavx512vl = 0;
1974
1975 cpu = cpu_flags_and (x, cpu);
1976 if (!cpu_flags_all_zero (&cpu))
1977 {
1978 if (x.bitfield.cpuavx)
1979 {
1980 /* We need to check a few extra flags with AVX. */
1981 if (cpu.bitfield.cpuavx
1982 && (!t->opcode_modifier.sse2avx
1983 || (sse2avx && !i.prefix[DATA_PREFIX]))
1984 && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1985 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1986 && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1987 match |= CPU_FLAGS_ARCH_MATCH;
1988 }
1989 else if (x.bitfield.cpuavx512f)
1990 {
1991 /* We need to check a few extra flags with AVX512F. */
1992 if (cpu.bitfield.cpuavx512f
1993 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1994 && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1995 && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1996 match |= CPU_FLAGS_ARCH_MATCH;
1997 }
1998 else
1999 match |= CPU_FLAGS_ARCH_MATCH;
2000 }
2001 }
2002 return match;
2003 }
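/* Example of the match bits, assuming a template whose only CPU flag
   requirement is CpuNo64 (a 32-bit-only instruction): in 64-bit mode
   cpu_flags_check_cpu64 fails, so CPU_FLAGS_64BIT_MATCH stays clear,
   while stripping cpu64/cpuno64 leaves no further requirements and
   CPU_FLAGS_ARCH_MATCH is still set.  Only a template yielding
   CPU_FLAGS_PERFECT_MATCH (both bits) is usable as-is.  */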
2004
2005 static INLINE i386_operand_type
2006 operand_type_and (i386_operand_type x, i386_operand_type y)
2007 {
2008 if (x.bitfield.class != y.bitfield.class)
2009 x.bitfield.class = ClassNone;
2010 if (x.bitfield.instance != y.bitfield.instance)
2011 x.bitfield.instance = InstanceNone;
2012
2013 switch (ARRAY_SIZE (x.array))
2014 {
2015 case 3:
2016 x.array [2] &= y.array [2];
2017 /* Fall through. */
2018 case 2:
2019 x.array [1] &= y.array [1];
2020 /* Fall through. */
2021 case 1:
2022 x.array [0] &= y.array [0];
2023 break;
2024 default:
2025 abort ();
2026 }
2027 return x;
2028 }
2029
2030 static INLINE i386_operand_type
2031 operand_type_and_not (i386_operand_type x, i386_operand_type y)
2032 {
2033 gas_assert (y.bitfield.class == ClassNone);
2034 gas_assert (y.bitfield.instance == InstanceNone);
2035
2036 switch (ARRAY_SIZE (x.array))
2037 {
2038 case 3:
2039 x.array [2] &= ~y.array [2];
2040 /* Fall through. */
2041 case 2:
2042 x.array [1] &= ~y.array [1];
2043 /* Fall through. */
2044 case 1:
2045 x.array [0] &= ~y.array [0];
2046 break;
2047 default:
2048 abort ();
2049 }
2050 return x;
2051 }
2052
2053 static INLINE i386_operand_type
2054 operand_type_or (i386_operand_type x, i386_operand_type y)
2055 {
2056 gas_assert (x.bitfield.class == ClassNone ||
2057 y.bitfield.class == ClassNone ||
2058 x.bitfield.class == y.bitfield.class);
2059 gas_assert (x.bitfield.instance == InstanceNone ||
2060 y.bitfield.instance == InstanceNone ||
2061 x.bitfield.instance == y.bitfield.instance);
2062
2063 switch (ARRAY_SIZE (x.array))
2064 {
2065 case 3:
2066 x.array [2] |= y.array [2];
2067 /* Fall through. */
2068 case 2:
2069 x.array [1] |= y.array [1];
2070 /* Fall through. */
2071 case 1:
2072 x.array [0] |= y.array [0];
2073 break;
2074 default:
2075 abort ();
2076 }
2077 return x;
2078 }
2079
2080 static INLINE i386_operand_type
2081 operand_type_xor (i386_operand_type x, i386_operand_type y)
2082 {
2083 gas_assert (y.bitfield.class == ClassNone);
2084 gas_assert (y.bitfield.instance == InstanceNone);
2085
2086 switch (ARRAY_SIZE (x.array))
2087 {
2088 case 3:
2089 x.array [2] ^= y.array [2];
2090 /* Fall through. */
2091 case 2:
2092 x.array [1] ^= y.array [1];
2093 /* Fall through. */
2094 case 1:
2095 x.array [0] ^= y.array [0];
2096 break;
2097 default:
2098 abort ();
2099 }
2100 return x;
2101 }
2102
2103 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
2104 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
2105 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
2106 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
2107 static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
2108 static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
2109 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
2110 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
2111 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
2112 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
2113 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
2114 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
2115 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
2116 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
2117 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
2118 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
2119 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
2120
2121 enum operand_type
2122 {
2123 reg,
2124 imm,
2125 disp,
2126 anymem
2127 };
2128
2129 static INLINE int
2130 operand_type_check (i386_operand_type t, enum operand_type c)
2131 {
2132 switch (c)
2133 {
2134 case reg:
2135 return t.bitfield.class == Reg;
2136
2137 case imm:
2138 return (t.bitfield.imm8
2139 || t.bitfield.imm8s
2140 || t.bitfield.imm16
2141 || t.bitfield.imm32
2142 || t.bitfield.imm32s
2143 || t.bitfield.imm64);
2144
2145 case disp:
2146 return (t.bitfield.disp8
2147 || t.bitfield.disp16
2148 || t.bitfield.disp32
2149 || t.bitfield.disp32s
2150 || t.bitfield.disp64);
2151
2152 case anymem:
2153 return (t.bitfield.disp8
2154 || t.bitfield.disp16
2155 || t.bitfield.disp32
2156 || t.bitfield.disp32s
2157 || t.bitfield.disp64
2158 || t.bitfield.baseindex);
2159
2160 default:
2161 abort ();
2162 }
2163
2164 return 0;
2165 }
2166
2167 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2168 between operand GIVEN and operand WANTED for instruction template T. */
2169
2170 static INLINE int
2171 match_operand_size (const insn_template *t, unsigned int wanted,
2172 unsigned int given)
2173 {
2174 return !((i.types[given].bitfield.byte
2175 && !t->operand_types[wanted].bitfield.byte)
2176 || (i.types[given].bitfield.word
2177 && !t->operand_types[wanted].bitfield.word)
2178 || (i.types[given].bitfield.dword
2179 && !t->operand_types[wanted].bitfield.dword)
2180 || (i.types[given].bitfield.qword
2181 && !t->operand_types[wanted].bitfield.qword)
2182 || (i.types[given].bitfield.tbyte
2183 && !t->operand_types[wanted].bitfield.tbyte));
2184 }
2185
2186 /* Return 1 if there is no conflict in SIMD register between operand
2187 GIVEN and operand WANTED for instruction template T. */
2188
2189 static INLINE int
2190 match_simd_size (const insn_template *t, unsigned int wanted,
2191 unsigned int given)
2192 {
2193 return !((i.types[given].bitfield.xmmword
2194 && !t->operand_types[wanted].bitfield.xmmword)
2195 || (i.types[given].bitfield.ymmword
2196 && !t->operand_types[wanted].bitfield.ymmword)
2197 || (i.types[given].bitfield.zmmword
2198 && !t->operand_types[wanted].bitfield.zmmword)
2199 || (i.types[given].bitfield.tmmword
2200 && !t->operand_types[wanted].bitfield.tmmword));
2201 }
2202
2203 /* Return 1 if there is no conflict in any size between operand GIVEN
2204 and operand WANTED for instruction template T. */
2205
2206 static INLINE int
2207 match_mem_size (const insn_template *t, unsigned int wanted,
2208 unsigned int given)
2209 {
2210 return (match_operand_size (t, wanted, given)
2211 && !((i.types[given].bitfield.unspecified
2212 && !i.broadcast
2213 && !t->operand_types[wanted].bitfield.unspecified)
2214 || (i.types[given].bitfield.fword
2215 && !t->operand_types[wanted].bitfield.fword)
2216 /* For scalar opcode templates to allow register and memory
2217 operands at the same time, some special casing is needed
2218 here. Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2219 down-conversion vpmov*. */
2220 || ((t->operand_types[wanted].bitfield.class == RegSIMD
2221 && t->operand_types[wanted].bitfield.byte
2222 + t->operand_types[wanted].bitfield.word
2223 + t->operand_types[wanted].bitfield.dword
2224 + t->operand_types[wanted].bitfield.qword
2225 > !!t->opcode_modifier.broadcast)
2226 ? (i.types[given].bitfield.xmmword
2227 || i.types[given].bitfield.ymmword
2228 || i.types[given].bitfield.zmmword)
2229 : !match_simd_size (t, wanted, given))));
2230 }
2231
2232 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2233 operands for instruction template T, and it has MATCH_REVERSE set if there
2234 is no size conflict on any operands for the template with operands reversed
2235 (and the template allows for reversing in the first place). */
2236
2237 #define MATCH_STRAIGHT 1
2238 #define MATCH_REVERSE 2
2239
2240 static INLINE unsigned int
2241 operand_size_match (const insn_template *t)
2242 {
2243 unsigned int j, match = MATCH_STRAIGHT;
2244
2245 /* Don't check non-absolute jump instructions. */
2246 if (t->opcode_modifier.jump
2247 && t->opcode_modifier.jump != JUMP_ABSOLUTE)
2248 return match;
2249
2250 /* Check memory and accumulator operand size. */
2251 for (j = 0; j < i.operands; j++)
2252 {
2253 if (i.types[j].bitfield.class != Reg
2254 && i.types[j].bitfield.class != RegSIMD
2255 && t->opcode_modifier.anysize)
2256 continue;
2257
2258 if (t->operand_types[j].bitfield.class == Reg
2259 && !match_operand_size (t, j, j))
2260 {
2261 match = 0;
2262 break;
2263 }
2264
2265 if (t->operand_types[j].bitfield.class == RegSIMD
2266 && !match_simd_size (t, j, j))
2267 {
2268 match = 0;
2269 break;
2270 }
2271
2272 if (t->operand_types[j].bitfield.instance == Accum
2273 && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2274 {
2275 match = 0;
2276 break;
2277 }
2278
2279 if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2280 {
2281 match = 0;
2282 break;
2283 }
2284 }
2285
2286 if (!t->opcode_modifier.d)
2287 {
2288 mismatch:
2289 if (!match)
2290 i.error = operand_size_mismatch;
2291 return match;
2292 }
2293
2294 /* Check reverse. */
2295 gas_assert (i.operands >= 2 && i.operands <= 3);
2296
2297 for (j = 0; j < i.operands; j++)
2298 {
2299 unsigned int given = i.operands - j - 1;
2300
2301 if (t->operand_types[j].bitfield.class == Reg
2302 && !match_operand_size (t, j, given))
2303 goto mismatch;
2304
2305 if (t->operand_types[j].bitfield.class == RegSIMD
2306 && !match_simd_size (t, j, given))
2307 goto mismatch;
2308
2309 if (t->operand_types[j].bitfield.instance == Accum
2310 && (!match_operand_size (t, j, given)
2311 || !match_simd_size (t, j, given)))
2312 goto mismatch;
2313
2314 if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2315 goto mismatch;
2316 }
2317
2318 return match | MATCH_REVERSE;
2319 }
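/* Example return values: a straight size match on all operands gives
   MATCH_STRAIGHT (1); if the template additionally has the D modifier
   and the operands also fit with the GIVEN indices reversed, the result
   is MATCH_STRAIGHT | MATCH_REVERSE (3), letting the caller pick the
   direction that encodes.  */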
2320
2321 static INLINE int
2322 operand_type_match (i386_operand_type overlap,
2323 i386_operand_type given)
2324 {
2325 i386_operand_type temp = overlap;
2326
2327 temp.bitfield.unspecified = 0;
2328 temp.bitfield.byte = 0;
2329 temp.bitfield.word = 0;
2330 temp.bitfield.dword = 0;
2331 temp.bitfield.fword = 0;
2332 temp.bitfield.qword = 0;
2333 temp.bitfield.tbyte = 0;
2334 temp.bitfield.xmmword = 0;
2335 temp.bitfield.ymmword = 0;
2336 temp.bitfield.zmmword = 0;
2337 temp.bitfield.tmmword = 0;
2338 if (operand_type_all_zero (&temp))
2339 goto mismatch;
2340
2341 if (given.bitfield.baseindex == overlap.bitfield.baseindex)
2342 return 1;
2343
2344 mismatch:
2345 i.error = operand_type_mismatch;
2346 return 0;
2347 }
2348
2349 /* If the given types G0 and G1 are registers, they must be of the same
2350 type unless the expected operand-type register overlap is null.
2351 Some Intel-syntax memory operand size checking also happens here. */
2352
2353 static INLINE int
2354 operand_type_register_match (i386_operand_type g0,
2355 i386_operand_type t0,
2356 i386_operand_type g1,
2357 i386_operand_type t1)
2358 {
2359 if (g0.bitfield.class != Reg
2360 && g0.bitfield.class != RegSIMD
2361 && (!operand_type_check (g0, anymem)
2362 || g0.bitfield.unspecified
2363 || (t0.bitfield.class != Reg
2364 && t0.bitfield.class != RegSIMD)))
2365 return 1;
2366
2367 if (g1.bitfield.class != Reg
2368 && g1.bitfield.class != RegSIMD
2369 && (!operand_type_check (g1, anymem)
2370 || g1.bitfield.unspecified
2371 || (t1.bitfield.class != Reg
2372 && t1.bitfield.class != RegSIMD)))
2373 return 1;
2374
2375 if (g0.bitfield.byte == g1.bitfield.byte
2376 && g0.bitfield.word == g1.bitfield.word
2377 && g0.bitfield.dword == g1.bitfield.dword
2378 && g0.bitfield.qword == g1.bitfield.qword
2379 && g0.bitfield.xmmword == g1.bitfield.xmmword
2380 && g0.bitfield.ymmword == g1.bitfield.ymmword
2381 && g0.bitfield.zmmword == g1.bitfield.zmmword)
2382 return 1;
2383
2384 if (!(t0.bitfield.byte & t1.bitfield.byte)
2385 && !(t0.bitfield.word & t1.bitfield.word)
2386 && !(t0.bitfield.dword & t1.bitfield.dword)
2387 && !(t0.bitfield.qword & t1.bitfield.qword)
2388 && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2389 && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2390 && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2391 return 1;
2392
2393 i.error = register_type_mismatch;
2394
2395 return 0;
2396 }
2397
2398 static INLINE unsigned int
2399 register_number (const reg_entry *r)
2400 {
2401 unsigned int nr = r->reg_num;
2402
2403 if (r->reg_flags & RegRex)
2404 nr += 8;
2405
2406 if (r->reg_flags & RegVRex)
2407 nr += 16;
2408
2409 return nr;
2410 }
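/* Example, assuming the usual register table layout: %r9 is entry 1
   with RegRex set, so register_number () yields 1 + 8 = 9; %xmm20 is
   entry 4 with RegVRex set, yielding 4 + 16 = 20.  */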
2411
2412 static INLINE unsigned int
2413 mode_from_disp_size (i386_operand_type t)
2414 {
2415 if (t.bitfield.disp8)
2416 return 1;
2417 else if (t.bitfield.disp16
2418 || t.bitfield.disp32
2419 || t.bitfield.disp32s)
2420 return 2;
2421 else
2422 return 0;
2423 }
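/* The values returned above correspond directly to the ModRM.mod field
   for memory operands: 1 selects the disp8 form (mod == 01b) and 2 the
   disp16/disp32 form (mod == 10b); 0 means no displacement byte.  */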
2424
2425 static INLINE int
2426 fits_in_signed_byte (addressT num)
2427 {
2428 return num + 0x80 <= 0xff;
2429 }
2430
2431 static INLINE int
2432 fits_in_unsigned_byte (addressT num)
2433 {
2434 return num <= 0xff;
2435 }
2436
2437 static INLINE int
2438 fits_in_unsigned_word (addressT num)
2439 {
2440 return num <= 0xffff;
2441 }
2442
2443 static INLINE int
2444 fits_in_signed_word (addressT num)
2445 {
2446 return num + 0x8000 <= 0xffff;
2447 }
2448
2449 static INLINE int
2450 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2451 {
2452 #ifndef BFD64
2453 return 1;
2454 #else
2455 return num + 0x80000000 <= 0xffffffff;
2456 #endif
2457 } /* fits_in_signed_long() */
2458
2459 static INLINE int
2460 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2461 {
2462 #ifndef BFD64
2463 return 1;
2464 #else
2465 return num <= 0xffffffff;
2466 #endif
2467 } /* fits_in_unsigned_long() */
2468
2469 static INLINE int
2470 fits_in_disp8 (offsetT num)
2471 {
2472 int shift = i.memshift;
2473 unsigned int mask;
2474
2475 if (shift == -1)
2476 abort ();
2477
2478 mask = (1 << shift) - 1;
2479
2480 /* Return 0 if NUM isn't properly aligned. */
2481 if ((num & mask))
2482 return 0;
2483
2484 /* Check if NUM will fit in 8bit after shift. */
2485 return fits_in_signed_byte (num >> shift);
2486 }
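/* Worked EVEX disp8*N example: i.memshift is 6 for a full 64-byte (zmm)
   memory operand, so a displacement of 256 is aligned (256 & 63 == 0)
   and 256 >> 6 == 4 fits in a signed byte -- the instruction can use a
   one-byte displacement of 4 instead of a four-byte displacement of
   256.  A displacement of 260 fails the alignment test and must use
   the disp32 form.  */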
2487
2488 static INLINE int
2489 fits_in_imm4 (offsetT num)
2490 {
2491 return (num & 0xf) == num;
2492 }
2493
2494 static i386_operand_type
2495 smallest_imm_type (offsetT num)
2496 {
2497 i386_operand_type t;
2498
2499 operand_type_set (&t, 0);
2500 t.bitfield.imm64 = 1;
2501
2502 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2503 {
2504 /* This code is disabled on the 486 because all the Imm1 forms
2505 in the opcode table are slower on the i486. They're the
2506 versions with the implicitly specified single-position
2507 displacement, which has another syntax if you really want to
2508 use that form. */
2509 t.bitfield.imm1 = 1;
2510 t.bitfield.imm8 = 1;
2511 t.bitfield.imm8s = 1;
2512 t.bitfield.imm16 = 1;
2513 t.bitfield.imm32 = 1;
2514 t.bitfield.imm32s = 1;
2515 }
2516 else if (fits_in_signed_byte (num))
2517 {
2518 t.bitfield.imm8 = 1;
2519 t.bitfield.imm8s = 1;
2520 t.bitfield.imm16 = 1;
2521 t.bitfield.imm32 = 1;
2522 t.bitfield.imm32s = 1;
2523 }
2524 else if (fits_in_unsigned_byte (num))
2525 {
2526 t.bitfield.imm8 = 1;
2527 t.bitfield.imm16 = 1;
2528 t.bitfield.imm32 = 1;
2529 t.bitfield.imm32s = 1;
2530 }
2531 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2532 {
2533 t.bitfield.imm16 = 1;
2534 t.bitfield.imm32 = 1;
2535 t.bitfield.imm32s = 1;
2536 }
2537 else if (fits_in_signed_long (num))
2538 {
2539 t.bitfield.imm32 = 1;
2540 t.bitfield.imm32s = 1;
2541 }
2542 else if (fits_in_unsigned_long (num))
2543 t.bitfield.imm32 = 1;
2544
2545 return t;
2546 }
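/* Example: for num == 0x90 only fits_in_unsigned_byte () holds among
   the byte checks, so the result allows imm8/imm16/imm32/imm32s but not
   imm8s; for num == 1 (when not tuning for the i486) imm1 is allowed as
   well, enabling the shorter shift-by-one encodings.  */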
2547
2548 static offsetT
2549 offset_in_range (offsetT val, int size)
2550 {
2551 addressT mask;
2552
2553 switch (size)
2554 {
2555 case 1: mask = ((addressT) 1 << 8) - 1; break;
2556 case 2: mask = ((addressT) 1 << 16) - 1; break;
2557 case 4: mask = ((addressT) 2 << 31) - 1; break;
2558 #ifdef BFD64
2559 case 8: mask = ((addressT) 2 << 63) - 1; break;
2560 #endif
2561 default: abort ();
2562 }
2563
2564 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2565 {
2566 char buf1[40], buf2[40];
2567
2568 sprint_value (buf1, val);
2569 sprint_value (buf2, val & mask);
2570 as_warn (_("%s shortened to %s"), buf1, buf2);
2571 }
2572 return val & mask;
2573 }
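/* Example, assuming a 64-bit (BFD64) build: offset_in_range
   (0x123456789, 4) masks with 0xffffffff, and since the discarded bits
   are neither all zero nor all one it warns that the value was
   shortened, returning 0x23456789.  Negative values such as -1 pass
   unflagged because the discarded bits are all one.  */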
2574
2575 enum PREFIX_GROUP
2576 {
2577 PREFIX_EXIST = 0,
2578 PREFIX_LOCK,
2579 PREFIX_REP,
2580 PREFIX_DS,
2581 PREFIX_OTHER
2582 };
2583
2584 /* Returns
2585 a. PREFIX_EXIST if attempting to add a prefix where one from the
2586 same class already exists.
2587 b. PREFIX_LOCK if lock prefix is added.
2588 c. PREFIX_REP if rep/repne prefix is added.
2589 d. PREFIX_DS if ds prefix is added.
2590 e. PREFIX_OTHER if other prefix is added.
2591 */
2592
2593 static enum PREFIX_GROUP
2594 add_prefix (unsigned int prefix)
2595 {
2596 enum PREFIX_GROUP ret = PREFIX_OTHER;
2597 unsigned int q;
2598
2599 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2600 && flag_code == CODE_64BIT)
2601 {
2602 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2603 || (i.prefix[REX_PREFIX] & prefix & REX_R)
2604 || (i.prefix[REX_PREFIX] & prefix & REX_X)
2605 || (i.prefix[REX_PREFIX] & prefix & REX_B))
2606 ret = PREFIX_EXIST;
2607 q = REX_PREFIX;
2608 }
2609 else
2610 {
2611 switch (prefix)
2612 {
2613 default:
2614 abort ();
2615
2616 case DS_PREFIX_OPCODE:
2617 ret = PREFIX_DS;
2618 /* Fall through. */
2619 case CS_PREFIX_OPCODE:
2620 case ES_PREFIX_OPCODE:
2621 case FS_PREFIX_OPCODE:
2622 case GS_PREFIX_OPCODE:
2623 case SS_PREFIX_OPCODE:
2624 q = SEG_PREFIX;
2625 break;
2626
2627 case REPNE_PREFIX_OPCODE:
2628 case REPE_PREFIX_OPCODE:
2629 q = REP_PREFIX;
2630 ret = PREFIX_REP;
2631 break;
2632
2633 case LOCK_PREFIX_OPCODE:
2634 q = LOCK_PREFIX;
2635 ret = PREFIX_LOCK;
2636 break;
2637
2638 case FWAIT_OPCODE:
2639 q = WAIT_PREFIX;
2640 break;
2641
2642 case ADDR_PREFIX_OPCODE:
2643 q = ADDR_PREFIX;
2644 break;
2645
2646 case DATA_PREFIX_OPCODE:
2647 q = DATA_PREFIX;
2648 break;
2649 }
2650 if (i.prefix[q] != 0)
2651 ret = PREFIX_EXIST;
2652 }
2653
2654 if (ret)
2655 {
2656 if (!i.prefix[q])
2657 ++i.prefixes;
2658 i.prefix[q] |= prefix;
2659 }
2660 else
2661 as_bad (_("same type of prefix used twice"));
2662
2663 return ret;
2664 }
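/* Usage sketch: add_prefix (LOCK_PREFIX_OPCODE) records 0xf0 in
   i.prefix[LOCK_PREFIX], bumps i.prefixes and returns PREFIX_LOCK;
   a second identical call finds the slot occupied, diagnoses
   "same type of prefix used twice" and returns PREFIX_EXIST.  */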
2665
2666 static void
2667 update_code_flag (int value, int check)
2668 {
2669 PRINTF_LIKE ((*as_error));
2670
2671 flag_code = (enum flag_code) value;
2672 if (flag_code == CODE_64BIT)
2673 {
2674 cpu_arch_flags.bitfield.cpu64 = 1;
2675 cpu_arch_flags.bitfield.cpuno64 = 0;
2676 }
2677 else
2678 {
2679 cpu_arch_flags.bitfield.cpu64 = 0;
2680 cpu_arch_flags.bitfield.cpuno64 = 1;
2681 }
2682 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm)
2683 {
2684 if (check)
2685 as_error = as_fatal;
2686 else
2687 as_error = as_bad;
2688 (*as_error) (_("64bit mode not supported on `%s'."),
2689 cpu_arch_name ? cpu_arch_name : default_arch);
2690 }
2691 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2692 {
2693 if (check)
2694 as_error = as_fatal;
2695 else
2696 as_error = as_bad;
2697 (*as_error) (_("32bit mode not supported on `%s'."),
2698 cpu_arch_name ? cpu_arch_name : default_arch);
2699 }
2700 stackop_size = '\0';
2701 }
2702
2703 static void
2704 set_code_flag (int value)
2705 {
2706 update_code_flag (value, 0);
2707 }
2708
2709 static void
2710 set_16bit_gcc_code_flag (int new_code_flag)
2711 {
2712 flag_code = (enum flag_code) new_code_flag;
2713 if (flag_code != CODE_16BIT)
2714 abort ();
2715 cpu_arch_flags.bitfield.cpu64 = 0;
2716 cpu_arch_flags.bitfield.cpuno64 = 1;
2717 stackop_size = LONG_MNEM_SUFFIX;
2718 }
2719
2720 static void
2721 set_intel_syntax (int syntax_flag)
2722 {
2723 /* Find out if register prefixing is specified. */
2724 int ask_naked_reg = 0;
2725
2726 SKIP_WHITESPACE ();
2727 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2728 {
2729 char *string;
2730 int e = get_symbol_name (&string);
2731
2732 if (strcmp (string, "prefix") == 0)
2733 ask_naked_reg = 1;
2734 else if (strcmp (string, "noprefix") == 0)
2735 ask_naked_reg = -1;
2736 else
2737 as_bad (_("bad argument to syntax directive."));
2738 (void) restore_line_pointer (e);
2739 }
2740 demand_empty_rest_of_line ();
2741
2742 intel_syntax = syntax_flag;
2743
2744 if (ask_naked_reg == 0)
2745 allow_naked_reg = (intel_syntax
2746 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2747 else
2748 allow_naked_reg = (ask_naked_reg < 0);
2749
2750 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2751
2752 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2753 identifier_chars['$'] = intel_syntax ? '$' : 0;
2754 register_prefix = allow_naked_reg ? "" : "%";
2755 }
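/* E.g. ".intel_syntax noprefix" lands here with syntax_flag == 1 and
   the argument "noprefix", so ask_naked_reg becomes -1 and registers
   may then be written without the '%' prefix.  */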
2756
2757 static void
2758 set_intel_mnemonic (int mnemonic_flag)
2759 {
2760 intel_mnemonic = mnemonic_flag;
2761 }
2762
2763 static void
2764 set_allow_index_reg (int flag)
2765 {
2766 allow_index_reg = flag;
2767 }
2768
2769 static void
2770 set_check (int what)
2771 {
2772 enum check_kind *kind;
2773 const char *str;
2774
2775 if (what)
2776 {
2777 kind = &operand_check;
2778 str = "operand";
2779 }
2780 else
2781 {
2782 kind = &sse_check;
2783 str = "sse";
2784 }
2785
2786 SKIP_WHITESPACE ();
2787
2788 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2789 {
2790 char *string;
2791 int e = get_symbol_name (&string);
2792
2793 if (strcmp (string, "none") == 0)
2794 *kind = check_none;
2795 else if (strcmp (string, "warning") == 0)
2796 *kind = check_warning;
2797 else if (strcmp (string, "error") == 0)
2798 *kind = check_error;
2799 else
2800 as_bad (_("bad argument to %s_check directive."), str);
2801 (void) restore_line_pointer (e);
2802 }
2803 else
2804 as_bad (_("missing argument for %s_check directive"), str);
2805
2806 demand_empty_rest_of_line ();
2807 }
2808
2809 static void
2810 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2811 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2812 {
2813 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2814 static const char *arch;
2815
2816 /* Intel MCU, L1OM and K1OM are only supported on ELF. */
2817 if (!IS_ELF)
2818 return;
2819
2820 if (!arch)
2821 {
2822 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2823 use default_arch. */
2824 arch = cpu_arch_name;
2825 if (!arch)
2826 arch = default_arch;
2827 }
2828
2829 /* If we are targeting Intel MCU, we must enable it. */
2830 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2831 || new_flag.bitfield.cpuiamcu)
2832 return;
2833
2834 /* If we are targeting Intel L1OM, we must enable it. */
2835 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2836 || new_flag.bitfield.cpul1om)
2837 return;
2838
2839 /* If we are targeting Intel K1OM, we must enable it. */
2840 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2841 || new_flag.bitfield.cpuk1om)
2842 return;
2843
2844 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2845 #endif
2846 }
2847
2848 static void
2849 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2850 {
2851 SKIP_WHITESPACE ();
2852
2853 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2854 {
2855 char *string;
2856 int e = get_symbol_name (&string);
2857 unsigned int j;
2858 i386_cpu_flags flags;
2859
2860 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2861 {
2862 if (strcmp (string, cpu_arch[j].name) == 0)
2863 {
2864 check_cpu_arch_compatible (string, cpu_arch[j].flags);
2865
2866 if (*string != '.')
2867 {
2868 cpu_arch_name = cpu_arch[j].name;
2869 cpu_sub_arch_name = NULL;
2870 cpu_arch_flags = cpu_arch[j].flags;
2871 if (flag_code == CODE_64BIT)
2872 {
2873 cpu_arch_flags.bitfield.cpu64 = 1;
2874 cpu_arch_flags.bitfield.cpuno64 = 0;
2875 }
2876 else
2877 {
2878 cpu_arch_flags.bitfield.cpu64 = 0;
2879 cpu_arch_flags.bitfield.cpuno64 = 1;
2880 }
2881 cpu_arch_isa = cpu_arch[j].type;
2882 cpu_arch_isa_flags = cpu_arch[j].flags;
2883 if (!cpu_arch_tune_set)
2884 {
2885 cpu_arch_tune = cpu_arch_isa;
2886 cpu_arch_tune_flags = cpu_arch_isa_flags;
2887 }
2888 break;
2889 }
2890
2891 flags = cpu_flags_or (cpu_arch_flags,
2892 cpu_arch[j].flags);
2893
2894 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2895 {
2896 if (cpu_sub_arch_name)
2897 {
2898 char *name = cpu_sub_arch_name;
2899 cpu_sub_arch_name = concat (name,
2900 cpu_arch[j].name,
2901 (const char *) NULL);
2902 free (name);
2903 }
2904 else
2905 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2906 cpu_arch_flags = flags;
2907 cpu_arch_isa_flags = flags;
2908 }
2909 else
2910 cpu_arch_isa_flags
2911 = cpu_flags_or (cpu_arch_isa_flags,
2912 cpu_arch[j].flags);
2913 (void) restore_line_pointer (e);
2914 demand_empty_rest_of_line ();
2915 return;
2916 }
2917 }
2918
2919 if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2920 {
2921 /* Disable an ISA extension. */
2922 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2923 if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2924 {
2925 flags = cpu_flags_and_not (cpu_arch_flags,
2926 cpu_noarch[j].flags);
2927 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2928 {
2929 if (cpu_sub_arch_name)
2930 {
2931 char *name = cpu_sub_arch_name;
2932 cpu_sub_arch_name = concat (name, string,
2933 (const char *) NULL);
2934 free (name);
2935 }
2936 else
2937 cpu_sub_arch_name = xstrdup (string);
2938 cpu_arch_flags = flags;
2939 cpu_arch_isa_flags = flags;
2940 }
2941 (void) restore_line_pointer (e);
2942 demand_empty_rest_of_line ();
2943 return;
2944 }
2945
2946 j = ARRAY_SIZE (cpu_arch);
2947 }
2948
2949 if (j >= ARRAY_SIZE (cpu_arch))
2950 as_bad (_("no such architecture: `%s'"), string);
2951
2952 *input_line_pointer = e;
2953 }
2954 else
2955 as_bad (_("missing cpu architecture"));
2956
2957 no_cond_jump_promotion = 0;
2958 if (*input_line_pointer == ','
2959 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2960 {
2961 char *string;
2962 char e;
2963
2964 ++input_line_pointer;
2965 e = get_symbol_name (&string);
2966
2967 if (strcmp (string, "nojumps") == 0)
2968 no_cond_jump_promotion = 1;
2969 else if (strcmp (string, "jumps") == 0)
2970 ;
2971 else
2972 as_bad (_("no such architecture modifier: `%s'"), string);
2973
2974 (void) restore_line_pointer (e);
2975 }
2976
2977 demand_empty_rest_of_line ();
2978 }
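/* Examples: ".arch i686" switches the base architecture, while
   ".arch .avx2" (leading dot) merely enables the AVX2 extension on top
   of the current flags, and ".arch .noavx2" disables it via the
   cpu_noarch table.  */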
2979
2980 enum bfd_architecture
2981 i386_arch (void)
2982 {
2983 if (cpu_arch_isa == PROCESSOR_L1OM)
2984 {
2985 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2986 || flag_code != CODE_64BIT)
2987 as_fatal (_("Intel L1OM is 64bit ELF only"));
2988 return bfd_arch_l1om;
2989 }
2990 else if (cpu_arch_isa == PROCESSOR_K1OM)
2991 {
2992 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2993 || flag_code != CODE_64BIT)
2994 as_fatal (_("Intel K1OM is 64bit ELF only"));
2995 return bfd_arch_k1om;
2996 }
2997 else if (cpu_arch_isa == PROCESSOR_IAMCU)
2998 {
2999 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
3000 || flag_code == CODE_64BIT)
3001 as_fatal (_("Intel MCU is 32bit ELF only"));
3002 return bfd_arch_iamcu;
3003 }
3004 else
3005 return bfd_arch_i386;
3006 }
3007
3008 unsigned long
3009 i386_mach (void)
3010 {
3011 if (!strncmp (default_arch, "x86_64", 6))
3012 {
3013 if (cpu_arch_isa == PROCESSOR_L1OM)
3014 {
3015 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
3016 || default_arch[6] != '\0')
3017 as_fatal (_("Intel L1OM is 64bit ELF only"));
3018 return bfd_mach_l1om;
3019 }
3020 else if (cpu_arch_isa == PROCESSOR_K1OM)
3021 {
3022 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
3023 || default_arch[6] != '\0')
3024 as_fatal (_("Intel K1OM is 64bit ELF only"));
3025 return bfd_mach_k1om;
3026 }
3027 else if (default_arch[6] == '\0')
3028 return bfd_mach_x86_64;
3029 else
3030 return bfd_mach_x64_32;
3031 }
3032 else if (!strcmp (default_arch, "i386")
3033 || !strcmp (default_arch, "iamcu"))
3034 {
3035 if (cpu_arch_isa == PROCESSOR_IAMCU)
3036 {
3037 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
3038 as_fatal (_("Intel MCU is 32bit ELF only"));
3039 return bfd_mach_i386_iamcu;
3040 }
3041 else
3042 return bfd_mach_i386_i386;
3043 }
3044 else
3045 as_fatal (_("unknown architecture"));
3046 }
3047 \f
3048 void
3049 md_begin (void)
3050 {
3051 /* Support pseudo prefixes like {disp32}. */
3052 lex_type ['{'] = LEX_BEGIN_NAME;
3053
3054 /* Initialize op_hash hash table. */
3055 op_hash = str_htab_create ();
3056
3057 {
3058 const insn_template *optab;
3059 templates *core_optab;
3060
3061 /* Setup for loop. */
3062 optab = i386_optab;
3063 core_optab = XNEW (templates);
3064 core_optab->start = optab;
3065
3066 while (1)
3067 {
3068 ++optab;
3069 if (optab->name == NULL
3070 || strcmp (optab->name, (optab - 1)->name) != 0)
3071 {
3072 /* different name --> ship out current template list;
3073 add to hash table; & begin anew. */
3074 core_optab->end = optab;
3075 if (str_hash_insert (op_hash, (optab - 1)->name, core_optab, 0))
3076 as_fatal (_("duplicate %s"), (optab - 1)->name);
3077
3078 if (optab->name == NULL)
3079 break;
3080 core_optab = XNEW (templates);
3081 core_optab->start = optab;
3082 }
3083 }
3084 }
3085
3086 /* Initialize reg_hash hash table. */
3087 reg_hash = str_htab_create ();
3088 {
3089 const reg_entry *regtab;
3090 unsigned int regtab_size = i386_regtab_size;
3091
3092 for (regtab = i386_regtab; regtab_size--; regtab++)
3093 if (str_hash_insert (reg_hash, regtab->reg_name, regtab, 0) != NULL)
3094 as_fatal (_("duplicate %s"), regtab->reg_name);
3095 }
3096
3097 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
3098 {
3099 int c;
3100 char *p;
3101
3102 for (c = 0; c < 256; c++)
3103 {
3104 if (ISDIGIT (c))
3105 {
3106 digit_chars[c] = c;
3107 mnemonic_chars[c] = c;
3108 register_chars[c] = c;
3109 operand_chars[c] = c;
3110 }
3111 else if (ISLOWER (c))
3112 {
3113 mnemonic_chars[c] = c;
3114 register_chars[c] = c;
3115 operand_chars[c] = c;
3116 }
3117 else if (ISUPPER (c))
3118 {
3119 mnemonic_chars[c] = TOLOWER (c);
3120 register_chars[c] = mnemonic_chars[c];
3121 operand_chars[c] = c;
3122 }
3123 else if (c == '{' || c == '}')
3124 {
3125 mnemonic_chars[c] = c;
3126 operand_chars[c] = c;
3127 }
3128 #ifdef SVR4_COMMENT_CHARS
3129 else if (c == '\\' && strchr (i386_comment_chars, '/'))
3130 operand_chars[c] = c;
3131 #endif
3132
3133 if (ISALPHA (c) || ISDIGIT (c))
3134 identifier_chars[c] = c;
3135 else if (c >= 128)
3136 {
3137 identifier_chars[c] = c;
3138 operand_chars[c] = c;
3139 }
3140 }
3141
3142 #ifdef LEX_AT
3143 identifier_chars['@'] = '@';
3144 #endif
3145 #ifdef LEX_QM
3146 identifier_chars['?'] = '?';
3147 operand_chars['?'] = '?';
3148 #endif
3149 digit_chars['-'] = '-';
3150 mnemonic_chars['_'] = '_';
3151 mnemonic_chars['-'] = '-';
3152 mnemonic_chars['.'] = '.';
3153 identifier_chars['_'] = '_';
3154 identifier_chars['.'] = '.';
3155
3156 for (p = operand_special_chars; *p != '\0'; p++)
3157 operand_chars[(unsigned char) *p] = *p;
3158 }
3159
3160 if (flag_code == CODE_64BIT)
3161 {
3162 #if defined (OBJ_COFF) && defined (TE_PE)
3163 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3164 ? 32 : 16);
3165 #else
3166 x86_dwarf2_return_column = 16;
3167 #endif
3168 x86_cie_data_alignment = -8;
3169 }
3170 else
3171 {
3172 x86_dwarf2_return_column = 8;
3173 x86_cie_data_alignment = -4;
3174 }
3175
3176 /* NB: a FUSED_JCC_PADDING frag must have sufficient room so that it
3177 can be turned into a BRANCH_PREFIX frag. */
3178 if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3179 abort ();
3180 }
3181
3182 void
3183 i386_print_statistics (FILE *file)
3184 {
3185 htab_print_statistics (file, "i386 opcode", op_hash);
3186 htab_print_statistics (file, "i386 register", reg_hash);
3187 }
3188 \f
3189 #ifdef DEBUG386
3190
3191 /* Debugging routines for md_assemble. */
3192 static void pte (insn_template *);
3193 static void pt (i386_operand_type);
3194 static void pe (expressionS *);
3195 static void ps (symbolS *);
3196
3197 static void
3198 pi (const char *line, i386_insn *x)
3199 {
3200 unsigned int j;
3201
3202 fprintf (stdout, "%s: template ", line);
3203 pte (&x->tm);
3204 fprintf (stdout, " address: base %s index %s scale %x\n",
3205 x->base_reg ? x->base_reg->reg_name : "none",
3206 x->index_reg ? x->index_reg->reg_name : "none",
3207 x->log2_scale_factor);
3208 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
3209 x->rm.mode, x->rm.reg, x->rm.regmem);
3210 fprintf (stdout, " sib: base %x index %x scale %x\n",
3211 x->sib.base, x->sib.index, x->sib.scale);
3212 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
3213 (x->rex & REX_W) != 0,
3214 (x->rex & REX_R) != 0,
3215 (x->rex & REX_X) != 0,
3216 (x->rex & REX_B) != 0);
3217 for (j = 0; j < x->operands; j++)
3218 {
3219 fprintf (stdout, " #%d: ", j + 1);
3220 pt (x->types[j]);
3221 fprintf (stdout, "\n");
3222 if (x->types[j].bitfield.class == Reg
3223 || x->types[j].bitfield.class == RegMMX
3224 || x->types[j].bitfield.class == RegSIMD
3225 || x->types[j].bitfield.class == RegMask
3226 || x->types[j].bitfield.class == SReg
3227 || x->types[j].bitfield.class == RegCR
3228 || x->types[j].bitfield.class == RegDR
3229 || x->types[j].bitfield.class == RegTR
3230 || x->types[j].bitfield.class == RegBND)
3231 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3232 if (operand_type_check (x->types[j], imm))
3233 pe (x->op[j].imms);
3234 if (operand_type_check (x->types[j], disp))
3235 pe (x->op[j].disps);
3236 }
3237 }
3238
3239 static void
3240 pte (insn_template *t)
3241 {
3242 unsigned int j;
3243 fprintf (stdout, " %d operands ", t->operands);
3244 fprintf (stdout, "opcode %x ", t->base_opcode);
3245 if (t->extension_opcode != None)
3246 fprintf (stdout, "ext %x ", t->extension_opcode);
3247 if (t->opcode_modifier.d)
3248 fprintf (stdout, "D");
3249 if (t->opcode_modifier.w)
3250 fprintf (stdout, "W");
3251 fprintf (stdout, "\n");
3252 for (j = 0; j < t->operands; j++)
3253 {
3254 fprintf (stdout, " #%d type ", j + 1);
3255 pt (t->operand_types[j]);
3256 fprintf (stdout, "\n");
3257 }
3258 }
3259
3260 static void
3261 pe (expressionS *e)
3262 {
3263 fprintf (stdout, " operation %d\n", e->X_op);
3264 fprintf (stdout, " add_number %ld (%lx)\n",
3265 (long) e->X_add_number, (long) e->X_add_number);
3266 if (e->X_add_symbol)
3267 {
3268 fprintf (stdout, " add_symbol ");
3269 ps (e->X_add_symbol);
3270 fprintf (stdout, "\n");
3271 }
3272 if (e->X_op_symbol)
3273 {
3274 fprintf (stdout, " op_symbol ");
3275 ps (e->X_op_symbol);
3276 fprintf (stdout, "\n");
3277 }
3278 }
3279
3280 static void
3281 ps (symbolS *s)
3282 {
3283 fprintf (stdout, "%s type %s%s",
3284 S_GET_NAME (s),
3285 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3286 segment_name (S_GET_SEGMENT (s)));
3287 }
3288
3289 static struct type_name
3290 {
3291 i386_operand_type mask;
3292 const char *name;
3293 }
3294 const type_names[] =
3295 {
3296 { OPERAND_TYPE_REG8, "r8" },
3297 { OPERAND_TYPE_REG16, "r16" },
3298 { OPERAND_TYPE_REG32, "r32" },
3299 { OPERAND_TYPE_REG64, "r64" },
3300 { OPERAND_TYPE_ACC8, "acc8" },
3301 { OPERAND_TYPE_ACC16, "acc16" },
3302 { OPERAND_TYPE_ACC32, "acc32" },
3303 { OPERAND_TYPE_ACC64, "acc64" },
3304 { OPERAND_TYPE_IMM8, "i8" },
3305 { OPERAND_TYPE_IMM8S, "i8s" },
3306 { OPERAND_TYPE_IMM16, "i16" },
3307 { OPERAND_TYPE_IMM32, "i32" },
3308 { OPERAND_TYPE_IMM32S, "i32s" },
3309 { OPERAND_TYPE_IMM64, "i64" },
3310 { OPERAND_TYPE_IMM1, "i1" },
3311 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3312 { OPERAND_TYPE_DISP8, "d8" },
3313 { OPERAND_TYPE_DISP16, "d16" },
3314 { OPERAND_TYPE_DISP32, "d32" },
3315 { OPERAND_TYPE_DISP32S, "d32s" },
3316 { OPERAND_TYPE_DISP64, "d64" },
3317 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3318 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3319 { OPERAND_TYPE_CONTROL, "control reg" },
3320 { OPERAND_TYPE_TEST, "test reg" },
3321 { OPERAND_TYPE_DEBUG, "debug reg" },
3322 { OPERAND_TYPE_FLOATREG, "FReg" },
3323 { OPERAND_TYPE_FLOATACC, "FAcc" },
3324 { OPERAND_TYPE_SREG, "SReg" },
3325 { OPERAND_TYPE_REGMMX, "rMMX" },
3326 { OPERAND_TYPE_REGXMM, "rXMM" },
3327 { OPERAND_TYPE_REGYMM, "rYMM" },
3328 { OPERAND_TYPE_REGZMM, "rZMM" },
3329 { OPERAND_TYPE_REGTMM, "rTMM" },
3330 { OPERAND_TYPE_REGMASK, "Mask reg" },
3331 };
3332
3333 static void
3334 pt (i386_operand_type t)
3335 {
3336 unsigned int j;
3337 i386_operand_type a;
3338
3339 for (j = 0; j < ARRAY_SIZE (type_names); j++)
3340 {
3341 a = operand_type_and (t, type_names[j].mask);
3342 if (operand_type_equal (&a, &type_names[j].mask))
3343 fprintf (stdout, "%s, ", type_names[j].name);
3344 }
3345 fflush (stdout);
3346 }
3347
3348 #endif /* DEBUG386 */
3349 \f
3350 static bfd_reloc_code_real_type
3351 reloc (unsigned int size,
3352 int pcrel,
3353 int sign,
3354 bfd_reloc_code_real_type other)
3355 {
3356 if (other != NO_RELOC)
3357 {
3358 reloc_howto_type *rel;
3359
3360 if (size == 8)
3361 switch (other)
3362 {
3363 case BFD_RELOC_X86_64_GOT32:
3364 return BFD_RELOC_X86_64_GOT64;
3365 break;
3366 case BFD_RELOC_X86_64_GOTPLT64:
3367 return BFD_RELOC_X86_64_GOTPLT64;
3368 break;
3369 case BFD_RELOC_X86_64_PLTOFF64:
3370 return BFD_RELOC_X86_64_PLTOFF64;
3371 break;
3372 case BFD_RELOC_X86_64_GOTPC32:
3373 other = BFD_RELOC_X86_64_GOTPC64;
3374 break;
3375 case BFD_RELOC_X86_64_GOTPCREL:
3376 other = BFD_RELOC_X86_64_GOTPCREL64;
3377 break;
3378 case BFD_RELOC_X86_64_TPOFF32:
3379 other = BFD_RELOC_X86_64_TPOFF64;
3380 break;
3381 case BFD_RELOC_X86_64_DTPOFF32:
3382 other = BFD_RELOC_X86_64_DTPOFF64;
3383 break;
3384 default:
3385 break;
3386 }
3387
3388 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3389 if (other == BFD_RELOC_SIZE32)
3390 {
3391 if (size == 8)
3392 other = BFD_RELOC_SIZE64;
3393 if (pcrel)
3394 {
3395 as_bad (_("there are no pc-relative size relocations"));
3396 return NO_RELOC;
3397 }
3398 }
3399 #endif
3400
3401 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
3402 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3403 sign = -1;
3404
3405 rel = bfd_reloc_type_lookup (stdoutput, other);
3406 if (!rel)
3407 as_bad (_("unknown relocation (%u)"), other);
3408 else if (size != bfd_get_reloc_size (rel))
3409 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3410 bfd_get_reloc_size (rel),
3411 size);
3412 else if (pcrel && !rel->pc_relative)
3413 as_bad (_("non-pc-relative relocation for pc-relative field"));
3414 else if ((rel->complain_on_overflow == complain_overflow_signed
3415 && !sign)
3416 || (rel->complain_on_overflow == complain_overflow_unsigned
3417 && sign > 0))
3418 as_bad (_("relocated field and relocation type differ in signedness"));
3419 else
3420 return other;
3421 return NO_RELOC;
3422 }
3423
3424 if (pcrel)
3425 {
3426 if (!sign)
3427 as_bad (_("there are no unsigned pc-relative relocations"));
3428 switch (size)
3429 {
3430 case 1: return BFD_RELOC_8_PCREL;
3431 case 2: return BFD_RELOC_16_PCREL;
3432 case 4: return BFD_RELOC_32_PCREL;
3433 case 8: return BFD_RELOC_64_PCREL;
3434 }
3435 as_bad (_("cannot do %u byte pc-relative relocation"), size);
3436 }
3437 else
3438 {
3439 if (sign > 0)
3440 switch (size)
3441 {
3442 case 4: return BFD_RELOC_X86_64_32S;
3443 }
3444 else
3445 switch (size)
3446 {
3447 case 1: return BFD_RELOC_8;
3448 case 2: return BFD_RELOC_16;
3449 case 4: return BFD_RELOC_32;
3450 case 8: return BFD_RELOC_64;
3451 }
3452 as_bad (_("cannot do %s %u byte relocation"),
3453 sign > 0 ? "signed" : "unsigned", size);
3454 }
3455
3456 return NO_RELOC;
3457 }
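/* Example mappings for the generic (other == NO_RELOC) cases:
   size 4, pcrel -> BFD_RELOC_32_PCREL; size 4, no pcrel, sign > 0
   -> BFD_RELOC_X86_64_32S; size 8, no pcrel -> BFD_RELOC_64.  */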
3458
3459 /* Here we decide which fixups can be adjusted to make them relative to
3460 the beginning of the section instead of the symbol. Basically we need
3461 to make sure that the dynamic relocations are done correctly, so in
3462 some cases we force the original symbol to be used. */
3463
3464 int
3465 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3466 {
3467 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3468 if (!IS_ELF)
3469 return 1;
3470
3471 /* Don't adjust pc-relative references to merge sections in 64-bit
3472 mode. */
3473 if (use_rela_relocations
3474 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3475 && fixP->fx_pcrel)
3476 return 0;
3477
3478 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3479 and changed later by validate_fix. */
3480 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3481 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3482 return 0;
3483
3484 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
3485 for size relocations. */
3486 if (fixP->fx_r_type == BFD_RELOC_SIZE32
3487 || fixP->fx_r_type == BFD_RELOC_SIZE64
3488 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3489 || fixP->fx_r_type == BFD_RELOC_386_GOT32
3490 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3491 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3492 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3493 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3494 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3495 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3496 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3497 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3498 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3499 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3500 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3501 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3502 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3503 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3504 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3505 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3506 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3507 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3508 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3509 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3510 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3511 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3512 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3513 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3514 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3515 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3516 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3517 return 0;
3518 #endif
3519 return 1;
3520 }
3521
3522 static int
3523 intel_float_operand (const char *mnemonic)
3524 {
3525 /* Note that the value returned is meaningful only for opcodes with (memory)
3526 operands, hence the code here is free to improperly handle opcodes that
3527 have no operands (for better performance and smaller code). */
3528
3529 if (mnemonic[0] != 'f')
3530 return 0; /* non-math */
3531
3532 switch (mnemonic[1])
3533 {
3534 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3535 the fs segment override prefix are not currently handled, because
3536 no call path can make opcodes without operands get here. */
3537 case 'i':
3538 return 2 /* integer op */;
3539 case 'l':
3540 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3541 return 3; /* fldcw/fldenv */
3542 break;
3543 case 'n':
3544 if (mnemonic[2] != 'o' /* fnop */)
3545 return 3; /* non-waiting control op */
3546 break;
3547 case 'r':
3548 if (mnemonic[2] == 's')
3549 return 3; /* frstor/frstpm */
3550 break;
3551 case 's':
3552 if (mnemonic[2] == 'a')
3553 return 3; /* fsave */
3554 if (mnemonic[2] == 't')
3555 {
3556 switch (mnemonic[3])
3557 {
3558 case 'c': /* fstcw */
3559 case 'd': /* fstdw */
3560 case 'e': /* fstenv */
3561 case 's': /* fsts[gw] */
3562 return 3;
3563 }
3564 }
3565 break;
3566 case 'x':
3567 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3568 return 0; /* fxsave/fxrstor are not really math ops */
3569 break;
3570 }
3571
3572 return 1;
3573 }
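/* Examples: "fadd" -> 1 (FP-format operand), "fild" -> 2 (integer
   operand), "fldcw" -> 3 (control op, e.g. control word), and
   "fxsave" -> 0 (not treated as a math op).  */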
3574
3575 /* Build the VEX prefix. */
3576
3577 static void
3578 build_vex_prefix (const insn_template *t)
3579 {
3580 unsigned int register_specifier;
3581 unsigned int implied_prefix;
3582 unsigned int vector_length;
3583 unsigned int w;
3584
3585 /* Check register specifier. */
3586 if (i.vex.register_specifier)
3587 {
3588 register_specifier =
3589 ~register_number (i.vex.register_specifier) & 0xf;
3590 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3591 }
3592 else
3593 register_specifier = 0xf;
3594
3595 /* Use the 2-byte VEX prefix by swapping destination and source operands
3596 if there is more than one register operand. */
3597 if (i.reg_operands > 1
3598 && i.vec_encoding != vex_encoding_vex3
3599 && i.dir_encoding == dir_encoding_default
3600 && i.operands == i.reg_operands
3601 && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3602 && i.tm.opcode_modifier.opcodeprefix == VEX0F
3603 && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3604 && i.rex == REX_B)
3605 {
3606 unsigned int xchg = i.operands - 1;
3607 union i386_op temp_op;
3608 i386_operand_type temp_type;
3609
3610 temp_type = i.types[xchg];
3611 i.types[xchg] = i.types[0];
3612 i.types[0] = temp_type;
3613 temp_op = i.op[xchg];
3614 i.op[xchg] = i.op[0];
3615 i.op[0] = temp_op;
3616
3617 gas_assert (i.rm.mode == 3);
3618
3619 i.rex = REX_R;
3620 xchg = i.rm.regmem;
3621 i.rm.regmem = i.rm.reg;
3622 i.rm.reg = xchg;
3623
3624 if (i.tm.opcode_modifier.d)
3625 i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3626 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3627 else /* Use the next insn. */
3628 i.tm = t[1];
3629 }
3630
3631 /* Use the 2-byte VEX prefix by swapping commutative source operands if
3632 there are no memory operands and at least 3 register operands. */
3633 if (i.reg_operands >= 3
3634 && i.vec_encoding != vex_encoding_vex3
3635 && i.reg_operands == i.operands - i.imm_operands
3636 && i.tm.opcode_modifier.vex
3637 && i.tm.opcode_modifier.commutative
3638 && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3639 && i.rex == REX_B
3640 && i.vex.register_specifier
3641 && !(i.vex.register_specifier->reg_flags & RegRex))
3642 {
3643 unsigned int xchg = i.operands - i.reg_operands;
3644 union i386_op temp_op;
3645 i386_operand_type temp_type;
3646
3647 gas_assert (i.tm.opcode_modifier.opcodeprefix == VEX0F);
3648 gas_assert (!i.tm.opcode_modifier.sae);
3649 gas_assert (operand_type_equal (&i.types[i.operands - 2],
3650 &i.types[i.operands - 3]));
3651 gas_assert (i.rm.mode == 3);
3652
3653 temp_type = i.types[xchg];
3654 i.types[xchg] = i.types[xchg + 1];
3655 i.types[xchg + 1] = temp_type;
3656 temp_op = i.op[xchg];
3657 i.op[xchg] = i.op[xchg + 1];
3658 i.op[xchg + 1] = temp_op;
3659
3660 i.rex = 0;
3661 xchg = i.rm.regmem | 8;
3662 i.rm.regmem = ~register_specifier & 0xf;
3663 gas_assert (!(i.rm.regmem & 8));
3664 i.vex.register_specifier += xchg - i.rm.regmem;
3665 register_specifier = ~xchg & 0xf;
3666 }
3667
3668 if (i.tm.opcode_modifier.vex == VEXScalar)
3669 vector_length = avxscalar;
3670 else if (i.tm.opcode_modifier.vex == VEX256)
3671 vector_length = 1;
3672 else
3673 {
3674 unsigned int op;
3675
3676 /* Determine vector length from the last multi-length vector
3677 operand. */
3678 vector_length = 0;
3679 for (op = t->operands; op--;)
3680 if (t->operand_types[op].bitfield.xmmword
3681 && t->operand_types[op].bitfield.ymmword
3682 && i.types[op].bitfield.ymmword)
3683 {
3684 vector_length = 1;
3685 break;
3686 }
3687 }
3688
3689 switch ((i.tm.base_opcode >> (i.tm.opcode_length << 3)) & 0xff)
3690 {
3691 case 0:
3692 implied_prefix = 0;
3693 break;
3694 case DATA_PREFIX_OPCODE:
3695 implied_prefix = 1;
3696 break;
3697 case REPE_PREFIX_OPCODE:
3698 implied_prefix = 2;
3699 break;
3700 case REPNE_PREFIX_OPCODE:
3701 implied_prefix = 3;
3702 break;
3703 default:
3704 abort ();
3705 }
3706
3707 /* Check the REX.W bit and VEXW. */
3708 if (i.tm.opcode_modifier.vexw == VEXWIG)
3709 w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3710 else if (i.tm.opcode_modifier.vexw)
3711 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3712 else
3713 w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3714
3715 /* Use 2-byte VEX prefix if possible. */
3716 if (w == 0
3717 && i.vec_encoding != vex_encoding_vex3
3718 && i.tm.opcode_modifier.opcodeprefix == VEX0F
3719 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3720 {
3721 /* 2-byte VEX prefix. */
3722 unsigned int r;
3723
3724 i.vex.length = 2;
3725 i.vex.bytes[0] = 0xc5;
3726
3727 /* Check the REX.R bit. */
3728 r = (i.rex & REX_R) ? 0 : 1;
3729 i.vex.bytes[1] = (r << 7
3730 | register_specifier << 3
3731 | vector_length << 2
3732 | implied_prefix);
3733 }
3734 else
3735 {
3736 /* 3-byte VEX prefix. */
3737 unsigned int m;
3738
3739 i.vex.length = 3;
3740
3741 switch (i.tm.opcode_modifier.opcodeprefix)
3742 {
3743 case VEX0F:
3744 m = 0x1;
3745 i.vex.bytes[0] = 0xc4;
3746 break;
3747 case VEX0F38:
3748 m = 0x2;
3749 i.vex.bytes[0] = 0xc4;
3750 break;
3751 case VEX0F3A:
3752 m = 0x3;
3753 i.vex.bytes[0] = 0xc4;
3754 break;
3755 case XOP08:
3756 m = 0x8;
3757 i.vex.bytes[0] = 0x8f;
3758 break;
3759 case XOP09:
3760 m = 0x9;
3761 i.vex.bytes[0] = 0x8f;
3762 break;
3763 case XOP0A:
3764 m = 0xa;
3765 i.vex.bytes[0] = 0x8f;
3766 break;
3767 default:
3768 abort ();
3769 }
3770
3771 /* The high 3 bits of the second VEX byte are 1's complement
3772 of RXB bits from REX. */
3773 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3774
3775 i.vex.bytes[2] = (w << 7
3776 | register_specifier << 3
3777 | vector_length << 2
3778 | implied_prefix);
3779 }
3780 }
3781
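/* For reference, the VEX prefix layouts produced above (per the Intel
   SDM):

     2-byte:  C5 | R.vvvv.L.pp
     3-byte:  C4 | R.X.B.m-mmmm | W.vvvv.L.pp

   R/X/B are the complemented REX bits, vvvv the complemented second
   register specifier, L the vector length (0 = 128-bit, 1 = 256-bit)
   and pp the implied prefix (00 = none, 01 = 66, 10 = F3, 11 = F2).  */
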
3782 static INLINE bfd_boolean
3783 is_evex_encoding (const insn_template *t)
3784 {
3785 return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3786 || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3787 || t->opcode_modifier.sae;
3788 }
3789
3790 static INLINE bfd_boolean
3791 is_any_vex_encoding (const insn_template *t)
3792 {
3793 return t->opcode_modifier.vex || is_evex_encoding (t);
3794 }
3795
3796 /* Build the EVEX prefix. */
3797
3798 static void
3799 build_evex_prefix (void)
3800 {
3801 unsigned int register_specifier;
3802 unsigned int implied_prefix;
3803 unsigned int m, w;
3804 rex_byte vrex_used = 0;
3805
3806 /* Check register specifier. */
3807 if (i.vex.register_specifier)
3808 {
3809 gas_assert ((i.vrex & REX_X) == 0);
3810
3811 register_specifier = i.vex.register_specifier->reg_num;
3812 if ((i.vex.register_specifier->reg_flags & RegRex))
3813 register_specifier += 8;
3814 /* The upper 16 registers are encoded in the fourth byte of the
3815 EVEX prefix. */
3816 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3817 i.vex.bytes[3] = 0x8;
3818 register_specifier = ~register_specifier & 0xf;
3819 }
3820 else
3821 {
3822 register_specifier = 0xf;
3823
3824 /* Encode upper 16 vector index register in the fourth byte of
3825 the EVEX prefix. */
3826 if (!(i.vrex & REX_X))
3827 i.vex.bytes[3] = 0x8;
3828 else
3829 vrex_used |= REX_X;
3830 }
3831
3832 switch ((i.tm.base_opcode >> 8) & 0xff)
3833 {
3834 case 0:
3835 implied_prefix = 0;
3836 break;
3837 case DATA_PREFIX_OPCODE:
3838 implied_prefix = 1;
3839 break;
3840 case REPE_PREFIX_OPCODE:
3841 implied_prefix = 2;
3842 break;
3843 case REPNE_PREFIX_OPCODE:
3844 implied_prefix = 3;
3845 break;
3846 default:
3847 abort ();
3848 }
3849
3850 /* 4 byte EVEX prefix. */
3851 i.vex.length = 4;
3852 i.vex.bytes[0] = 0x62;
3853
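/* For reference, the 4-byte EVEX prefix layout being assembled here
   (per the Intel SDM):

     62 | R.X.B.R'.0.0.m.m | W.vvvv.1.pp | z.L'L.b.V'.aaa

   R/X/B/R' and V' are complemented register-extension bits, vvvv the
   complemented register specifier, pp the implied prefix, L'L the
   vector length (or the rounding control when b is set for register
   operands), b the broadcast/RC/SAE bit, z the zeroing-masking bit and
   aaa the opmask register.  */
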
3854 /* mmmm bits. */
3855 switch (i.tm.opcode_modifier.opcodeprefix)
3856 {
3857 case VEX0F:
3858 m = 1;
3859 break;
3860 case VEX0F38:
3861 m = 2;
3862 break;
3863 case VEX0F3A:
3864 m = 3;
3865 break;
3866 default:
3867 abort ();
3868 break;
3869 }
3870
3871 /* The high 3 bits of the second EVEX byte are 1's complement of RXB
3872 bits from REX. */
3873 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3874
3875 /* The fifth bit of the second EVEX byte is 1's complement of the
3876 REX_R bit in VREX. */
3877 if (!(i.vrex & REX_R))
3878 i.vex.bytes[1] |= 0x10;
3879 else
3880 vrex_used |= REX_R;
3881
3882 if ((i.reg_operands + i.imm_operands) == i.operands)
3883 {
3884 /* When all operands are registers, the REX_X bit in REX is not
3885 used. We reuse it to encode the upper 16 registers, which is
3886 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3887 as 1's complement. */
3888 if ((i.vrex & REX_B))
3889 {
3890 vrex_used |= REX_B;
3891 i.vex.bytes[1] &= ~0x40;
3892 }
3893 }
3894
3895 /* EVEX instructions shouldn't need the REX prefix. */
3896 i.vrex &= ~vrex_used;
3897 gas_assert (i.vrex == 0);
3898
3899 /* Check the REX.W bit and VEXW. */
3900 if (i.tm.opcode_modifier.vexw == VEXWIG)
3901 w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3902 else if (i.tm.opcode_modifier.vexw)
3903 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3904 else
3905 w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3906
3907 /* Encode the U bit. */
3908 implied_prefix |= 0x4;
3909
3910 /* The third byte of the EVEX prefix. */
3911 i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3912
3913 /* The fourth byte of the EVEX prefix. */
3914 /* The zeroing-masking bit. */
3915 if (i.mask && i.mask->zeroing)
3916 i.vex.bytes[3] |= 0x80;
3917
3918 /* Encode vector length and the broadcast bit only when there is no rounding control; RC reuses the L'L and b bits. */
3919 if (!i.rounding)
3920 {
3921 /* Encode the vector length. */
3922 unsigned int vec_length;
3923
3924 if (!i.tm.opcode_modifier.evex
3925 || i.tm.opcode_modifier.evex == EVEXDYN)
3926 {
3927 unsigned int op;
3928
3929 /* Determine vector length from the last multi-length vector
3930 operand. */
3931 for (op = i.operands; op--;)
3932 if (i.tm.operand_types[op].bitfield.xmmword
3933 + i.tm.operand_types[op].bitfield.ymmword
3934 + i.tm.operand_types[op].bitfield.zmmword > 1)
3935 {
3936 if (i.types[op].bitfield.zmmword)
3937 {
3938 i.tm.opcode_modifier.evex = EVEX512;
3939 break;
3940 }
3941 else if (i.types[op].bitfield.ymmword)
3942 {
3943 i.tm.opcode_modifier.evex = EVEX256;
3944 break;
3945 }
3946 else if (i.types[op].bitfield.xmmword)
3947 {
3948 i.tm.opcode_modifier.evex = EVEX128;
3949 break;
3950 }
3951 else if (i.broadcast && (int) op == i.broadcast->operand)
3952 {
3953 switch (i.broadcast->bytes)
3954 {
3955 case 64:
3956 i.tm.opcode_modifier.evex = EVEX512;
3957 break;
3958 case 32:
3959 i.tm.opcode_modifier.evex = EVEX256;
3960 break;
3961 case 16:
3962 i.tm.opcode_modifier.evex = EVEX128;
3963 break;
3964 default:
3965 abort ();
3966 }
3967 break;
3968 }
3969 }
3970
3971 if (op >= MAX_OPERANDS)
3972 abort ();
3973 }
3974
3975 switch (i.tm.opcode_modifier.evex)
3976 {
3977 case EVEXLIG: /* LL' is ignored */
3978 vec_length = evexlig << 5;
3979 break;
3980 case EVEX128:
3981 vec_length = 0 << 5;
3982 break;
3983 case EVEX256:
3984 vec_length = 1 << 5;
3985 break;
3986 case EVEX512:
3987 vec_length = 2 << 5;
3988 break;
3989 default:
3990 abort ();
3991 break;
3992 }
3993 i.vex.bytes[3] |= vec_length;
3994 /* Encode the broadcast bit. */
3995 if (i.broadcast)
3996 i.vex.bytes[3] |= 0x10;
3997 }
3998 else
3999 {
4000 if (i.rounding->type != saeonly)
4001 i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
4002 else
4003 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
4004 }
4005
4006 if (i.mask && i.mask->mask)
4007 i.vex.bytes[3] |= i.mask->mask->reg_num;
4008 }
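/* Worked example (illustrative only; layout per the Intel SDM:
   62 | R X B R' 0 0 m m | W vvvv 1 pp | z L'L b V' aaa):
   vaddps %zmm2, %zmm1, %zmm0{%k1} -> 62 F1 74 49 58 C2
   (F1: ~RXB=111b, R'=1, mm=01b for the 0F map;
   74: W=0, vvvv=~1=1110b, fixed 1, pp=00b;
   49: z=0, L'L=10b for 512 bits, b=0, V'=1, aaa=001b for %k1). */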
4009
4010 static void
4011 process_immext (void)
4012 {
4013 expressionS *exp;
4014
4015 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
4016 which is coded in the same place as an 8-bit immediate field
4017 would be. Here we fake an 8-bit immediate operand from the
4018 opcode suffix stored in tm.extension_opcode.
4019
4020 AVX instructions also use this encoding for some
4021 3-operand instructions. */
4022
4023 gas_assert (i.imm_operands <= 1
4024 && (i.operands <= 2
4025 || (is_any_vex_encoding (&i.tm)
4026 && i.operands <= 4)));
4027
4028 exp = &im_expressions[i.imm_operands++];
4029 i.op[i.operands].imms = exp;
4030 i.types[i.operands] = imm8;
4031 i.operands++;
4032 exp->X_op = O_constant;
4033 exp->X_add_number = i.tm.extension_opcode;
4034 i.tm.extension_opcode = None;
4035 }
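/* For illustration (assumed example, not from the original source):
   3DNow! pfadd is encoded as 0F 0F /r with suffix byte 9E, so for
   `pfadd %mm1, %mm0' the 9E held in tm.extension_opcode becomes a
   fake trailing imm8 operand and is emitted like any immediate. */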
4036
4037
4038 static int
4039 check_hle (void)
4040 {
4041 switch (i.tm.opcode_modifier.prefixok)
4042 {
4043 default:
4044 abort ();
4045 case PrefixLock:
4046 case PrefixNone:
4047 case PrefixNoTrack:
4048 case PrefixRep:
4049 as_bad (_("invalid instruction `%s' after `%s'"),
4050 i.tm.name, i.hle_prefix);
4051 return 0;
4052 case PrefixHLELock:
4053 if (i.prefix[LOCK_PREFIX])
4054 return 1;
4055 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
4056 return 0;
4057 case PrefixHLEAny:
4058 return 1;
4059 case PrefixHLERelease:
4060 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
4061 {
4062 as_bad (_("instruction `%s' after `xacquire' not allowed"),
4063 i.tm.name);
4064 return 0;
4065 }
4066 if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
4067 {
4068 as_bad (_("memory destination needed for instruction `%s'"
4069 " after `xrelease'"), i.tm.name);
4070 return 0;
4071 }
4072 return 1;
4073 }
4074 }
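/* Usage sketch (illustrative assumption): `xacquire lock incl (%rax)'
   passes the PrefixHLELock case since LOCK is present, while
   `xrelease movl %eax, (%rbx)' is the PrefixHLERelease case, which
   additionally insists on a memory destination. */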
4075
4076 /* Try the shortest encoding by shortening operand size. */
4077
4078 static void
4079 optimize_encoding (void)
4080 {
4081 unsigned int j;
4082
4083 if (optimize_for_space
4084 && !is_any_vex_encoding (&i.tm)
4085 && i.reg_operands == 1
4086 && i.imm_operands == 1
4087 && !i.types[1].bitfield.byte
4088 && i.op[0].imms->X_op == O_constant
4089 && fits_in_imm7 (i.op[0].imms->X_add_number)
4090 && (i.tm.base_opcode == 0xa8
4091 || (i.tm.base_opcode == 0xf6
4092 && i.tm.extension_opcode == 0x0)))
4093 {
4094 /* Optimize: -Os:
4095 test $imm7, %r64/%r32/%r16 -> test $imm7, %r8
4096 */
4097 unsigned int base_regnum = i.op[1].regs->reg_num;
4098 if (flag_code == CODE_64BIT || base_regnum < 4)
4099 {
4100 i.types[1].bitfield.byte = 1;
4101 /* Ignore the suffix. */
4102 i.suffix = 0;
4103 /* Convert to byte registers. */
4104 if (i.types[1].bitfield.word)
4105 j = 16;
4106 else if (i.types[1].bitfield.dword)
4107 j = 32;
4108 else
4109 j = 48;
4110 if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4111 j += 8;
4112 i.op[1].regs -= j;
4113 }
4114 }
4115 else if (flag_code == CODE_64BIT
4116 && !is_any_vex_encoding (&i.tm)
4117 && ((i.types[1].bitfield.qword
4118 && i.reg_operands == 1
4119 && i.imm_operands == 1
4120 && i.op[0].imms->X_op == O_constant
4121 && ((i.tm.base_opcode == 0xb8
4122 && i.tm.extension_opcode == None
4123 && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4124 || (fits_in_imm31 (i.op[0].imms->X_add_number)
4125 && ((i.tm.base_opcode == 0x24
4126 || i.tm.base_opcode == 0xa8)
4127 || (i.tm.base_opcode == 0x80
4128 && i.tm.extension_opcode == 0x4)
4129 || ((i.tm.base_opcode == 0xf6
4130 || (i.tm.base_opcode | 1) == 0xc7)
4131 && i.tm.extension_opcode == 0x0)))
4132 || (fits_in_imm7 (i.op[0].imms->X_add_number)
4133 && i.tm.base_opcode == 0x83
4134 && i.tm.extension_opcode == 0x4)))
4135 || (i.types[0].bitfield.qword
4136 && ((i.reg_operands == 2
4137 && i.op[0].regs == i.op[1].regs
4138 && (i.tm.base_opcode == 0x30
4139 || i.tm.base_opcode == 0x28))
4140 || (i.reg_operands == 1
4141 && i.operands == 1
4142 && i.tm.base_opcode == 0x30)))))
4143 {
4144 /* Optimize: -O:
4145 andq $imm31, %r64 -> andl $imm31, %r32
4146 andq $imm7, %r64 -> andl $imm7, %r32
4147 testq $imm31, %r64 -> testl $imm31, %r32
4148 xorq %r64, %r64 -> xorl %r32, %r32
4149 subq %r64, %r64 -> subl %r32, %r32
4150 movq $imm31, %r64 -> movl $imm31, %r32
4151 movq $imm32, %r64 -> movl $imm32, %r32
4152 */
4153 i.tm.opcode_modifier.norex64 = 1;
4154 if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
4155 {
4156 /* Handle
4157 movq $imm31, %r64 -> movl $imm31, %r32
4158 movq $imm32, %r64 -> movl $imm32, %r32
4159 */
4160 i.tm.operand_types[0].bitfield.imm32 = 1;
4161 i.tm.operand_types[0].bitfield.imm32s = 0;
4162 i.tm.operand_types[0].bitfield.imm64 = 0;
4163 i.types[0].bitfield.imm32 = 1;
4164 i.types[0].bitfield.imm32s = 0;
4165 i.types[0].bitfield.imm64 = 0;
4166 i.types[1].bitfield.dword = 1;
4167 i.types[1].bitfield.qword = 0;
4168 if ((i.tm.base_opcode | 1) == 0xc7)
4169 {
4170 /* Handle
4171 movq $imm31, %r64 -> movl $imm31, %r32
4172 */
4173 i.tm.base_opcode = 0xb8;
4174 i.tm.extension_opcode = None;
4175 i.tm.opcode_modifier.w = 0;
4176 i.tm.opcode_modifier.modrm = 0;
4177 }
4178 }
4179 }
4180 else if (optimize > 1
4181 && !optimize_for_space
4182 && !is_any_vex_encoding (&i.tm)
4183 && i.reg_operands == 2
4184 && i.op[0].regs == i.op[1].regs
4185 && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4186 || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4187 && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4188 {
4189 /* Optimize: -O2:
4190 andb %rN, %rN -> testb %rN, %rN
4191 andw %rN, %rN -> testw %rN, %rN
4192 andq %rN, %rN -> testq %rN, %rN
4193 orb %rN, %rN -> testb %rN, %rN
4194 orw %rN, %rN -> testw %rN, %rN
4195 orq %rN, %rN -> testq %rN, %rN
4196
4197 and outside of 64-bit mode
4198
4199 andl %rN, %rN -> testl %rN, %rN
4200 orl %rN, %rN -> testl %rN, %rN
4201 */
4202 i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4203 }
4204 else if (i.reg_operands == 3
4205 && i.op[0].regs == i.op[1].regs
4206 && !i.types[2].bitfield.xmmword
4207 && (i.tm.opcode_modifier.vex
4208 || ((!i.mask || i.mask->zeroing)
4209 && !i.rounding
4210 && is_evex_encoding (&i.tm)
4211 && (i.vec_encoding != vex_encoding_evex
4212 || cpu_arch_isa_flags.bitfield.cpuavx512vl
4213 || i.tm.cpu_flags.bitfield.cpuavx512vl
4214 || (i.tm.operand_types[2].bitfield.zmmword
4215 && i.types[2].bitfield.ymmword))))
4216 && ((i.tm.base_opcode == 0x55
4217 || i.tm.base_opcode == 0x6655
4218 || i.tm.base_opcode == 0x66df
4219 || i.tm.base_opcode == 0x57
4220 || i.tm.base_opcode == 0x6657
4221 || i.tm.base_opcode == 0x66ef
4222 || i.tm.base_opcode == 0x66f8
4223 || i.tm.base_opcode == 0x66f9
4224 || i.tm.base_opcode == 0x66fa
4225 || i.tm.base_opcode == 0x66fb
4226 || i.tm.base_opcode == 0x42
4227 || i.tm.base_opcode == 0x6642
4228 || i.tm.base_opcode == 0x47
4229 || i.tm.base_opcode == 0x6647)
4230 && i.tm.extension_opcode == None))
4231 {
4232 /* Optimize: -O1:
4233 VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4234 vpsubq and vpsubw:
4235 EVEX VOP %zmmM, %zmmM, %zmmN
4236 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4237 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4238 EVEX VOP %ymmM, %ymmM, %ymmN
4239 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4240 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4241 VEX VOP %ymmM, %ymmM, %ymmN
4242 -> VEX VOP %xmmM, %xmmM, %xmmN
4243 VOP, one of vpandn and vpxor:
4244 VEX VOP %ymmM, %ymmM, %ymmN
4245 -> VEX VOP %xmmM, %xmmM, %xmmN
4246 VOP, one of vpandnd and vpandnq:
4247 EVEX VOP %zmmM, %zmmM, %zmmN
4248 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4249 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4250 EVEX VOP %ymmM, %ymmM, %ymmN
4251 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4252 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4253 VOP, one of vpxord and vpxorq:
4254 EVEX VOP %zmmM, %zmmM, %zmmN
4255 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4256 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4257 EVEX VOP %ymmM, %ymmM, %ymmN
4258 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4259 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4260 VOP, one of kxord and kxorq:
4261 VEX VOP %kM, %kM, %kN
4262 -> VEX kxorw %kM, %kM, %kN
4263 VOP, one of kandnd and kandnq:
4264 VEX VOP %kM, %kM, %kN
4265 -> VEX kandnw %kM, %kM, %kN
4266 */
4267 if (is_evex_encoding (&i.tm))
4268 {
4269 if (i.vec_encoding != vex_encoding_evex)
4270 {
4271 i.tm.opcode_modifier.vex = VEX128;
4272 i.tm.opcode_modifier.vexw = VEXW0;
4273 i.tm.opcode_modifier.evex = 0;
4274 }
4275 else if (optimize > 1)
4276 i.tm.opcode_modifier.evex = EVEX128;
4277 else
4278 return;
4279 }
4280 else if (i.tm.operand_types[0].bitfield.class == RegMask)
4281 {
4282 i.tm.base_opcode &= 0xff;
4283 i.tm.opcode_modifier.vexw = VEXW0;
4284 }
4285 else
4286 i.tm.opcode_modifier.vex = VEX128;
4287
4288 if (i.tm.opcode_modifier.vex)
4289 for (j = 0; j < 3; j++)
4290 {
4291 i.types[j].bitfield.xmmword = 1;
4292 i.types[j].bitfield.ymmword = 0;
4293 }
4294 }
4295 else if (i.vec_encoding != vex_encoding_evex
4296 && !i.types[0].bitfield.zmmword
4297 && !i.types[1].bitfield.zmmword
4298 && !i.mask
4299 && !i.broadcast
4300 && is_evex_encoding (&i.tm)
4301 && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4302 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
4303 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f
4304 || (i.tm.base_opcode & ~4) == 0x66db
4305 || (i.tm.base_opcode & ~4) == 0x66eb)
4306 && i.tm.extension_opcode == None)
4307 {
4308 /* Optimize: -O1:
4309 VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4310 vmovdqu32 and vmovdqu64:
4311 EVEX VOP %xmmM, %xmmN
4312 -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4313 EVEX VOP %ymmM, %ymmN
4314 -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4315 EVEX VOP %xmmM, mem
4316 -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4317 EVEX VOP %ymmM, mem
4318 -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4319 EVEX VOP mem, %xmmN
4320 -> VEX vmovdqa|vmovdqu mem, %xmmN (N < 16)
4321 EVEX VOP mem, %ymmN
4322 -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4323 VOP, one of vpand, vpandn, vpor, vpxor:
4324 EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4325 -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4326 EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4327 -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4328 EVEX VOP{d,q} mem, %xmmM, %xmmN
4329 -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4330 EVEX VOP{d,q} mem, %ymmM, %ymmN
4331 -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4332 */
4333 for (j = 0; j < i.operands; j++)
4334 if (operand_type_check (i.types[j], disp)
4335 && i.op[j].disps->X_op == O_constant)
4336 {
4337 /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4338 has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4339 bytes, we choose EVEX Disp8 over VEX Disp32. */
4340 int evex_disp8, vex_disp8;
4341 unsigned int memshift = i.memshift;
4342 offsetT n = i.op[j].disps->X_add_number;
4343
4344 evex_disp8 = fits_in_disp8 (n);
4345 i.memshift = 0;
4346 vex_disp8 = fits_in_disp8 (n);
4347 if (evex_disp8 != vex_disp8)
4348 {
4349 i.memshift = memshift;
4350 return;
4351 }
4352
4353 i.types[j].bitfield.disp8 = vex_disp8;
4354 break;
4355 }
4356 if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4357 i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
4358 i.tm.opcode_modifier.vex
4359 = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4360 i.tm.opcode_modifier.vexw = VEXW0;
4361 /* VPAND, VPOR, and VPXOR are commutative. */
4362 if (i.reg_operands == 3 && i.tm.base_opcode != 0x66df)
4363 i.tm.opcode_modifier.commutative = 1;
4364 i.tm.opcode_modifier.evex = 0;
4365 i.tm.opcode_modifier.masking = 0;
4366 i.tm.opcode_modifier.broadcast = 0;
4367 i.tm.opcode_modifier.disp8memshift = 0;
4368 i.memshift = 0;
4369 if (j < i.operands)
4370 i.types[j].bitfield.disp8
4371 = fits_in_disp8 (i.op[j].disps->X_add_number);
4372 }
4373 }
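/* Byte-count sketch of the transformations above (illustrative, not
   from the original source):
   movq $1, %rax (48 C7 C0 01 00 00 00, 7 bytes)
   -> movl $1, %eax (B8 01 00 00 00, 5 bytes);
   xorq %rbx, %rbx (48 31 DB) -> xorl %ebx, %ebx (31 DB), the upper
   32 bits being zeroed implicitly in 64-bit mode;
   EVEX vpxord %zmm1, %zmm1, %zmm1 (6 bytes)
   -> VEX vpxor %xmm1, %xmm1, %xmm1 (C5 F1 EF C9, 4 bytes).
   Note the Disp8*N check: with a 16-byte operand, 256(%rax) encodes
   as disp8 16 under EVEX but needs a disp32 under VEX, so such
   operands are deliberately left in EVEX form. */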
4374
4375 /* Return non-zero for load instruction. */
4376
4377 static int
4378 load_insn_p (void)
4379 {
4380 unsigned int dest;
4381 int any_vex_p = is_any_vex_encoding (&i.tm);
4382 unsigned int base_opcode = i.tm.base_opcode | 1;
4383
4384 if (!any_vex_p)
4385 {
4386 /* Anysize insns: lea, invlpg, clflush, prefetchnta, prefetcht0,
4387 prefetcht1, prefetcht2, prefetchw, bndmk, bndcl, bndcu, bndcn,
4388 bndstx, bndldx, prefetchwt1, clflushopt, clwb, cldemote. */
4389 if (i.tm.opcode_modifier.anysize)
4390 return 0;
4391
4392 /* pop, popf, popa. */
4393 if (strcmp (i.tm.name, "pop") == 0
4394 || i.tm.base_opcode == 0x9d
4395 || i.tm.base_opcode == 0x61)
4396 return 1;
4397
4398 /* movs, cmps, lods, scas. */
4399 if ((i.tm.base_opcode | 0xb) == 0xaf)
4400 return 1;
4401
4402 /* outs, xlatb. */
4403 if (base_opcode == 0x6f
4404 || i.tm.base_opcode == 0xd7)
4405 return 1;
4406 /* NB: AMD-specific insns with implicit memory operands are
4407 intentionally not covered. */
4408 }
4409
4410 /* No memory operand. */
4411 if (!i.mem_operands)
4412 return 0;
4413
4414 if (any_vex_p)
4415 {
4416 /* vldmxcsr. */
4417 if (i.tm.base_opcode == 0xae
4418 && i.tm.opcode_modifier.vex
4419 && i.tm.opcode_modifier.opcodeprefix == VEX0F
4420 && i.tm.extension_opcode == 2)
4421 return 1;
4422 }
4423 else
4424 {
4425 /* test, not, neg, mul, imul, div, idiv. */
4426 if ((i.tm.base_opcode == 0xf6 || i.tm.base_opcode == 0xf7)
4427 && i.tm.extension_opcode != 1)
4428 return 1;
4429
4430 /* inc, dec. */
4431 if (base_opcode == 0xff && i.tm.extension_opcode <= 1)
4432 return 1;
4433
4434 /* add, or, adc, sbb, and, sub, xor, cmp. */
4435 if (i.tm.base_opcode >= 0x80 && i.tm.base_opcode <= 0x83)
4436 return 1;
4437
4438 /* bt, bts, btr, btc. */
4439 if (i.tm.base_opcode == 0xfba
4440 && (i.tm.extension_opcode >= 4 && i.tm.extension_opcode <= 7))
4441 return 1;
4442
4443 /* rol, ror, rcl, rcr, shl/sal, shr, sar. */
4444 if ((base_opcode == 0xc1
4445 || (i.tm.base_opcode >= 0xd0 && i.tm.base_opcode <= 0xd3))
4446 && i.tm.extension_opcode != 6)
4447 return 1;
4448
4449 /* cmpxchg8b, cmpxchg16b, xrstors. */
4450 if (i.tm.base_opcode == 0xfc7
4451 && i.tm.opcode_modifier.opcodeprefix == 0
4452 && (i.tm.extension_opcode == 1 || i.tm.extension_opcode == 3))
4453 return 1;
4454
4455 /* fxrstor, ldmxcsr, xrstor. */
4456 if (i.tm.base_opcode == 0xfae
4457 && (i.tm.extension_opcode == 1
4458 || i.tm.extension_opcode == 2
4459 || i.tm.extension_opcode == 5))
4460 return 1;
4461
4462 /* lgdt, lidt, lmsw. */
4463 if (i.tm.base_opcode == 0xf01
4464 && (i.tm.extension_opcode == 2
4465 || i.tm.extension_opcode == 3
4466 || i.tm.extension_opcode == 6))
4467 return 1;
4468
4469 /* vmptrld */
4470 if (i.tm.base_opcode == 0xfc7
4471 && i.tm.opcode_modifier.opcodeprefix == 0
4472 && i.tm.extension_opcode == 6)
4473 return 1;
4474
4475 /* Check for x87 instructions. */
4476 if (i.tm.base_opcode >= 0xd8 && i.tm.base_opcode <= 0xdf)
4477 {
4478 /* Skip fst, fstp, fstenv, fstcw. */
4479 if (i.tm.base_opcode == 0xd9
4480 && (i.tm.extension_opcode == 2
4481 || i.tm.extension_opcode == 3
4482 || i.tm.extension_opcode == 6
4483 || i.tm.extension_opcode == 7))
4484 return 0;
4485
4486 /* Skip fisttp, fist, fistp, fstp. */
4487 if (i.tm.base_opcode == 0xdb
4488 && (i.tm.extension_opcode == 1
4489 || i.tm.extension_opcode == 2
4490 || i.tm.extension_opcode == 3
4491 || i.tm.extension_opcode == 7))
4492 return 0;
4493
4494 /* Skip fisttp, fst, fstp, fsave, fstsw. */
4495 if (i.tm.base_opcode == 0xdd
4496 && (i.tm.extension_opcode == 1
4497 || i.tm.extension_opcode == 2
4498 || i.tm.extension_opcode == 3
4499 || i.tm.extension_opcode == 6
4500 || i.tm.extension_opcode == 7))
4501 return 0;
4502
4503 /* Skip fisttp, fist, fistp, fbstp, fistp. */
4504 if (i.tm.base_opcode == 0xdf
4505 && (i.tm.extension_opcode == 1
4506 || i.tm.extension_opcode == 2
4507 || i.tm.extension_opcode == 3
4508 || i.tm.extension_opcode == 6
4509 || i.tm.extension_opcode == 7))
4510 return 0;
4511
4512 return 1;
4513 }
4514 }
4515
4516 dest = i.operands - 1;
4517
4518 /* Check fake imm8 operand and 3 source operands. */
4519 if ((i.tm.opcode_modifier.immext
4520 || i.tm.opcode_modifier.vexsources == VEX3SOURCES)
4521 && i.types[dest].bitfield.imm8)
4522 dest--;
4523
4524 /* add, or, adc, sbb, and, sub, xor, cmp, test, xchg, xadd */
4525 if (!any_vex_p
4526 && (base_opcode == 0x1
4527 || base_opcode == 0x9
4528 || base_opcode == 0x11
4529 || base_opcode == 0x19
4530 || base_opcode == 0x21
4531 || base_opcode == 0x29
4532 || base_opcode == 0x31
4533 || base_opcode == 0x39
4534 || (i.tm.base_opcode >= 0x84 && i.tm.base_opcode <= 0x87)
4535 || base_opcode == 0xfc1))
4536 return 1;
4537
4538 /* Check for load instruction. */
4539 return (i.types[dest].bitfield.class != ClassNone
4540 || i.types[dest].bitfield.instance == Accum);
4541 }
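/* Examples (illustrative): `movl (%rax), %ebx' falls through to the
   final register-destination check and counts as a load;
   `addl %ebx, (%rax)' is a read-modify-write caught by the explicit
   opcode list above; a plain store like `movl %ebx, (%rax)' returns
   0, so -mlfence-after-load leaves it alone. */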
4542
4543 /* Output lfence (0F AE E8) after instruction. */
4544
4545 static void
4546 insert_lfence_after (void)
4547 {
4548 if (lfence_after_load && load_insn_p ())
4549 {
4550 /* There are also two REP string instructions that require
4551 special treatment. Specifically, the compare string (CMPS)
4552 and scan string (SCAS) instructions set EFLAGS in a manner
4553 that depends on the data being compared/scanned. When used
4554 with a REP prefix, the number of iterations may therefore
4555 vary depending on this data. If the data is a program secret
4556 chosen by the adversary using an LVI method,
4557 then this data-dependent behavior may leak some aspect
4558 of the secret. */
4559 if (((i.tm.base_opcode | 0x1) == 0xa7
4560 || (i.tm.base_opcode | 0x1) == 0xaf)
4561 && i.prefix[REP_PREFIX])
4562 {
4563 as_warn (_("`%s` changes flags which would affect control flow behavior"),
4564 i.tm.name);
4565 }
4566 char *p = frag_more (3);
4567 *p++ = 0xf;
4568 *p++ = 0xae;
4569 *p = 0xe8;
4570 }
4571 }
4572
4573 /* Output lfence (0F AE E8) before instruction. */
4574
4575 static void
4576 insert_lfence_before (void)
4577 {
4578 char *p;
4579
4580 if (is_any_vex_encoding (&i.tm))
4581 return;
4582
4583 if (i.tm.base_opcode == 0xff
4584 && (i.tm.extension_opcode == 2 || i.tm.extension_opcode == 4))
4585 {
4586 /* Insert lfence before indirect branch if needed. */
4587
4588 if (lfence_before_indirect_branch == lfence_branch_none)
4589 return;
4590
4591 if (i.operands != 1)
4592 abort ();
4593
4594 if (i.reg_operands == 1)
4595 {
4596 /* Indirect branch via register. Don't insert lfence with
4597 -mlfence-after-load=yes. */
4598 if (lfence_after_load
4599 || lfence_before_indirect_branch == lfence_branch_memory)
4600 return;
4601 }
4602 else if (i.mem_operands == 1
4603 && lfence_before_indirect_branch != lfence_branch_register)
4604 {
4605 as_warn (_("indirect `%s` with memory operand should be avoided"),
4606 i.tm.name);
4607 return;
4608 }
4609 else
4610 return;
4611
4612 if (last_insn.kind != last_insn_other
4613 && last_insn.seg == now_seg)
4614 {
4615 as_warn_where (last_insn.file, last_insn.line,
4616 _("`%s` skips -mlfence-before-indirect-branch on `%s`"),
4617 last_insn.name, i.tm.name);
4618 return;
4619 }
4620
4621 p = frag_more (3);
4622 *p++ = 0xf;
4623 *p++ = 0xae;
4624 *p = 0xe8;
4625 return;
4626 }
4627
4628 /* Output or/not/shl and lfence before near ret. */
4629 if (lfence_before_ret != lfence_before_ret_none
4630 && (i.tm.base_opcode == 0xc2
4631 || i.tm.base_opcode == 0xc3))
4632 {
4633 if (last_insn.kind != last_insn_other
4634 && last_insn.seg == now_seg)
4635 {
4636 as_warn_where (last_insn.file, last_insn.line,
4637 _("`%s` skips -mlfence-before-ret on `%s`"),
4638 last_insn.name, i.tm.name);
4639 return;
4640 }
4641
4642 /* A near ret ignores the operand size override in 64-bit code. */
4643 char prefix = flag_code == CODE_64BIT
4644 ? 0x48
4645 : i.prefix[DATA_PREFIX] ? 0x66 : 0x0;
4646
4647 if (lfence_before_ret == lfence_before_ret_not)
4648 {
4649 /* not: 0xf71424, may add prefix
4650 for operand size override or 64-bit code. */
4651 p = frag_more ((prefix ? 2 : 0) + 6 + 3);
4652 if (prefix)
4653 *p++ = prefix;
4654 *p++ = 0xf7;
4655 *p++ = 0x14;
4656 *p++ = 0x24;
4657 if (prefix)
4658 *p++ = prefix;
4659 *p++ = 0xf7;
4660 *p++ = 0x14;
4661 *p++ = 0x24;
4662 }
4663 else
4664 {
4665 p = frag_more ((prefix ? 1 : 0) + 4 + 3);
4666 if (prefix)
4667 *p++ = prefix;
4668 if (lfence_before_ret == lfence_before_ret_or)
4669 {
4670 /* or: 0x830c2400, may add prefix
4671 for operand size override or 64-bit code. */
4672 *p++ = 0x83;
4673 *p++ = 0x0c;
4674 }
4675 else
4676 {
4677 /* shl: 0xc1242400, may add prefix
4678 for operand size override or 64-bit code. */
4679 *p++ = 0xc1;
4680 *p++ = 0x24;
4681 }
4682
4683 *p++ = 0x24;
4684 *p++ = 0x0;
4685 }
4686
4687 *p++ = 0xf;
4688 *p++ = 0xae;
4689 *p = 0xe8;
4690 }
4691 }
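/* Sketch of the emitted sequences (illustrative): with
   -mlfence-before-indirect-branch=all, `jmp *%rax' becomes
   0F AE E8 (lfence) followed by FF E0 (jmp *%rax), while the memory
   form `jmp *(%rax)' only draws the warning above. With
   -mlfence-before-ret=or in 64-bit mode, `ret' becomes
   48 83 0C 24 00 (orq $0x0, (%rsp)), 0F AE E8 (lfence), C3 (ret). */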
4692
4693 /* This is the guts of the machine-dependent assembler. LINE points to a
4694 machine dependent instruction. This function is supposed to emit
4695 the frags/bytes it assembles to. */
4696
4697 void
4698 md_assemble (char *line)
4699 {
4700 unsigned int j;
4701 char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4702 const insn_template *t;
4703
4704 /* Initialize globals. */
4705 memset (&i, '\0', sizeof (i));
4706 for (j = 0; j < MAX_OPERANDS; j++)
4707 i.reloc[j] = NO_RELOC;
4708 memset (disp_expressions, '\0', sizeof (disp_expressions));
4709 memset (im_expressions, '\0', sizeof (im_expressions));
4710 save_stack_p = save_stack;
4711
4712 /* First parse an instruction mnemonic & call i386_operand for the operands.
4713 We assume that the scrubber has arranged it so that line[0] is the valid
4714 start of a (possibly prefixed) mnemonic. */
4715
4716 line = parse_insn (line, mnemonic);
4717 if (line == NULL)
4718 return;
4719 mnem_suffix = i.suffix;
4720
4721 line = parse_operands (line, mnemonic);
4722 this_operand = -1;
4723 xfree (i.memop1_string);
4724 i.memop1_string = NULL;
4725 if (line == NULL)
4726 return;
4727
4728 /* Now we've parsed the mnemonic into a set of templates, and have the
4729 operands at hand. */
4730
4731 /* All Intel opcodes have reversed operands except for "bound", "enter",
4732 "monitor*", "mwait*", "tpause", and "umwait". We also don't reverse
4733 intersegment "jmp" and "call" instructions with 2 immediate operands so
4734 that the immediate segment precedes the offset, as it does when in AT&T
4735 mode. */
4736 if (intel_syntax
4737 && i.operands > 1
4738 && (strcmp (mnemonic, "bound") != 0)
4739 && (strcmp (mnemonic, "invlpga") != 0)
4740 && (strncmp (mnemonic, "monitor", 7) != 0)
4741 && (strncmp (mnemonic, "mwait", 5) != 0)
4742 && (strcmp (mnemonic, "tpause") != 0)
4743 && (strcmp (mnemonic, "umwait") != 0)
4744 && !(operand_type_check (i.types[0], imm)
4745 && operand_type_check (i.types[1], imm)))
4746 swap_operands ();
4747
4748 /* The order of the immediates should be reversed for the
4749 2-immediate extrq and insertq instructions. */
4750 if (i.imm_operands == 2
4751 && (strcmp (mnemonic, "extrq") == 0
4752 || strcmp (mnemonic, "insertq") == 0))
4753 swap_2_operands (0, 1);
4754
4755 if (i.imm_operands)
4756 optimize_imm ();
4757
4758 /* Don't optimize displacement for movabs since it only takes 64bit
4759 displacement. */
4760 if (i.disp_operands
4761 && i.disp_encoding != disp_encoding_32bit
4762 && (flag_code != CODE_64BIT
4763 || strcmp (mnemonic, "movabs") != 0))
4764 optimize_disp ();
4765
4766 /* Next, we find a template that matches the given insn,
4767 making sure the overlap of the given operands types is consistent
4768 with the template operand types. */
4769
4770 if (!(t = match_template (mnem_suffix)))
4771 return;
4772
4773 if (sse_check != check_none
4774 && !i.tm.opcode_modifier.noavx
4775 && !i.tm.cpu_flags.bitfield.cpuavx
4776 && !i.tm.cpu_flags.bitfield.cpuavx512f
4777 && (i.tm.cpu_flags.bitfield.cpusse
4778 || i.tm.cpu_flags.bitfield.cpusse2
4779 || i.tm.cpu_flags.bitfield.cpusse3
4780 || i.tm.cpu_flags.bitfield.cpussse3
4781 || i.tm.cpu_flags.bitfield.cpusse4_1
4782 || i.tm.cpu_flags.bitfield.cpusse4_2
4783 || i.tm.cpu_flags.bitfield.cpupclmul
4784 || i.tm.cpu_flags.bitfield.cpuaes
4785 || i.tm.cpu_flags.bitfield.cpusha
4786 || i.tm.cpu_flags.bitfield.cpugfni))
4787 {
4788 (sse_check == check_warning
4789 ? as_warn
4790 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4791 }
4792
4793 if (i.tm.opcode_modifier.fwait)
4794 if (!add_prefix (FWAIT_OPCODE))
4795 return;
4796
4797 /* Check if REP prefix is OK. */
4798 if (i.rep_prefix && i.tm.opcode_modifier.prefixok != PrefixRep)
4799 {
4800 as_bad (_("invalid instruction `%s' after `%s'"),
4801 i.tm.name, i.rep_prefix);
4802 return;
4803 }
4804
4805 /* Check for lock without a lockable instruction. Destination operand
4806 must be memory unless it is xchg (0x86). */
4807 if (i.prefix[LOCK_PREFIX]
4808 && (i.tm.opcode_modifier.prefixok < PrefixLock
4809 || i.mem_operands == 0
4810 || (i.tm.base_opcode != 0x86
4811 && !(i.flags[i.operands - 1] & Operand_Mem))))
4812 {
4813 as_bad (_("expecting lockable instruction after `lock'"));
4814 return;
4815 }
4816
4817 /* Check for data size prefix on VEX/XOP/EVEX encoded and SIMD insns. */
4818 if (i.prefix[DATA_PREFIX]
4819 && (is_any_vex_encoding (&i.tm)
4820 || i.tm.operand_types[i.imm_operands].bitfield.class >= RegMMX
4821 || i.tm.operand_types[i.imm_operands + 1].bitfield.class >= RegMMX))
4822 {
4823 as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4824 return;
4825 }
4826
4827 /* Check if HLE prefix is OK. */
4828 if (i.hle_prefix && !check_hle ())
4829 return;
4830
4831 /* Check BND prefix. */
4832 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4833 as_bad (_("expecting valid branch instruction after `bnd'"));
4834
4835 /* Check NOTRACK prefix. */
4836 if (i.notrack_prefix && i.tm.opcode_modifier.prefixok != PrefixNoTrack)
4837 as_bad (_("expecting indirect branch instruction after `notrack'"));
4838
4839 if (i.tm.cpu_flags.bitfield.cpumpx)
4840 {
4841 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4842 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4843 else if (flag_code != CODE_16BIT
4844 ? i.prefix[ADDR_PREFIX]
4845 : i.mem_operands && !i.prefix[ADDR_PREFIX])
4846 as_bad (_("16-bit address isn't allowed in MPX instructions"));
4847 }
4848
4849 /* Insert BND prefix. */
4850 if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4851 {
4852 if (!i.prefix[BND_PREFIX])
4853 add_prefix (BND_PREFIX_OPCODE);
4854 else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4855 {
4856 as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4857 i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4858 }
4859 }
4860
4861 /* Check string instruction segment overrides. */
4862 if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
4863 {
4864 gas_assert (i.mem_operands);
4865 if (!check_string ())
4866 return;
4867 i.disp_operands = 0;
4868 }
4869
4870 if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4871 optimize_encoding ();
4872
4873 if (!process_suffix ())
4874 return;
4875
4876 /* Update operand types and check extended states. */
4877 for (j = 0; j < i.operands; j++)
4878 {
4879 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4880 switch (i.tm.operand_types[j].bitfield.class)
4881 {
4882 default:
4883 break;
4884 case RegMMX:
4885 i.xstate |= xstate_mmx;
4886 break;
4887 case RegMask:
4888 i.xstate |= xstate_mask;
4889 break;
4890 case RegSIMD:
4891 if (i.tm.operand_types[j].bitfield.tmmword)
4892 i.xstate |= xstate_tmm;
4893 else if (i.tm.operand_types[j].bitfield.zmmword)
4894 i.xstate |= xstate_zmm;
4895 else if (i.tm.operand_types[j].bitfield.ymmword)
4896 i.xstate |= xstate_ymm;
4897 else if (i.tm.operand_types[j].bitfield.xmmword)
4898 i.xstate |= xstate_xmm;
4899 break;
4900 }
4901 }
4902
4903 /* Make still unresolved immediate matches conform to size of immediate
4904 given in i.suffix. */
4905 if (!finalize_imm ())
4906 return;
4907
4908 if (i.types[0].bitfield.imm1)
4909 i.imm_operands = 0; /* kludge for shift insns. */
4910
4911 /* We only need to check those implicit registers for instructions
4912 with 3 operands or less. */
4913 if (i.operands <= 3)
4914 for (j = 0; j < i.operands; j++)
4915 if (i.types[j].bitfield.instance != InstanceNone
4916 && !i.types[j].bitfield.xmmword)
4917 i.reg_operands--;
4918
4919 /* For insns with operands there are more diddles to do to the opcode. */
4920 if (i.operands)
4921 {
4922 if (!process_operands ())
4923 return;
4924 }
4925 else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4926 {
4927 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
4928 as_warn (_("translating to `%sp'"), i.tm.name);
4929 }
4930
4931 if (is_any_vex_encoding (&i.tm))
4932 {
4933 if (!cpu_arch_flags.bitfield.cpui286)
4934 {
4935 as_bad (_("instruction `%s' isn't supported outside of protected mode."),
4936 i.tm.name);
4937 return;
4938 }
4939
4940 /* Check for explicit REX prefix. */
4941 if (i.prefix[REX_PREFIX] || i.rex_encoding)
4942 {
4943 as_bad (_("REX prefix invalid with `%s'"), i.tm.name);
4944 return;
4945 }
4946
4947 if (i.tm.opcode_modifier.vex)
4948 build_vex_prefix (t);
4949 else
4950 build_evex_prefix ();
4951
4952 /* The individual REX.RXBW bits got consumed. */
4953 i.rex &= REX_OPCODE;
4954 }
4955
4956 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
4957 instructions may define INT_OPCODE as well, so avoid this corner
4958 case for those instructions that use MODRM. */
4959 if (i.tm.base_opcode == INT_OPCODE
4960 && !i.tm.opcode_modifier.modrm
4961 && i.op[0].imms->X_add_number == 3)
4962 {
4963 i.tm.base_opcode = INT3_OPCODE;
4964 i.imm_operands = 0;
4965 }
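/* E.g. (illustrative) a plain `int $3' assembles to the single byte
   CC rather than CD 03, matching what debuggers expect for a
   breakpoint. */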
4966
4967 if ((i.tm.opcode_modifier.jump == JUMP
4968 || i.tm.opcode_modifier.jump == JUMP_BYTE
4969 || i.tm.opcode_modifier.jump == JUMP_DWORD)
4970 && i.op[0].disps->X_op == O_constant)
4971 {
4972 /* Convert "jmp constant" (and "call constant") to a jump (call) to
4973 the absolute address given by the constant. Since ix86 jumps and
4974 calls are pc relative, we need to generate a reloc. */
4975 i.op[0].disps->X_add_symbol = &abs_symbol;
4976 i.op[0].disps->X_op = O_symbol;
4977 }
4978
4979 /* For 8 bit registers we need an empty rex prefix. Also if the
4980 instruction already has a prefix, we need to convert old
4981 registers to new ones. */
4982
4983 if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
4984 && (i.op[0].regs->reg_flags & RegRex64) != 0)
4985 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
4986 && (i.op[1].regs->reg_flags & RegRex64) != 0)
4987 || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
4988 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
4989 && i.rex != 0))
4990 {
4991 int x;
4992
4993 i.rex |= REX_OPCODE;
4994 for (x = 0; x < 2; x++)
4995 {
4996 /* Look for 8 bit operand that uses old registers. */
4997 if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
4998 && (i.op[x].regs->reg_flags & RegRex64) == 0)
4999 {
5000 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
5001 /* In case it is "hi" register, give up. */
5002 if (i.op[x].regs->reg_num > 3)
5003 as_bad (_("can't encode register '%s%s' in an "
5004 "instruction requiring REX prefix."),
5005 register_prefix, i.op[x].regs->reg_name);
5006
5007 /* Otherwise it is equivalent to the extended register.
5008 Since the encoding doesn't change this is merely
5009 cosmetic cleanup for debug output. */
5010
5011 i.op[x].regs = i.op[x].regs + 8;
5012 }
5013 }
5014 }
5015
5016 if (i.rex == 0 && i.rex_encoding)
5017 {
5018 /* Check if we can add a REX_OPCODE byte. Look for 8 bit operand
5019 that uses legacy register. If it is "hi" register, don't add
5020 the REX_OPCODE byte. */
5021 int x;
5022 for (x = 0; x < 2; x++)
5023 if (i.types[x].bitfield.class == Reg
5024 && i.types[x].bitfield.byte
5025 && (i.op[x].regs->reg_flags & RegRex64) == 0
5026 && i.op[x].regs->reg_num > 3)
5027 {
5028 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
5029 i.rex_encoding = FALSE;
5030 break;
5031 }
5032
5033 if (i.rex_encoding)
5034 i.rex = REX_OPCODE;
5035 }
5036
5037 if (i.rex != 0)
5038 add_prefix (REX_OPCODE | i.rex);
5039
5040 insert_lfence_before ();
5041
5042 /* We are ready to output the insn. */
5043 output_insn ();
5044
5045 insert_lfence_after ();
5046
5047 last_insn.seg = now_seg;
5048
5049 if (i.tm.opcode_modifier.isprefix)
5050 {
5051 last_insn.kind = last_insn_prefix;
5052 last_insn.name = i.tm.name;
5053 last_insn.file = as_where (&last_insn.line);
5054 }
5055 else
5056 last_insn.kind = last_insn_other;
5057 }
5058
5059 static char *
5060 parse_insn (char *line, char *mnemonic)
5061 {
5062 char *l = line;
5063 char *token_start = l;
5064 char *mnem_p;
5065 int supported;
5066 const insn_template *t;
5067 char *dot_p = NULL;
5068
5069 while (1)
5070 {
5071 mnem_p = mnemonic;
5072 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
5073 {
5074 if (*mnem_p == '.')
5075 dot_p = mnem_p;
5076 mnem_p++;
5077 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
5078 {
5079 as_bad (_("no such instruction: `%s'"), token_start);
5080 return NULL;
5081 }
5082 l++;
5083 }
5084 if (!is_space_char (*l)
5085 && *l != END_OF_INSN
5086 && (intel_syntax
5087 || (*l != PREFIX_SEPARATOR
5088 && *l != ',')))
5089 {
5090 as_bad (_("invalid character %s in mnemonic"),
5091 output_invalid (*l));
5092 return NULL;
5093 }
5094 if (token_start == l)
5095 {
5096 if (!intel_syntax && *l == PREFIX_SEPARATOR)
5097 as_bad (_("expecting prefix; got nothing"));
5098 else
5099 as_bad (_("expecting mnemonic; got nothing"));
5100 return NULL;
5101 }
5102
5103 /* Look up instruction (or prefix) via hash table. */
5104 current_templates = (const templates *) str_hash_find (op_hash, mnemonic);
5105
5106 if (*l != END_OF_INSN
5107 && (!is_space_char (*l) || l[1] != END_OF_INSN)
5108 && current_templates
5109 && current_templates->start->opcode_modifier.isprefix)
5110 {
5111 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
5112 {
5113 as_bad ((flag_code != CODE_64BIT
5114 ? _("`%s' is only supported in 64-bit mode")
5115 : _("`%s' is not supported in 64-bit mode")),
5116 current_templates->start->name);
5117 return NULL;
5118 }
5119 /* If we are in 16-bit mode, do not allow addr16 or data16.
5120 Similarly, in 32-bit mode, do not allow addr32 or data32. */
5121 if ((current_templates->start->opcode_modifier.size == SIZE16
5122 || current_templates->start->opcode_modifier.size == SIZE32)
5123 && flag_code != CODE_64BIT
5124 && ((current_templates->start->opcode_modifier.size == SIZE32)
5125 ^ (flag_code == CODE_16BIT)))
5126 {
5127 as_bad (_("redundant %s prefix"),
5128 current_templates->start->name);
5129 return NULL;
5130 }
5131 if (current_templates->start->opcode_length == 0)
5132 {
5133 /* Handle pseudo prefixes. */
5134 switch (current_templates->start->base_opcode)
5135 {
5136 case Prefix_Disp8:
5137 /* {disp8} */
5138 i.disp_encoding = disp_encoding_8bit;
5139 break;
5140 case Prefix_Disp16:
5141 /* {disp16} */
5142 i.disp_encoding = disp_encoding_16bit;
5143 break;
5144 case Prefix_Disp32:
5145 /* {disp32} */
5146 i.disp_encoding = disp_encoding_32bit;
5147 break;
5148 case Prefix_Load:
5149 /* {load} */
5150 i.dir_encoding = dir_encoding_load;
5151 break;
5152 case Prefix_Store:
5153 /* {store} */
5154 i.dir_encoding = dir_encoding_store;
5155 break;
5156 case Prefix_VEX:
5157 /* {vex} */
5158 i.vec_encoding = vex_encoding_vex;
5159 break;
5160 case Prefix_VEX3:
5161 /* {vex3} */
5162 i.vec_encoding = vex_encoding_vex3;
5163 break;
5164 case Prefix_EVEX:
5165 /* {evex} */
5166 i.vec_encoding = vex_encoding_evex;
5167 break;
5168 case Prefix_REX:
5169 /* {rex} */
5170 i.rex_encoding = TRUE;
5171 break;
5172 case Prefix_NoOptimize:
5173 /* {nooptimize} */
5174 i.no_optimize = TRUE;
5175 break;
5176 default:
5177 abort ();
5178 }
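/* Usage sketch (illustrative): pseudo prefixes are written braced
   before the mnemonic, e.g. `{vex3} vmovaps %xmm1, %xmm2' forces
   the 3-byte VEX form and `{disp32} movl 4(%rax), %ebx' forces a
   32-bit displacement where disp8 would otherwise be picked. */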
5179 }
5180 else
5181 {
5182 /* Add prefix, checking for repeated prefixes. */
5183 switch (add_prefix (current_templates->start->base_opcode))
5184 {
5185 case PREFIX_EXIST:
5186 return NULL;
5187 case PREFIX_DS:
5188 if (current_templates->start->cpu_flags.bitfield.cpuibt)
5189 i.notrack_prefix = current_templates->start->name;
5190 break;
5191 case PREFIX_REP:
5192 if (current_templates->start->cpu_flags.bitfield.cpuhle)
5193 i.hle_prefix = current_templates->start->name;
5194 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
5195 i.bnd_prefix = current_templates->start->name;
5196 else
5197 i.rep_prefix = current_templates->start->name;
5198 break;
5199 default:
5200 break;
5201 }
5202 }
5203 /* Skip past PREFIX_SEPARATOR and reset token_start. */
5204 token_start = ++l;
5205 }
5206 else
5207 break;
5208 }
5209
5210 if (!current_templates)
5211 {
5212 /* Deprecated functionality (new code should use pseudo-prefixes instead):
5213 Check if we should swap operand or force 32bit displacement in
5214 encoding. */
5215 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
5216 i.dir_encoding = dir_encoding_swap;
5217 else if (mnem_p - 3 == dot_p
5218 && dot_p[1] == 'd'
5219 && dot_p[2] == '8')
5220 i.disp_encoding = disp_encoding_8bit;
5221 else if (mnem_p - 4 == dot_p
5222 && dot_p[1] == 'd'
5223 && dot_p[2] == '3'
5224 && dot_p[3] == '2')
5225 i.disp_encoding = disp_encoding_32bit;
5226 else
5227 goto check_suffix;
5228 mnem_p = dot_p;
5229 *dot_p = '\0';
5230 current_templates = (const templates *) str_hash_find (op_hash, mnemonic);
5231 }
5232
5233 if (!current_templates)
5234 {
5235 check_suffix:
5236 if (mnem_p > mnemonic)
5237 {
5238 /* See if we can get a match by trimming off a suffix. */
5239 switch (mnem_p[-1])
5240 {
5241 case WORD_MNEM_SUFFIX:
5242 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
5243 i.suffix = SHORT_MNEM_SUFFIX;
5244 else
5245 /* Fall through. */
5246 case BYTE_MNEM_SUFFIX:
5247 case QWORD_MNEM_SUFFIX:
5248 i.suffix = mnem_p[-1];
5249 mnem_p[-1] = '\0';
5250 current_templates
5251 = (const templates *) str_hash_find (op_hash, mnemonic);
5252 break;
5253 case SHORT_MNEM_SUFFIX:
5254 case LONG_MNEM_SUFFIX:
5255 if (!intel_syntax)
5256 {
5257 i.suffix = mnem_p[-1];
5258 mnem_p[-1] = '\0';
5259 current_templates
5260 = (const templates *) str_hash_find (op_hash, mnemonic);
5261 }
5262 break;
5263
5264 /* Intel Syntax. */
5265 case 'd':
5266 if (intel_syntax)
5267 {
5268 if (intel_float_operand (mnemonic) == 1)
5269 i.suffix = SHORT_MNEM_SUFFIX;
5270 else
5271 i.suffix = LONG_MNEM_SUFFIX;
5272 mnem_p[-1] = '\0';
5273 current_templates
5274 = (const templates *) str_hash_find (op_hash, mnemonic);
5275 }
5276 break;
5277 }
5278 }
5279
5280 if (!current_templates)
5281 {
5282 as_bad (_("no such instruction: `%s'"), token_start);
5283 return NULL;
5284 }
5285 }
5286
5287 if (current_templates->start->opcode_modifier.jump == JUMP
5288 || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
5289 {
5290 /* Check for a branch hint. We allow ",pt" and ",pn" for
5291 predict taken and predict not taken respectively.
5292 I'm not sure that branch hints actually do anything on loop
5293 and jcxz insns (JumpByte) for current Pentium4 chips. They
5294 may work in the future and it doesn't hurt to accept them
5295 now. */
5296 if (l[0] == ',' && l[1] == 'p')
5297 {
5298 if (l[2] == 't')
5299 {
5300 if (!add_prefix (DS_PREFIX_OPCODE))
5301 return NULL;
5302 l += 3;
5303 }
5304 else if (l[2] == 'n')
5305 {
5306 if (!add_prefix (CS_PREFIX_OPCODE))
5307 return NULL;
5308 l += 3;
5309 }
5310 }
5311 }
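/* Example (illustrative): `jne,pt target' gains a DS prefix byte
   (3E, predict taken) and `jne,pn target' a CS prefix byte (2E,
   predict not taken). */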
5312 /* Any other comma loses. */
5313 if (*l == ',')
5314 {
5315 as_bad (_("invalid character %s in mnemonic"),
5316 output_invalid (*l));
5317 return NULL;
5318 }
5319
5320 /* Check if instruction is supported on specified architecture. */
5321 supported = 0;
5322 for (t = current_templates->start; t < current_templates->end; ++t)
5323 {
5324 supported |= cpu_flags_match (t);
5325 if (supported == CPU_FLAGS_PERFECT_MATCH)
5326 {
5327 if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
5328 as_warn (_("use .code16 to ensure correct addressing mode"));
5329
5330 return l;
5331 }
5332 }
5333
5334 if (!(supported & CPU_FLAGS_64BIT_MATCH))
5335 as_bad (flag_code == CODE_64BIT
5336 ? _("`%s' is not supported in 64-bit mode")
5337 : _("`%s' is only supported in 64-bit mode"),
5338 current_templates->start->name);
5339 else
5340 as_bad (_("`%s' is not supported on `%s%s'"),
5341 current_templates->start->name,
5342 cpu_arch_name ? cpu_arch_name : default_arch,
5343 cpu_sub_arch_name ? cpu_sub_arch_name : "");
5344
5345 return NULL;
5346 }
5347
5348 static char *
5349 parse_operands (char *l, const char *mnemonic)
5350 {
5351 char *token_start;
5352
5353 /* 1 if operand is pending after ','. */
5354 unsigned int expecting_operand = 0;
5355
5356 /* Non-zero if operand parens not balanced. */
5357 unsigned int paren_not_balanced;
5358
5359 while (*l != END_OF_INSN)
5360 {
5361 /* Skip optional white space before operand. */
5362 if (is_space_char (*l))
5363 ++l;
5364 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
5365 {
5366 as_bad (_("invalid character %s before operand %d"),
5367 output_invalid (*l),
5368 i.operands + 1);
5369 return NULL;
5370 }
5371 token_start = l; /* After white space. */
5372 paren_not_balanced = 0;
5373 while (paren_not_balanced || *l != ',')
5374 {
5375 if (*l == END_OF_INSN)
5376 {
5377 if (paren_not_balanced)
5378 {
5379 if (!intel_syntax)
5380 as_bad (_("unbalanced parenthesis in operand %d."),
5381 i.operands + 1);
5382 else
5383 as_bad (_("unbalanced brackets in operand %d."),
5384 i.operands + 1);
5385 return NULL;
5386 }
5387 else
5388 break; /* we are done */
5389 }
5390 else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
5391 {
5392 as_bad (_("invalid character %s in operand %d"),
5393 output_invalid (*l),
5394 i.operands + 1);
5395 return NULL;
5396 }
5397 if (!intel_syntax)
5398 {
5399 if (*l == '(')
5400 ++paren_not_balanced;
5401 if (*l == ')')
5402 --paren_not_balanced;
5403 }
5404 else
5405 {
5406 if (*l == '[')
5407 ++paren_not_balanced;
5408 if (*l == ']')
5409 --paren_not_balanced;
5410 }
5411 l++;
5412 }
5413 if (l != token_start)
5414 { /* Yes, we've read in another operand. */
5415 unsigned int operand_ok;
5416 this_operand = i.operands++;
5417 if (i.operands > MAX_OPERANDS)
5418 {
5419 as_bad (_("spurious operands; (%d operands/instruction max)"),
5420 MAX_OPERANDS);
5421 return NULL;
5422 }
5423 i.types[this_operand].bitfield.unspecified = 1;
5424 /* Now parse operand adding info to 'i' as we go along. */
5425 END_STRING_AND_SAVE (l);
5426
5427 if (i.mem_operands > 1)
5428 {
5429 as_bad (_("too many memory references for `%s'"),
5430 mnemonic);
5431 return 0;
5432 }
5433
5434 if (intel_syntax)
5435 operand_ok =
5436 i386_intel_operand (token_start,
5437 intel_float_operand (mnemonic));
5438 else
5439 operand_ok = i386_att_operand (token_start);
5440
5441 RESTORE_END_STRING (l);
5442 if (!operand_ok)
5443 return NULL;
5444 }
5445 else
5446 {
5447 if (expecting_operand)
5448 {
5449 expecting_operand_after_comma:
5450 as_bad (_("expecting operand after ','; got nothing"));
5451 return NULL;
5452 }
5453 if (*l == ',')
5454 {
5455 as_bad (_("expecting operand before ','; got nothing"));
5456 return NULL;
5457 }
5458 }
5459
5460 /* Now *l must be either ',' or END_OF_INSN. */
5461 if (*l == ',')
5462 {
5463 if (*++l == END_OF_INSN)
5464 {
5465 /* The comma was the last thing on the line; complain. */
5466 goto expecting_operand_after_comma;
5467 }
5468 expecting_operand = 1;
5469 }
5470 }
5471 return l;
5472 }
5473
5474 static void
5475 swap_2_operands (int xchg1, int xchg2)
5476 {
5477 union i386_op temp_op;
5478 i386_operand_type temp_type;
5479 unsigned int temp_flags;
5480 enum bfd_reloc_code_real temp_reloc;
5481
5482 temp_type = i.types[xchg2];
5483 i.types[xchg2] = i.types[xchg1];
5484 i.types[xchg1] = temp_type;
5485
5486 temp_flags = i.flags[xchg2];
5487 i.flags[xchg2] = i.flags[xchg1];
5488 i.flags[xchg1] = temp_flags;
5489
5490 temp_op = i.op[xchg2];
5491 i.op[xchg2] = i.op[xchg1];
5492 i.op[xchg1] = temp_op;
5493
5494 temp_reloc = i.reloc[xchg2];
5495 i.reloc[xchg2] = i.reloc[xchg1];
5496 i.reloc[xchg1] = temp_reloc;
5497
5498 if (i.mask)
5499 {
5500 if (i.mask->operand == xchg1)
5501 i.mask->operand = xchg2;
5502 else if (i.mask->operand == xchg2)
5503 i.mask->operand = xchg1;
5504 }
5505 if (i.broadcast)
5506 {
5507 if (i.broadcast->operand == xchg1)
5508 i.broadcast->operand = xchg2;
5509 else if (i.broadcast->operand == xchg2)
5510 i.broadcast->operand = xchg1;
5511 }
5512 if (i.rounding)
5513 {
5514 if (i.rounding->operand == xchg1)
5515 i.rounding->operand = xchg2;
5516 else if (i.rounding->operand == xchg2)
5517 i.rounding->operand = xchg1;
5518 }
5519 }
5520
5521 static void
5522 swap_operands (void)
5523 {
5524 switch (i.operands)
5525 {
5526 case 5:
5527 case 4:
5528 swap_2_operands (1, i.operands - 2);
5529 /* Fall through. */
5530 case 3:
5531 case 2:
5532 swap_2_operands (0, i.operands - 1);
5533 break;
5534 default:
5535 abort ();
5536 }
5537
5538 if (i.mem_operands == 2)
5539 {
5540 const seg_entry *temp_seg;
5541 temp_seg = i.seg[0];
5542 i.seg[0] = i.seg[1];
5543 i.seg[1] = temp_seg;
5544 }
5545 }
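/* Example (illustrative): Intel-syntax `mov eax, ebx' is parsed as
   (eax, ebx) and swapped here to the AT&T-internal source-first
   order (ebx, eax) before template matching. */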
5546
5547 /* Try to ensure constant immediates are represented in the smallest
5548 opcode possible. */
5549 static void
5550 optimize_imm (void)
5551 {
5552 char guess_suffix = 0;
5553 int op;
5554
5555 if (i.suffix)
5556 guess_suffix = i.suffix;
5557 else if (i.reg_operands)
5558 {
5559 /* Figure out a suffix from the last register operand specified.
5560 We can't do this properly yet, i.e. excluding special register
5561 instances, but the following works for instructions with
5562 immediates. In any case, we can't set i.suffix yet. */
5563 for (op = i.operands; --op >= 0;)
5564 if (i.types[op].bitfield.class != Reg)
5565 continue;
5566 else if (i.types[op].bitfield.byte)
5567 {
5568 guess_suffix = BYTE_MNEM_SUFFIX;
5569 break;
5570 }
5571 else if (i.types[op].bitfield.word)
5572 {
5573 guess_suffix = WORD_MNEM_SUFFIX;
5574 break;
5575 }
5576 else if (i.types[op].bitfield.dword)
5577 {
5578 guess_suffix = LONG_MNEM_SUFFIX;
5579 break;
5580 }
5581 else if (i.types[op].bitfield.qword)
5582 {
5583 guess_suffix = QWORD_MNEM_SUFFIX;
5584 break;
5585 }
5586 }
5587 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5588 guess_suffix = WORD_MNEM_SUFFIX;
5589
5590 for (op = i.operands; --op >= 0;)
5591 if (operand_type_check (i.types[op], imm))
5592 {
5593 switch (i.op[op].imms->X_op)
5594 {
5595 case O_constant:
5596 /* If a suffix is given, this operand may be shortened. */
5597 switch (guess_suffix)
5598 {
5599 case LONG_MNEM_SUFFIX:
5600 i.types[op].bitfield.imm32 = 1;
5601 i.types[op].bitfield.imm64 = 1;
5602 break;
5603 case WORD_MNEM_SUFFIX:
5604 i.types[op].bitfield.imm16 = 1;
5605 i.types[op].bitfield.imm32 = 1;
5606 i.types[op].bitfield.imm32s = 1;
5607 i.types[op].bitfield.imm64 = 1;
5608 break;
5609 case BYTE_MNEM_SUFFIX:
5610 i.types[op].bitfield.imm8 = 1;
5611 i.types[op].bitfield.imm8s = 1;
5612 i.types[op].bitfield.imm16 = 1;
5613 i.types[op].bitfield.imm32 = 1;
5614 i.types[op].bitfield.imm32s = 1;
5615 i.types[op].bitfield.imm64 = 1;
5616 break;
5617 }
5618
5619 /* If this operand is at most 16 bits, convert it
5620 to a signed 16 bit number before trying to see
5621 whether it will fit in an even smaller size.
5622 This allows a 16-bit operand such as $0xffe0 to
5623 be recognised as within Imm8S range. */
5624 if ((i.types[op].bitfield.imm16)
5625 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
5626 {
5627 i.op[op].imms->X_add_number =
5628 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5629 }
5630 #ifdef BFD64
5631 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
5632 if ((i.types[op].bitfield.imm32)
5633 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5634 == 0))
5635 {
5636 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5637 ^ ((offsetT) 1 << 31))
5638 - ((offsetT) 1 << 31));
5639 }
5640 #endif
5641 i.types[op]
5642 = operand_type_or (i.types[op],
5643 smallest_imm_type (i.op[op].imms->X_add_number));
5644
5645 /* We must avoid matching of Imm32 templates when 64bit
5646 only immediate is available. */
5647 if (guess_suffix == QWORD_MNEM_SUFFIX)
5648 i.types[op].bitfield.imm32 = 0;
5649 break;
5650
5651 case O_absent:
5652 case O_register:
5653 abort ();
5654
5655 /* Symbols and expressions. */
5656 default:
5657 /* Convert symbolic operand to proper sizes for matching, but don't
5658 prevent matching a set of insns that only supports sizes other
5659 than those matching the insn suffix. */
5660 {
5661 i386_operand_type mask, allowed;
5662 const insn_template *t;
5663
5664 operand_type_set (&mask, 0);
5665 operand_type_set (&allowed, 0);
5666
5667 for (t = current_templates->start;
5668 t < current_templates->end;
5669 ++t)
5670 {
5671 allowed = operand_type_or (allowed, t->operand_types[op]);
5672 allowed = operand_type_and (allowed, anyimm);
5673 }
5674 switch (guess_suffix)
5675 {
5676 case QWORD_MNEM_SUFFIX:
5677 mask.bitfield.imm64 = 1;
5678 mask.bitfield.imm32s = 1;
5679 break;
5680 case LONG_MNEM_SUFFIX:
5681 mask.bitfield.imm32 = 1;
5682 break;
5683 case WORD_MNEM_SUFFIX:
5684 mask.bitfield.imm16 = 1;
5685 break;
5686 case BYTE_MNEM_SUFFIX:
5687 mask.bitfield.imm8 = 1;
5688 break;
5689 default:
5690 break;
5691 }
5692 allowed = operand_type_and (mask, allowed);
5693 if (!operand_type_all_zero (&allowed))
5694 i.types[op] = operand_type_and (i.types[op], mask);
5695 }
5696 break;
5697 }
5698 }
5699 }
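/* Worked example (illustrative): in 16-bit code, the immediate of
   `addw $0xffe0, %bx' is first narrowed to the signed value -32,
   which then matches Imm8S, so the 3-byte 83 C3 E0 encoding is used
   instead of the 4-byte 81 C3 E0 FF one. */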
5700
5701 /* Try to use the smallest displacement type too. */
5702 static void
5703 optimize_disp (void)
5704 {
5705 int op;
5706
5707 for (op = i.operands; --op >= 0;)
5708 if (operand_type_check (i.types[op], disp))
5709 {
5710 if (i.op[op].disps->X_op == O_constant)
5711 {
5712 offsetT op_disp = i.op[op].disps->X_add_number;
5713
5714 if (i.types[op].bitfield.disp16
5715 && (op_disp & ~(offsetT) 0xffff) == 0)
5716 {
5717 /* If this operand is at most 16 bits, convert
5718 to a signed 16 bit number and don't use 64bit
5719 displacement. */
5720 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5721 i.types[op].bitfield.disp64 = 0;
5722 }
5723 #ifdef BFD64
5724 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
5725 if (i.types[op].bitfield.disp32
5726 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5727 {
5728 /* If this operand is at most 32 bits, convert
5729 to a signed 32 bit number and don't use 64bit
5730 displacement. */
5731 op_disp &= (((offsetT) 2 << 31) - 1);
5732 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5733 i.types[op].bitfield.disp64 = 0;
5734 }
5735 #endif
5736 if (!op_disp && i.types[op].bitfield.baseindex)
5737 {
5738 i.types[op].bitfield.disp8 = 0;
5739 i.types[op].bitfield.disp16 = 0;
5740 i.types[op].bitfield.disp32 = 0;
5741 i.types[op].bitfield.disp32s = 0;
5742 i.types[op].bitfield.disp64 = 0;
5743 i.op[op].disps = 0;
5744 i.disp_operands--;
5745 }
5746 else if (flag_code == CODE_64BIT)
5747 {
5748 if (fits_in_signed_long (op_disp))
5749 {
5750 i.types[op].bitfield.disp64 = 0;
5751 i.types[op].bitfield.disp32s = 1;
5752 }
5753 if (i.prefix[ADDR_PREFIX]
5754 && fits_in_unsigned_long (op_disp))
5755 i.types[op].bitfield.disp32 = 1;
5756 }
5757 if ((i.types[op].bitfield.disp32
5758 || i.types[op].bitfield.disp32s
5759 || i.types[op].bitfield.disp16)
5760 && fits_in_disp8 (op_disp))
5761 i.types[op].bitfield.disp8 = 1;
5762 }
5763 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5764 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5765 {
5766 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5767 i.op[op].disps, 0, i.reloc[op]);
5768 i.types[op].bitfield.disp8 = 0;
5769 i.types[op].bitfield.disp16 = 0;
5770 i.types[op].bitfield.disp32 = 0;
5771 i.types[op].bitfield.disp32s = 0;
5772 i.types[op].bitfield.disp64 = 0;
5773 }
5774 else
5775 /* We only support 64bit displacement on constants. */
5776 i.types[op].bitfield.disp64 = 0;
5777 }
5778 }
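/* Worked example (illustrative): `movl 0(%eax), %ebx' drops the
   zero displacement entirely (8B 18, mod=00), and `movl 64(%eax),
   %ebx' keeps a disp8 (8B 58 40) rather than the disp32 form. */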
5779
5780 /* Return 1 if there is a match in broadcast bytes between operand
5781 GIVEN and instruction template T. */
5782
5783 static INLINE int
5784 match_broadcast_size (const insn_template *t, unsigned int given)
5785 {
5786 return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5787 && i.types[given].bitfield.byte)
5788 || (t->opcode_modifier.broadcast == WORD_BROADCAST
5789 && i.types[given].bitfield.word)
5790 || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5791 && i.types[given].bitfield.dword)
5792 || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5793 && i.types[given].bitfield.qword));
5794 }
5795
5796 /* Check if operands are valid for the instruction. */
5797
5798 static int
5799 check_VecOperands (const insn_template *t)
5800 {
5801 unsigned int op;
5802 i386_cpu_flags cpu;
5803
5804 /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5805 any one operand are implicity requiring AVX512VL support if the actual
5806 operand size is YMMword or XMMword. Since this function runs after
5807 template matching, there's no need to check for YMMword/XMMword in
5808 the template. */
5809 cpu = cpu_flags_and (t->cpu_flags, avx512);
5810 if (!cpu_flags_all_zero (&cpu)
5811 && !t->cpu_flags.bitfield.cpuavx512vl
5812 && !cpu_arch_flags.bitfield.cpuavx512vl)
5813 {
5814 for (op = 0; op < t->operands; ++op)
5815 {
5816 if (t->operand_types[op].bitfield.zmmword
5817 && (i.types[op].bitfield.ymmword
5818 || i.types[op].bitfield.xmmword))
5819 {
5820 i.error = unsupported;
5821 return 1;
5822 }
5823 }
5824 }
5825
5826 /* Without VSIB byte, we can't have a vector register for index. */
5827 if (!t->opcode_modifier.sib
5828 && i.index_reg
5829 && (i.index_reg->reg_type.bitfield.xmmword
5830 || i.index_reg->reg_type.bitfield.ymmword
5831 || i.index_reg->reg_type.bitfield.zmmword))
5832 {
5833 i.error = unsupported_vector_index_register;
5834 return 1;
5835 }
5836
5837 /* Check if default mask is allowed. */
5838 if (t->opcode_modifier.nodefmask
5839 && (!i.mask || i.mask->mask->reg_num == 0))
5840 {
5841 i.error = no_default_mask;
5842 return 1;
5843 }
5844
5845 /* For VSIB byte, we need a vector register for index, and all vector
5846 registers must be distinct. */
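/* E.g. a VECSIB128 gather such as VEX-encoded vgatherdps takes an
   %xmm index register; the checks below also diagnose mask, index,
   and destination registers that are not pairwise distinct.  */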
5847 if (t->opcode_modifier.sib && t->opcode_modifier.sib != SIBMEM)
5848 {
5849 if (!i.index_reg
5850 || !((t->opcode_modifier.sib == VECSIB128
5851 && i.index_reg->reg_type.bitfield.xmmword)
5852 || (t->opcode_modifier.sib == VECSIB256
5853 && i.index_reg->reg_type.bitfield.ymmword)
5854 || (t->opcode_modifier.sib == VECSIB512
5855 && i.index_reg->reg_type.bitfield.zmmword)))
5856 {
5857 i.error = invalid_vsib_address;
5858 return 1;
5859 }
5860
5861 gas_assert (i.reg_operands == 2 || i.mask);
5862 if (i.reg_operands == 2 && !i.mask)
5863 {
5864 gas_assert (i.types[0].bitfield.class == RegSIMD);
5865 gas_assert (i.types[0].bitfield.xmmword
5866 || i.types[0].bitfield.ymmword);
5867 gas_assert (i.types[2].bitfield.class == RegSIMD);
5868 gas_assert (i.types[2].bitfield.xmmword
5869 || i.types[2].bitfield.ymmword);
5870 if (operand_check == check_none)
5871 return 0;
5872 if (register_number (i.op[0].regs)
5873 != register_number (i.index_reg)
5874 && register_number (i.op[2].regs)
5875 != register_number (i.index_reg)
5876 && register_number (i.op[0].regs)
5877 != register_number (i.op[2].regs))
5878 return 0;
5879 if (operand_check == check_error)
5880 {
5881 i.error = invalid_vector_register_set;
5882 return 1;
5883 }
5884 as_warn (_("mask, index, and destination registers should be distinct"));
5885 }
5886 else if (i.reg_operands == 1 && i.mask)
5887 {
5888 if (i.types[1].bitfield.class == RegSIMD
5889 && (i.types[1].bitfield.xmmword
5890 || i.types[1].bitfield.ymmword
5891 || i.types[1].bitfield.zmmword)
5892 && (register_number (i.op[1].regs)
5893 == register_number (i.index_reg)))
5894 {
5895 if (operand_check == check_error)
5896 {
5897 i.error = invalid_vector_register_set;
5898 return 1;
5899 }
5900 if (operand_check != check_none)
5901 as_warn (_("index and destination registers should be distinct"));
5902 }
5903 }
5904 }
5905
5906 /* For AMX instructions with three tmmword operands, all tmmword
5907 operands must be distinct.  */
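/* E.g. AMX-INT8's "tdpbssd %tmm1, %tmm2, %tmm3" is accepted here,
   while "tdpbssd %tmm1, %tmm2, %tmm2" is rejected with
   invalid_tmm_register_set.  */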
5908 if (t->operand_types[0].bitfield.tmmword
5909 && i.reg_operands == 3)
5910 {
5911 if (register_number (i.op[0].regs)
5912 == register_number (i.op[1].regs)
5913 || register_number (i.op[0].regs)
5914 == register_number (i.op[2].regs)
5915 || register_number (i.op[1].regs)
5916 == register_number (i.op[2].regs))
5917 {
5918 i.error = invalid_tmm_register_set;
5919 return 1;
5920 }
5921 }
5922
5923 /* Check if broadcast is supported by the instruction and is applied
5924 to the memory operand. */
5925 if (i.broadcast)
5926 {
5927 i386_operand_type type, overlap;
5928
5929 /* Check if specified broadcast is supported in this instruction,
5930 and that its broadcast bytes match the memory operand. */
5931 op = i.broadcast->operand;
5932 if (!t->opcode_modifier.broadcast
5933 || !(i.flags[op] & Operand_Mem)
5934 || (!i.types[op].bitfield.unspecified
5935 && !match_broadcast_size (t, op)))
5936 {
5937 bad_broadcast:
5938 i.error = unsupported_broadcast;
5939 return 1;
5940 }
5941
5942 i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5943 * i.broadcast->type);
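/* E.g. for a dword-element broadcast ({1to16} on a 512-bit insn):
   1 << (DWORD_BROADCAST - 1) is 4 bytes per element, and a broadcast
   type of 16 elements then yields 64 bytes, which the switch below
   classifies as zmmword.  */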
5944 operand_type_set (&type, 0);
5945 switch (i.broadcast->bytes)
5946 {
5947 case 2:
5948 type.bitfield.word = 1;
5949 break;
5950 case 4:
5951 type.bitfield.dword = 1;
5952 break;
5953 case 8:
5954 type.bitfield.qword = 1;
5955 break;
5956 case 16:
5957 type.bitfield.xmmword = 1;
5958 break;
5959 case 32:
5960 type.bitfield.ymmword = 1;
5961 break;
5962 case 64:
5963 type.bitfield.zmmword = 1;
5964 break;
5965 default:
5966 goto bad_broadcast;
5967 }
5968
5969 overlap = operand_type_and (type, t->operand_types[op]);
5970 if (t->operand_types[op].bitfield.class == RegSIMD
5971 && t->operand_types[op].bitfield.byte
5972 + t->operand_types[op].bitfield.word
5973 + t->operand_types[op].bitfield.dword
5974 + t->operand_types[op].bitfield.qword > 1)
5975 {
5976 overlap.bitfield.xmmword = 0;
5977 overlap.bitfield.ymmword = 0;
5978 overlap.bitfield.zmmword = 0;
5979 }
5980 if (operand_type_all_zero (&overlap))
5981 goto bad_broadcast;
5982
5983 if (t->opcode_modifier.checkregsize)
5984 {
5985 unsigned int j;
5986
5987 type.bitfield.baseindex = 1;
5988 for (j = 0; j < i.operands; ++j)
5989 {
5990 if (j != op
5991 && !operand_type_register_match(i.types[j],
5992 t->operand_types[j],
5993 type,
5994 t->operand_types[op]))
5995 goto bad_broadcast;
5996 }
5997 }
5998 }
5999 /* If the instruction supports broadcast, we need to check that an
6000 operand of one-element size isn't specified without broadcast. */
6001 else if (t->opcode_modifier.broadcast && i.mem_operands)
6002 {
6003 /* Find memory operand. */
6004 for (op = 0; op < i.operands; op++)
6005 if (i.flags[op] & Operand_Mem)
6006 break;
6007 gas_assert (op < i.operands);
6008 /* Check size of the memory operand. */
6009 if (match_broadcast_size (t, op))
6010 {
6011 i.error = broadcast_needed;
6012 return 1;
6013 }
6014 }
6015 else
6016 op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning. */
6017
6018 /* Check if requested masking is supported. */
6019 if (i.mask)
6020 {
6021 switch (t->opcode_modifier.masking)
6022 {
6023 case BOTH_MASKING:
6024 break;
6025 case MERGING_MASKING:
6026 if (i.mask->zeroing)
6027 {
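/* NB: the "case 0:" label below is entered directly from the switch
   header when the template supports no masking at all, sharing this
   error path with zeroing-masking used on a merging-only template.  */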
6028 case 0:
6029 i.error = unsupported_masking;
6030 return 1;
6031 }
6032 break;
6033 case DYNAMIC_MASKING:
6034 /* Memory destinations allow only merging masking. */
6035 if (i.mask->zeroing && i.mem_operands)
6036 {
6037 /* Find memory operand. */
6038 for (op = 0; op < i.operands; op++)
6039 if (i.flags[op] & Operand_Mem)
6040 break;
6041 gas_assert (op < i.operands);
6042 if (op == i.operands - 1)
6043 {
6044 i.error = unsupported_masking;
6045 return 1;
6046 }
6047 }
6048 break;
6049 default:
6050 abort ();
6051 }
6052 }
6053
6054 /* Check if masking is applied to dest operand. */
6055 if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
6056 {
6057 i.error = mask_not_on_destination;
6058 return 1;
6059 }
6060
6061 /* Check RC/SAE. */
6062 if (i.rounding)
6063 {
6064 if (!t->opcode_modifier.sae
6065 || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
6066 {
6067 i.error = unsupported_rc_sae;
6068 return 1;
6069 }
6070 /* If the instruction has several immediate operands and one of
6071 them is rounding, the rounding operand should be the last
6072 immediate operand. */
6073 if (i.imm_operands > 1
6074 && i.rounding->operand != (int) (i.imm_operands - 1))
6075 {
6076 i.error = rc_sae_operand_not_last_imm;
6077 return 1;
6078 }
6079 }
6080
6081 /* Check the special Imm4 cases; must be the first operand. */
6082 if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
6083 {
6084 if (i.op[0].imms->X_op != O_constant
6085 || !fits_in_imm4 (i.op[0].imms->X_add_number))
6086 {
6087 i.error = bad_imm4;
6088 return 1;
6089 }
6090
6091 /* Turn off Imm<N> so that update_imm won't complain. */
6092 operand_type_set (&i.types[0], 0);
6093 }
6094
6095 /* Check vector Disp8 operand. */
6096 if (t->opcode_modifier.disp8memshift
6097 && i.disp_encoding != disp_encoding_32bit)
6098 {
6099 if (i.broadcast)
6100 i.memshift = t->opcode_modifier.broadcast - 1;
6101 else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
6102 i.memshift = t->opcode_modifier.disp8memshift;
6103 else
6104 {
6105 const i386_operand_type *type = NULL;
6106
6107 i.memshift = 0;
6108 for (op = 0; op < i.operands; op++)
6109 if (i.flags[op] & Operand_Mem)
6110 {
6111 if (t->opcode_modifier.evex == EVEXLIG)
6112 i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
6113 else if (t->operand_types[op].bitfield.xmmword
6114 + t->operand_types[op].bitfield.ymmword
6115 + t->operand_types[op].bitfield.zmmword <= 1)
6116 type = &t->operand_types[op];
6117 else if (!i.types[op].bitfield.unspecified)
6118 type = &i.types[op];
6119 }
6120 else if (i.types[op].bitfield.class == RegSIMD
6121 && t->opcode_modifier.evex != EVEXLIG)
6122 {
6123 if (i.types[op].bitfield.zmmword)
6124 i.memshift = 6;
6125 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
6126 i.memshift = 5;
6127 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
6128 i.memshift = 4;
6129 }
6130
6131 if (type)
6132 {
6133 if (type->bitfield.zmmword)
6134 i.memshift = 6;
6135 else if (type->bitfield.ymmword)
6136 i.memshift = 5;
6137 else if (type->bitfield.xmmword)
6138 i.memshift = 4;
6139 }
6140
6141 /* For the check in fits_in_disp8(). */
6142 if (i.memshift == 0)
6143 i.memshift = -1;
6144 }
6145
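/* E.g. with i.memshift == 6 (a zmmword memory operand), a displacement
   of 0x100 compresses to 0x100 >> 6 == 4, which fits in a signed byte,
   so the EVEX compressed disp8 form is usable.  */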
6146 for (op = 0; op < i.operands; op++)
6147 if (operand_type_check (i.types[op], disp)
6148 && i.op[op].disps->X_op == O_constant)
6149 {
6150 if (fits_in_disp8 (i.op[op].disps->X_add_number))
6151 {
6152 i.types[op].bitfield.disp8 = 1;
6153 return 0;
6154 }
6155 i.types[op].bitfield.disp8 = 0;
6156 }
6157 }
6158
6159 i.memshift = 0;
6160
6161 return 0;
6162 }
6163
6164 /* Check if encoding requirements are met by the instruction. */
6165
6166 static int
6167 VEX_check_encoding (const insn_template *t)
6168 {
6169 if (i.vec_encoding == vex_encoding_error)
6170 {
6171 i.error = unsupported;
6172 return 1;
6173 }
6174
6175 if (i.vec_encoding == vex_encoding_evex)
6176 {
6177 /* This instruction must be encoded with EVEX prefix. */
6178 if (!is_evex_encoding (t))
6179 {
6180 i.error = unsupported;
6181 return 1;
6182 }
6183 return 0;
6184 }
6185
6186 if (!t->opcode_modifier.vex)
6187 {
6188 /* This instruction template doesn't have VEX prefix. */
6189 if (i.vec_encoding != vex_encoding_default)
6190 {
6191 i.error = unsupported;
6192 return 1;
6193 }
6194 return 0;
6195 }
6196
6197 return 0;
6198 }
6199
6200 static const insn_template *
6201 match_template (char mnem_suffix)
6202 {
6203 /* Points to template once we've found it. */
6204 const insn_template *t;
6205 i386_operand_type overlap0, overlap1, overlap2, overlap3;
6206 i386_operand_type overlap4;
6207 unsigned int found_reverse_match;
6208 i386_opcode_modifier suffix_check;
6209 i386_operand_type operand_types [MAX_OPERANDS];
6210 int addr_prefix_disp;
6211 unsigned int j, size_match, check_register;
6212 enum i386_error specific_error = 0;
6213
6214 #if MAX_OPERANDS != 5
6215 # error "MAX_OPERANDS must be 5."
6216 #endif
6217
6218 found_reverse_match = 0;
6219 addr_prefix_disp = -1;
6220
6221 /* Prepare for mnemonic suffix check. */
6222 memset (&suffix_check, 0, sizeof (suffix_check));
6223 switch (mnem_suffix)
6224 {
6225 case BYTE_MNEM_SUFFIX:
6226 suffix_check.no_bsuf = 1;
6227 break;
6228 case WORD_MNEM_SUFFIX:
6229 suffix_check.no_wsuf = 1;
6230 break;
6231 case SHORT_MNEM_SUFFIX:
6232 suffix_check.no_ssuf = 1;
6233 break;
6234 case LONG_MNEM_SUFFIX:
6235 suffix_check.no_lsuf = 1;
6236 break;
6237 case QWORD_MNEM_SUFFIX:
6238 suffix_check.no_qsuf = 1;
6239 break;
6240 default:
6241 /* NB: In Intel syntax, normally we can check for memory operand
6242 size when there is no mnemonic suffix. But jmp and call have
6243 2 different encodings with Dword memory operand size, one with
6244 No_ldSuf and the other without. i.suffix is set to
6245 LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf. */
6246 if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
6247 suffix_check.no_ldsuf = 1;
6248 }
6249
6250 /* Must have right number of operands. */
6251 i.error = number_of_operands_mismatch;
6252
6253 for (t = current_templates->start; t < current_templates->end; t++)
6254 {
6255 addr_prefix_disp = -1;
6256 found_reverse_match = 0;
6257
6258 if (i.operands != t->operands)
6259 continue;
6260
6261 /* Check processor support. */
6262 i.error = unsupported;
6263 if (cpu_flags_match (t) != CPU_FLAGS_PERFECT_MATCH)
6264 continue;
6265
6266 /* Check Pseudo Prefix. */
6267 i.error = unsupported;
6268 if (t->opcode_modifier.pseudovexprefix
6269 && !(i.vec_encoding == vex_encoding_vex
6270 || i.vec_encoding == vex_encoding_vex3))
6271 continue;
6272
6273 /* Check AT&T mnemonic. */
6274 i.error = unsupported_with_intel_mnemonic;
6275 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
6276 continue;
6277
6278 /* Check AT&T/Intel syntax. */
6279 i.error = unsupported_syntax;
6280 if ((intel_syntax && t->opcode_modifier.attsyntax)
6281 || (!intel_syntax && t->opcode_modifier.intelsyntax))
6282 continue;
6283
6284 /* Check Intel64/AMD64 ISA. */
6285 switch (isa64)
6286 {
6287 default:
6288 /* Default: Don't accept Intel64. */
6289 if (t->opcode_modifier.isa64 == INTEL64)
6290 continue;
6291 break;
6292 case amd64:
6293 /* -mamd64: Don't accept Intel64 and Intel64 only. */
6294 if (t->opcode_modifier.isa64 >= INTEL64)
6295 continue;
6296 break;
6297 case intel64:
6298 /* -mintel64: Don't accept AMD64. */
6299 if (t->opcode_modifier.isa64 == AMD64 && flag_code == CODE_64BIT)
6300 continue;
6301 break;
6302 }
6303
6304 /* Check the suffix. */
6305 i.error = invalid_instruction_suffix;
6306 if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
6307 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
6308 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
6309 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
6310 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
6311 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
6312 continue;
6313
6314 size_match = operand_size_match (t);
6315 if (!size_match)
6316 continue;
6317
6318 /* This is intentionally not
6319
6320 if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
6321
6322 as the case of a missing * on the operand is accepted (perhaps with
6323 a warning, issued further down). */
6324 if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
6325 {
6326 i.error = operand_type_mismatch;
6327 continue;
6328 }
6329
6330 for (j = 0; j < MAX_OPERANDS; j++)
6331 operand_types[j] = t->operand_types[j];
6332
6333 /* In general, don't allow
6334 - 64-bit operands outside of 64-bit mode,
6335 - 32-bit operands on pre-386. */
6336 j = i.imm_operands + (t->operands > i.imm_operands + 1);
6337 if (((i.suffix == QWORD_MNEM_SUFFIX
6338 && flag_code != CODE_64BIT
6339 && !(t->base_opcode == 0xfc7
6340 && i.tm.opcode_modifier.opcodeprefix == 0
6341 && t->extension_opcode == 1) /* cmpxchg8b */)
6342 || (i.suffix == LONG_MNEM_SUFFIX
6343 && !cpu_arch_flags.bitfield.cpui386))
6344 && (intel_syntax
6345 ? (t->opcode_modifier.mnemonicsize != IGNORESIZE
6346 && !intel_float_operand (t->name))
6347 : intel_float_operand (t->name) != 2)
6348 && (t->operands == i.imm_operands
6349 || (operand_types[i.imm_operands].bitfield.class != RegMMX
6350 && operand_types[i.imm_operands].bitfield.class != RegSIMD
6351 && operand_types[i.imm_operands].bitfield.class != RegMask)
6352 || (operand_types[j].bitfield.class != RegMMX
6353 && operand_types[j].bitfield.class != RegSIMD
6354 && operand_types[j].bitfield.class != RegMask))
6355 && !t->opcode_modifier.sib)
6356 continue;
6357
6358 /* Do not verify operands when there are none. */
6359 if (!t->operands)
6360 {
6361 if (VEX_check_encoding (t))
6362 {
6363 specific_error = i.error;
6364 continue;
6365 }
6366
6367 /* We've found a match; break out of loop. */
6368 break;
6369 }
6370
6371 if (!t->opcode_modifier.jump
6372 || t->opcode_modifier.jump == JUMP_ABSOLUTE)
6373 {
6374 /* There should be only one Disp operand. */
6375 for (j = 0; j < MAX_OPERANDS; j++)
6376 if (operand_type_check (operand_types[j], disp))
6377 break;
6378 if (j < MAX_OPERANDS)
6379 {
6380 bfd_boolean override = (i.prefix[ADDR_PREFIX] != 0);
6381
6382 addr_prefix_disp = j;
6383
6384 /* Address size prefix will turn Disp64/Disp32S/Disp32/Disp16
6385 operand into Disp32/Disp32/Disp16/Disp32 operand. */
6386 switch (flag_code)
6387 {
6388 case CODE_16BIT:
6389 override = !override;
6390 /* Fall through. */
6391 case CODE_32BIT:
6392 if (operand_types[j].bitfield.disp32
6393 && operand_types[j].bitfield.disp16)
6394 {
6395 operand_types[j].bitfield.disp16 = override;
6396 operand_types[j].bitfield.disp32 = !override;
6397 }
6398 operand_types[j].bitfield.disp32s = 0;
6399 operand_types[j].bitfield.disp64 = 0;
6400 break;
6401
6402 case CODE_64BIT:
6403 if (operand_types[j].bitfield.disp32s
6404 || operand_types[j].bitfield.disp64)
6405 {
6406 operand_types[j].bitfield.disp64 &= !override;
6407 operand_types[j].bitfield.disp32s &= !override;
6408 operand_types[j].bitfield.disp32 = override;
6409 }
6410 operand_types[j].bitfield.disp16 = 0;
6411 break;
6412 }
6413 }
6414 }
6415
6416 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
6417 if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
6418 continue;
6419
6420 /* We check register size if needed. */
6421 if (t->opcode_modifier.checkregsize)
6422 {
6423 check_register = (1 << t->operands) - 1;
6424 if (i.broadcast)
6425 check_register &= ~(1 << i.broadcast->operand);
6426 }
6427 else
6428 check_register = 0;
6429
6430 overlap0 = operand_type_and (i.types[0], operand_types[0]);
6431 switch (t->operands)
6432 {
6433 case 1:
6434 if (!operand_type_match (overlap0, i.types[0]))
6435 continue;
6436 break;
6437 case 2:
6438 /* xchg %eax, %eax is a special case. It is an alias for nop
6439 only in 32bit mode and we can use opcode 0x90. In 64bit
6440 mode, we can't use 0x90 for xchg %eax, %eax since it should
6441 zero-extend %eax to %rax. */
6442 if (flag_code == CODE_64BIT
6443 && t->base_opcode == 0x90
6444 && i.types[0].bitfield.instance == Accum
6445 && i.types[0].bitfield.dword
6446 && i.types[1].bitfield.instance == Accum
6447 && i.types[1].bitfield.dword)
6448 continue;
6449 /* xrelease mov %eax, <disp> is another special case. It must not
6450 match the accumulator-only encoding of mov. */
6451 if (flag_code != CODE_64BIT
6452 && i.hle_prefix
6453 && t->base_opcode == 0xa0
6454 && i.types[0].bitfield.instance == Accum
6455 && (i.flags[1] & Operand_Mem))
6456 continue;
6457 /* Fall through. */
6458
6459 case 3:
6460 if (!(size_match & MATCH_STRAIGHT))
6461 goto check_reverse;
6462 /* Reverse direction of operands if swapping is possible in the first
6463 place (operands need to be symmetric) and
6464 - the load form is requested, and the template is a store form,
6465 - the store form is requested, and the template is a load form,
6466 - the non-default (swapped) form is requested. */
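/* E.g. register-to-register "mov" has a store form (opcode 0x89) and
   a load form (0x8b) differing only in the direction bit; the "{load}"
   and "{store}" pseudo prefixes select between them via i.dir_encoding
   here.  */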
6467 overlap1 = operand_type_and (operand_types[0], operand_types[1]);
6468 if (t->opcode_modifier.d && i.reg_operands == i.operands
6469 && !operand_type_all_zero (&overlap1))
6470 switch (i.dir_encoding)
6471 {
6472 case dir_encoding_load:
6473 if (operand_type_check (operand_types[i.operands - 1], anymem)
6474 || t->opcode_modifier.regmem)
6475 goto check_reverse;
6476 break;
6477
6478 case dir_encoding_store:
6479 if (!operand_type_check (operand_types[i.operands - 1], anymem)
6480 && !t->opcode_modifier.regmem)
6481 goto check_reverse;
6482 break;
6483
6484 case dir_encoding_swap:
6485 goto check_reverse;
6486
6487 case dir_encoding_default:
6488 break;
6489 }
6490 /* If we want store form, we skip the current load. */
6491 if ((i.dir_encoding == dir_encoding_store
6492 || i.dir_encoding == dir_encoding_swap)
6493 && i.mem_operands == 0
6494 && t->opcode_modifier.load)
6495 continue;
6496 /* Fall through. */
6497 case 4:
6498 case 5:
6499 overlap1 = operand_type_and (i.types[1], operand_types[1]);
6500 if (!operand_type_match (overlap0, i.types[0])
6501 || !operand_type_match (overlap1, i.types[1])
6502 || ((check_register & 3) == 3
6503 && !operand_type_register_match (i.types[0],
6504 operand_types[0],
6505 i.types[1],
6506 operand_types[1])))
6507 {
6508 /* Check if other direction is valid ... */
6509 if (!t->opcode_modifier.d)
6510 continue;
6511
6512 check_reverse:
6513 if (!(size_match & MATCH_REVERSE))
6514 continue;
6515 /* Try reversing direction of operands. */
6516 overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
6517 overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
6518 if (!operand_type_match (overlap0, i.types[0])
6519 || !operand_type_match (overlap1, i.types[i.operands - 1])
6520 || (check_register
6521 && !operand_type_register_match (i.types[0],
6522 operand_types[i.operands - 1],
6523 i.types[i.operands - 1],
6524 operand_types[0])))
6525 {
6526 /* Does not match either direction. */
6527 continue;
6528 }
6529 /* found_reverse_match holds which of D or FloatR
6530 we've found. */
6531 if (!t->opcode_modifier.d)
6532 found_reverse_match = 0;
6533 else if (operand_types[0].bitfield.tbyte)
6534 found_reverse_match = Opcode_FloatD;
6535 else if (operand_types[0].bitfield.xmmword
6536 || operand_types[i.operands - 1].bitfield.xmmword
6537 || operand_types[0].bitfield.class == RegMMX
6538 || operand_types[i.operands - 1].bitfield.class == RegMMX
6539 || is_any_vex_encoding(t))
6540 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
6541 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
6542 else
6543 found_reverse_match = Opcode_D;
6544 if (t->opcode_modifier.floatr)
6545 found_reverse_match |= Opcode_FloatR;
6546 }
6547 else
6548 {
6549 /* Found a forward 2 operand match here. */
6550 switch (t->operands)
6551 {
6552 case 5:
6553 overlap4 = operand_type_and (i.types[4],
6554 operand_types[4]);
6555 /* Fall through. */
6556 case 4:
6557 overlap3 = operand_type_and (i.types[3],
6558 operand_types[3]);
6559 /* Fall through. */
6560 case 3:
6561 overlap2 = operand_type_and (i.types[2],
6562 operand_types[2]);
6563 break;
6564 }
6565
6566 switch (t->operands)
6567 {
6568 case 5:
6569 if (!operand_type_match (overlap4, i.types[4])
6570 || !operand_type_register_match (i.types[3],
6571 operand_types[3],
6572 i.types[4],
6573 operand_types[4]))
6574 continue;
6575 /* Fall through. */
6576 case 4:
6577 if (!operand_type_match (overlap3, i.types[3])
6578 || ((check_register & 0xa) == 0xa
6579 && !operand_type_register_match (i.types[1],
6580 operand_types[1],
6581 i.types[3],
6582 operand_types[3]))
6583 || ((check_register & 0xc) == 0xc
6584 && !operand_type_register_match (i.types[2],
6585 operand_types[2],
6586 i.types[3],
6587 operand_types[3])))
6588 continue;
6589 /* Fall through. */
6590 case 3:
6591 /* Here we make use of the fact that there are no
6592 reverse-match 3-operand instructions. */
6593 if (!operand_type_match (overlap2, i.types[2])
6594 || ((check_register & 5) == 5
6595 && !operand_type_register_match (i.types[0],
6596 operand_types[0],
6597 i.types[2],
6598 operand_types[2]))
6599 || ((check_register & 6) == 6
6600 && !operand_type_register_match (i.types[1],
6601 operand_types[1],
6602 i.types[2],
6603 operand_types[2])))
6604 continue;
6605 break;
6606 }
6607 }
6608 /* Found either forward/reverse 2, 3 or 4 operand match here:
6609 slip through to break. */
6610 }
6611
6612 /* Check if vector operands are valid. */
6613 if (check_VecOperands (t))
6614 {
6615 specific_error = i.error;
6616 continue;
6617 }
6618
6619 /* Check if VEX/EVEX encoding requirements can be satisfied. */
6620 if (VEX_check_encoding (t))
6621 {
6622 specific_error = i.error;
6623 continue;
6624 }
6625
6626 /* We've found a match; break out of loop. */
6627 break;
6628 }
6629
6630 if (t == current_templates->end)
6631 {
6632 /* We found no match. */
6633 const char *err_msg;
6634 switch (specific_error ? specific_error : i.error)
6635 {
6636 default:
6637 abort ();
6638 case operand_size_mismatch:
6639 err_msg = _("operand size mismatch");
6640 break;
6641 case operand_type_mismatch:
6642 err_msg = _("operand type mismatch");
6643 break;
6644 case register_type_mismatch:
6645 err_msg = _("register type mismatch");
6646 break;
6647 case number_of_operands_mismatch:
6648 err_msg = _("number of operands mismatch");
6649 break;
6650 case invalid_instruction_suffix:
6651 err_msg = _("invalid instruction suffix");
6652 break;
6653 case bad_imm4:
6654 err_msg = _("constant doesn't fit in 4 bits");
6655 break;
6656 case unsupported_with_intel_mnemonic:
6657 err_msg = _("unsupported with Intel mnemonic");
6658 break;
6659 case unsupported_syntax:
6660 err_msg = _("unsupported syntax");
6661 break;
6662 case unsupported:
6663 as_bad (_("unsupported instruction `%s'"),
6664 current_templates->start->name);
6665 return NULL;
6666 case invalid_sib_address:
6667 err_msg = _("invalid SIB address");
6668 break;
6669 case invalid_vsib_address:
6670 err_msg = _("invalid VSIB address");
6671 break;
6672 case invalid_vector_register_set:
6673 err_msg = _("mask, index, and destination registers must be distinct");
6674 break;
6675 case invalid_tmm_register_set:
6676 err_msg = _("all tmm registers must be distinct");
6677 break;
6678 case unsupported_vector_index_register:
6679 err_msg = _("unsupported vector index register");
6680 break;
6681 case unsupported_broadcast:
6682 err_msg = _("unsupported broadcast");
6683 break;
6684 case broadcast_needed:
6685 err_msg = _("broadcast is needed for operand of such type");
6686 break;
6687 case unsupported_masking:
6688 err_msg = _("unsupported masking");
6689 break;
6690 case mask_not_on_destination:
6691 err_msg = _("mask not on destination operand");
6692 break;
6693 case no_default_mask:
6694 err_msg = _("default mask isn't allowed");
6695 break;
6696 case unsupported_rc_sae:
6697 err_msg = _("unsupported static rounding/sae");
6698 break;
6699 case rc_sae_operand_not_last_imm:
6700 if (intel_syntax)
6701 err_msg = _("RC/SAE operand must precede immediate operands");
6702 else
6703 err_msg = _("RC/SAE operand must follow immediate operands");
6704 break;
6705 case invalid_register_operand:
6706 err_msg = _("invalid register operand");
6707 break;
6708 }
6709 as_bad (_("%s for `%s'"), err_msg,
6710 current_templates->start->name);
6711 return NULL;
6712 }
6713
6714 if (!quiet_warnings)
6715 {
6716 if (!intel_syntax
6717 && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
6718 as_warn (_("indirect %s without `*'"), t->name);
6719
6720 if (t->opcode_modifier.isprefix
6721 && t->opcode_modifier.mnemonicsize == IGNORESIZE)
6722 {
6723 /* Warn them that a data or address size prefix doesn't
6724 affect assembly of the next line of code. */
6725 as_warn (_("stand-alone `%s' prefix"), t->name);
6726 }
6727 }
6728
6729 /* Copy the template we found. */
6730 i.tm = *t;
6731
6732 if (addr_prefix_disp != -1)
6733 i.tm.operand_types[addr_prefix_disp]
6734 = operand_types[addr_prefix_disp];
6735
6736 if (found_reverse_match)
6737 {
6738 /* If we found a reverse match we must alter the opcode direction
6739 bit and clear/flip the regmem modifier bit. found_reverse_match
6740 holds the bits to change (different for int & float insns). */
6741
6742 i.tm.base_opcode ^= found_reverse_match;
6743
6744 i.tm.operand_types[0] = operand_types[i.operands - 1];
6745 i.tm.operand_types[i.operands - 1] = operand_types[0];
6746
6747 /* Certain SIMD insns have their load forms specified in the opcode
6748 table, and hence we need to _set_ RegMem instead of clearing it.
6749 We need to avoid setting the bit though on insns like KMOVW. */
6750 i.tm.opcode_modifier.regmem
6751 = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6752 && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6753 && !i.tm.opcode_modifier.regmem;
6754 }
6755
6756 return t;
6757 }
6758
6759 static int
6760 check_string (void)
6761 {
6762 unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
6763 unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
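/* E.g. the store side of "movs" must use %es: an override such as
   "movsb %ds:(%esi), %fs:(%edi)" is diagnosed here, since hardware
   fixes the destination segment of string stores to %es.  */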
6764
6765 if (i.seg[op] != NULL && i.seg[op] != &es)
6766 {
6767 as_bad (_("`%s' operand %u must use `%ses' segment"),
6768 i.tm.name,
6769 intel_syntax ? i.tm.operands - es_op : es_op + 1,
6770 register_prefix);
6771 return 0;
6772 }
6773
6774 /* There's only ever one segment override allowed per instruction.
6775 This instruction possibly has a legal segment override on the
6776 second operand, so copy the segment to where non-string
6777 instructions store it, allowing common code. */
6778 i.seg[op] = i.seg[1];
6779
6780 return 1;
6781 }
6782
6783 static int
6784 process_suffix (void)
6785 {
6786 bfd_boolean is_crc32 = FALSE;
6787
6788 /* If matched instruction specifies an explicit instruction mnemonic
6789 suffix, use it. */
6790 if (i.tm.opcode_modifier.size == SIZE16)
6791 i.suffix = WORD_MNEM_SUFFIX;
6792 else if (i.tm.opcode_modifier.size == SIZE32)
6793 i.suffix = LONG_MNEM_SUFFIX;
6794 else if (i.tm.opcode_modifier.size == SIZE64)
6795 i.suffix = QWORD_MNEM_SUFFIX;
6796 else if (i.reg_operands
6797 && (i.operands > 1 || i.types[0].bitfield.class == Reg)
6798 && !i.tm.opcode_modifier.addrprefixopreg)
6799 {
6800 unsigned int numop = i.operands;
6801 /* CRC32 */
6802 is_crc32 = (i.tm.base_opcode == 0xf38f0
6803 && i.tm.opcode_modifier.opcodeprefix == PREFIX_0XF2);
6804
6805 /* movsx/movzx want only their source operand considered here, for the
6806 ambiguity checking below. The suffix will be replaced afterwards
6807 to represent the destination (register). */
6808 if (((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w)
6809 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
6810 --i.operands;
6811
6812 /* crc32 needs REX.W set regardless of suffix / source operand size. */
6813 if (is_crc32 && i.tm.operand_types[1].bitfield.qword)
6814 i.rex |= REX_W;
6815
6816 /* If there's no instruction mnemonic suffix we try to invent one
6817 based on GPR operands. */
6818 if (!i.suffix)
6819 {
6820 /* We take i.suffix from the last register operand specified.
6821 The destination register type is more significant than the
6822 source register type. crc32 in SSE4.2 prefers the source
6823 register type. */
6824 unsigned int op = is_crc32 ? 1 : i.operands;
6825
6826 while (op--)
6827 if (i.tm.operand_types[op].bitfield.instance == InstanceNone
6828 || i.tm.operand_types[op].bitfield.instance == Accum)
6829 {
6830 if (i.types[op].bitfield.class != Reg)
6831 continue;
6832 if (i.types[op].bitfield.byte)
6833 i.suffix = BYTE_MNEM_SUFFIX;
6834 else if (i.types[op].bitfield.word)
6835 i.suffix = WORD_MNEM_SUFFIX;
6836 else if (i.types[op].bitfield.dword)
6837 i.suffix = LONG_MNEM_SUFFIX;
6838 else if (i.types[op].bitfield.qword)
6839 i.suffix = QWORD_MNEM_SUFFIX;
6840 else
6841 continue;
6842 break;
6843 }
6844
6845 /* As an exception, movsx/movzx silently default to a byte source
6846 in AT&T mode. */
6847 if ((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w
6848 && !i.suffix && !intel_syntax)
6849 i.suffix = BYTE_MNEM_SUFFIX;
6850 }
6851 else if (i.suffix == BYTE_MNEM_SUFFIX)
6852 {
6853 if (intel_syntax
6854 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6855 && i.tm.opcode_modifier.no_bsuf)
6856 i.suffix = 0;
6857 else if (!check_byte_reg ())
6858 return 0;
6859 }
6860 else if (i.suffix == LONG_MNEM_SUFFIX)
6861 {
6862 if (intel_syntax
6863 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6864 && i.tm.opcode_modifier.no_lsuf
6865 && !i.tm.opcode_modifier.todword
6866 && !i.tm.opcode_modifier.toqword)
6867 i.suffix = 0;
6868 else if (!check_long_reg ())
6869 return 0;
6870 }
6871 else if (i.suffix == QWORD_MNEM_SUFFIX)
6872 {
6873 if (intel_syntax
6874 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6875 && i.tm.opcode_modifier.no_qsuf
6876 && !i.tm.opcode_modifier.todword
6877 && !i.tm.opcode_modifier.toqword)
6878 i.suffix = 0;
6879 else if (!check_qword_reg ())
6880 return 0;
6881 }
6882 else if (i.suffix == WORD_MNEM_SUFFIX)
6883 {
6884 if (intel_syntax
6885 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6886 && i.tm.opcode_modifier.no_wsuf)
6887 i.suffix = 0;
6888 else if (!check_word_reg ())
6889 return 0;
6890 }
6891 else if (intel_syntax
6892 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE)
6893 /* Do nothing if the instruction is going to ignore the prefix. */
6894 ;
6895 else
6896 abort ();
6897
6898 /* Undo the movsx/movzx change done above. */
6899 i.operands = numop;
6900 }
6901 else if (i.tm.opcode_modifier.mnemonicsize == DEFAULTSIZE
6902 && !i.suffix)
6903 {
6904 i.suffix = stackop_size;
6905 if (stackop_size == LONG_MNEM_SUFFIX)
6906 {
6907 /* stackop_size is set to LONG_MNEM_SUFFIX for the
6908 .code16gcc directive to support 16-bit mode with
6909 32-bit addressing. For IRET without a suffix, generate
6910 16-bit IRET (opcode 0xcf) to return from an interrupt
6911 handler. */
6912 if (i.tm.base_opcode == 0xcf)
6913 {
6914 i.suffix = WORD_MNEM_SUFFIX;
6915 as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6916 }
6917 /* Warn about changed behavior for segment register push/pop. */
6918 else if ((i.tm.base_opcode | 1) == 0x07)
6919 as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
6920 i.tm.name);
6921 }
6922 }
6923 else if (!i.suffix
6924 && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
6925 || i.tm.opcode_modifier.jump == JUMP_BYTE
6926 || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
6927 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6928 && i.tm.extension_opcode <= 3)))
6929 {
6930 switch (flag_code)
6931 {
6932 case CODE_64BIT:
6933 if (!i.tm.opcode_modifier.no_qsuf)
6934 {
6935 if (i.tm.opcode_modifier.jump == JUMP_BYTE
6936 || i.tm.opcode_modifier.no_lsuf)
6937 i.suffix = QWORD_MNEM_SUFFIX;
6938 break;
6939 }
6940 /* Fall through. */
6941 case CODE_32BIT:
6942 if (!i.tm.opcode_modifier.no_lsuf)
6943 i.suffix = LONG_MNEM_SUFFIX;
6944 break;
6945 case CODE_16BIT:
6946 if (!i.tm.opcode_modifier.no_wsuf)
6947 i.suffix = WORD_MNEM_SUFFIX;
6948 break;
6949 }
6950 }
6951
6952 if (!i.suffix
6953 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
6954 /* Also cover lret/retf/iret in 64-bit mode. */
6955 || (flag_code == CODE_64BIT
6956 && !i.tm.opcode_modifier.no_lsuf
6957 && !i.tm.opcode_modifier.no_qsuf))
6958 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
6959 /* Explicit sizing prefixes are assumed to disambiguate insns. */
6960 && !i.prefix[DATA_PREFIX] && !(i.prefix[REX_PREFIX] & REX_W)
6961 /* Accept FLDENV et al without suffix. */
6962 && (i.tm.opcode_modifier.no_ssuf || i.tm.opcode_modifier.floatmf))
6963 {
6964 unsigned int suffixes, evex = 0;
6965
6966 suffixes = !i.tm.opcode_modifier.no_bsuf;
6967 if (!i.tm.opcode_modifier.no_wsuf)
6968 suffixes |= 1 << 1;
6969 if (!i.tm.opcode_modifier.no_lsuf)
6970 suffixes |= 1 << 2;
6971 if (!i.tm.opcode_modifier.no_ldsuf)
6972 suffixes |= 1 << 3;
6973 if (!i.tm.opcode_modifier.no_ssuf)
6974 suffixes |= 1 << 4;
6975 if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6976 suffixes |= 1 << 5;
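/* At this point bits 0..5 of SUFFIXES stand for the b/w/l/ld/s/q
   suffixes in that order; bits 6..8 are reserved for the
   xmmword/ymmword/zmmword operand sizes handled below.  */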
6977
6978 /* For [XYZ]MMWORD operands inspect operand sizes. While generally
6979 also suitable for AT&T syntax mode, it was requested that this be
6980 restricted to just Intel syntax. */
6981 if (intel_syntax && is_any_vex_encoding (&i.tm) && !i.broadcast)
6982 {
6983 unsigned int op;
6984
6985 for (op = 0; op < i.tm.operands; ++op)
6986 {
6987 if (is_evex_encoding (&i.tm)
6988 && !cpu_arch_flags.bitfield.cpuavx512vl)
6989 {
6990 if (i.tm.operand_types[op].bitfield.ymmword)
6991 i.tm.operand_types[op].bitfield.xmmword = 0;
6992 if (i.tm.operand_types[op].bitfield.zmmword)
6993 i.tm.operand_types[op].bitfield.ymmword = 0;
6994 if (!i.tm.opcode_modifier.evex
6995 || i.tm.opcode_modifier.evex == EVEXDYN)
6996 i.tm.opcode_modifier.evex = EVEX512;
6997 }
6998
6999 if (i.tm.operand_types[op].bitfield.xmmword
7000 + i.tm.operand_types[op].bitfield.ymmword
7001 + i.tm.operand_types[op].bitfield.zmmword < 2)
7002 continue;
7003
7004 /* Any properly sized operand disambiguates the insn. */
7005 if (i.types[op].bitfield.xmmword
7006 || i.types[op].bitfield.ymmword
7007 || i.types[op].bitfield.zmmword)
7008 {
7009 suffixes &= ~(7 << 6);
7010 evex = 0;
7011 break;
7012 }
7013
7014 if ((i.flags[op] & Operand_Mem)
7015 && i.tm.operand_types[op].bitfield.unspecified)
7016 {
7017 if (i.tm.operand_types[op].bitfield.xmmword)
7018 suffixes |= 1 << 6;
7019 if (i.tm.operand_types[op].bitfield.ymmword)
7020 suffixes |= 1 << 7;
7021 if (i.tm.operand_types[op].bitfield.zmmword)
7022 suffixes |= 1 << 8;
7023 if (is_evex_encoding (&i.tm))
7024 evex = EVEX512;
7025 }
7026 }
7027 }
7028
7029 /* Are multiple suffixes / operand sizes allowed? */
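/* SUFFIXES & (SUFFIXES - 1) is non-zero exactly when more than one
   bit is set, i.e. when more than one size would be acceptable.  */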
7030 if (suffixes & (suffixes - 1))
7031 {
7032 if (intel_syntax
7033 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
7034 || operand_check == check_error))
7035 {
7036 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
7037 return 0;
7038 }
7039 if (operand_check == check_error)
7040 {
7041 as_bad (_("no instruction mnemonic suffix given and "
7042 "no register operands; can't size `%s'"), i.tm.name);
7043 return 0;
7044 }
7045 if (operand_check == check_warning)
7046 as_warn (_("%s; using default for `%s'"),
7047 intel_syntax
7048 ? _("ambiguous operand size")
7049 : _("no instruction mnemonic suffix given and "
7050 "no register operands"),
7051 i.tm.name);
7052
7053 if (i.tm.opcode_modifier.floatmf)
7054 i.suffix = SHORT_MNEM_SUFFIX;
7055 else if ((i.tm.base_opcode | 8) == 0xfbe
7056 || (i.tm.base_opcode == 0x63
7057 && i.tm.cpu_flags.bitfield.cpu64))
7058 /* handled below */;
7059 else if (evex)
7060 i.tm.opcode_modifier.evex = evex;
7061 else if (flag_code == CODE_16BIT)
7062 i.suffix = WORD_MNEM_SUFFIX;
7063 else if (!i.tm.opcode_modifier.no_lsuf)
7064 i.suffix = LONG_MNEM_SUFFIX;
7065 else
7066 i.suffix = QWORD_MNEM_SUFFIX;
7067 }
7068 }
7069
7070 if ((i.tm.base_opcode | 8) == 0xfbe
7071 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
7072 {
7073 /* In Intel syntax, movsx/movzx must have a "suffix" (checked above).
7074 In AT&T syntax, if there is no suffix (warned about above), the default
7075 will be byte extension. */
7076 if (i.tm.opcode_modifier.w && i.suffix && i.suffix != BYTE_MNEM_SUFFIX)
7077 i.tm.base_opcode |= 1;
7078
7079 /* For further processing, the suffix should represent the destination
7080 (register). This is already the case when one was used with
7081 mov[sz][bw]*, but we need to replace it for mov[sz]x, or if there was
7082 no suffix to begin with. */
7083 if (i.tm.opcode_modifier.w || i.tm.base_opcode == 0x63 || !i.suffix)
7084 {
7085 if (i.types[1].bitfield.word)
7086 i.suffix = WORD_MNEM_SUFFIX;
7087 else if (i.types[1].bitfield.qword)
7088 i.suffix = QWORD_MNEM_SUFFIX;
7089 else
7090 i.suffix = LONG_MNEM_SUFFIX;
7091
7092 i.tm.opcode_modifier.w = 0;
7093 }
7094 }
7095
7096 if (!i.tm.opcode_modifier.modrm && i.reg_operands && i.tm.operands < 3)
7097 i.short_form = (i.tm.operand_types[0].bitfield.class == Reg)
7098 != (i.tm.operand_types[1].bitfield.class == Reg);
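/* Short-form encodings place the register number in the low 3 bits of
   the opcode byte instead of using a ModRM byte; e.g. "push %rax" is
   the single byte 0x50, and "push %r8" prepends REX.B to the same
   opcode.  */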
7099
7100 /* Change the opcode based on the operand size given by i.suffix. */
7101 switch (i.suffix)
7102 {
7103 /* Size floating point instruction. */
7104 case LONG_MNEM_SUFFIX:
7105 if (i.tm.opcode_modifier.floatmf)
7106 {
7107 i.tm.base_opcode ^= 4;
7108 break;
7109 }
7110 /* fall through */
7111 case WORD_MNEM_SUFFIX:
7112 case QWORD_MNEM_SUFFIX:
7113 /* It's not a byte, select word/dword operation. */
7114 if (i.tm.opcode_modifier.w)
7115 {
7116 if (i.short_form)
7117 i.tm.base_opcode |= 8;
7118 else
7119 i.tm.base_opcode |= 1;
7120 }
7121 /* fall through */
7122 case SHORT_MNEM_SUFFIX:
7123 /* Now select between word & dword operations via the operand
7124 size prefix, except for instructions that will ignore this
7125 prefix anyway. */
7126 if (i.suffix != QWORD_MNEM_SUFFIX
7127 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
7128 && !i.tm.opcode_modifier.floatmf
7129 && !is_any_vex_encoding (&i.tm)
7130 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
7131 || (flag_code == CODE_64BIT
7132 && i.tm.opcode_modifier.jump == JUMP_BYTE)))
7133 {
7134 unsigned int prefix = DATA_PREFIX_OPCODE;
7135
7136 if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
7137 prefix = ADDR_PREFIX_OPCODE;
7138
7139 if (!add_prefix (prefix))
7140 return 0;
7141 }
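/* E.g. "addw %ax, %bx" assembled for 32-bit code gets the 0x66
   operand size prefix here, while "jcxz" there instead needs 0x67,
   as %cx is an address-sized register for that insn.  */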
7142
7143 /* Set mode64 for an operand. */
7144 if (i.suffix == QWORD_MNEM_SUFFIX
7145 && flag_code == CODE_64BIT
7146 && !i.tm.opcode_modifier.norex64
7147 && !i.tm.opcode_modifier.vexw
7148 /* Special case for xchg %rax,%rax. It is a NOP and doesn't
7149 need rex64. */
7150 && ! (i.operands == 2
7151 && i.tm.base_opcode == 0x90
7152 && i.tm.extension_opcode == None
7153 && i.types[0].bitfield.instance == Accum
7154 && i.types[0].bitfield.qword
7155 && i.types[1].bitfield.instance == Accum
7156 && i.types[1].bitfield.qword))
7157 i.rex |= REX_W;
7158
7159 break;
7160
7161 case 0:
7162 /* Select word/dword/qword operation with explicit data sizing prefix
7163 when there are no suitable register operands. */
7164 if (i.tm.opcode_modifier.w
7165 && (i.prefix[DATA_PREFIX] || (i.prefix[REX_PREFIX] & REX_W))
7166 && (!i.reg_operands
7167 || (i.reg_operands == 1
7168 /* ShiftCount */
7169 && (i.tm.operand_types[0].bitfield.instance == RegC
7170 /* InOutPortReg */
7171 || i.tm.operand_types[0].bitfield.instance == RegD
7172 || i.tm.operand_types[1].bitfield.instance == RegD
7173 /* CRC32 */
7174 || is_crc32))))
7175 i.tm.base_opcode |= 1;
7176 break;
7177 }
7178
7179 if (i.tm.opcode_modifier.addrprefixopreg)
7180 {
7181 gas_assert (!i.suffix);
7182 gas_assert (i.reg_operands);
7183
7184 if (i.tm.operand_types[0].bitfield.instance == Accum
7185 || i.operands == 1)
7186 {
7187 /* The address size override prefix changes the size of the
7188 first operand. */
7189 if (flag_code == CODE_64BIT
7190 && i.op[0].regs->reg_type.bitfield.word)
7191 {
7192 as_bad (_("16-bit addressing unavailable for `%s'"),
7193 i.tm.name);
7194 return 0;
7195 }
7196
7197 if ((flag_code == CODE_32BIT
7198 ? i.op[0].regs->reg_type.bitfield.word
7199 : i.op[0].regs->reg_type.bitfield.dword)
7200 && !add_prefix (ADDR_PREFIX_OPCODE))
7201 return 0;
7202 }
7203 else
7204 {
7205 /* Check invalid register operand when the address size override
7206 prefix changes the size of register operands. */
7207 unsigned int op;
7208 enum { need_word, need_dword, need_qword } need;
7209
7210 /* Check the register operand for the address size prefix if
7211 the memory operand has no real registers, like symbol, DISP
7212 or symbol(%rip). */
7213 if (i.mem_operands == 1
7214 && i.reg_operands == 1
7215 && i.operands == 2
7216 && i.types[1].bitfield.class == Reg
7217 && (flag_code == CODE_32BIT
7218 ? i.op[1].regs->reg_type.bitfield.word
7219 : i.op[1].regs->reg_type.bitfield.dword)
7220 && ((i.base_reg == NULL && i.index_reg == NULL)
7221 || (i.base_reg
7222 && i.base_reg->reg_num == RegIP
7223 && i.base_reg->reg_type.bitfield.qword))
7224 && !add_prefix (ADDR_PREFIX_OPCODE))
7225 return 0;
7226
7227 if (flag_code == CODE_32BIT)
7228 need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
7229 else if (i.prefix[ADDR_PREFIX])
7230 need = need_dword;
7231 else
7232 need = flag_code == CODE_64BIT ? need_qword : need_word;
7233
7234 for (op = 0; op < i.operands; op++)
7235 {
7236 if (i.types[op].bitfield.class != Reg)
7237 continue;
7238
7239 switch (need)
7240 {
7241 case need_word:
7242 if (i.op[op].regs->reg_type.bitfield.word)
7243 continue;
7244 break;
7245 case need_dword:
7246 if (i.op[op].regs->reg_type.bitfield.dword)
7247 continue;
7248 break;
7249 case need_qword:
7250 if (i.op[op].regs->reg_type.bitfield.qword)
7251 continue;
7252 break;
7253 }
7254
7255 as_bad (_("invalid register operand size for `%s'"),
7256 i.tm.name);
7257 return 0;
7258 }
7259 }
7260 }
7261
7262 return 1;
7263 }
7264
7265 static int
7266 check_byte_reg (void)
7267 {
7268 int op;
7269
7270 for (op = i.operands; --op >= 0;)
7271 {
7272 /* Skip non-register operands. */
7273 if (i.types[op].bitfield.class != Reg)
7274 continue;
7275
7276 /* If this is an eight bit register, it's OK. If it's the 16 or
7277 32 bit version of an eight bit register, we will just use the
7278 low portion, and that's OK too. */
7279 if (i.types[op].bitfield.byte)
7280 continue;
7281
7282 /* I/O port address operands are OK too. */
7283 if (i.tm.operand_types[op].bitfield.instance == RegD
7284 && i.tm.operand_types[op].bitfield.word)
7285 continue;
7286
7287 /* crc32 only wants its source operand checked here. */
7288 if (i.tm.base_opcode == 0xf38f0
7289 && i.tm.opcode_modifier.opcodeprefix == PREFIX_0XF2
7290 && op != 0)
7291 continue;
7292
7293 /* Any other register is bad. */
7294 as_bad (_("`%s%s' not allowed with `%s%c'"),
7295 register_prefix, i.op[op].regs->reg_name,
7296 i.tm.name, i.suffix);
7297 return 0;
7298 }
7299 return 1;
7300 }
7301
7302 static int
7303 check_long_reg (void)
7304 {
7305 int op;
7306
7307 for (op = i.operands; --op >= 0;)
7308 /* Skip non-register operands. */
7309 if (i.types[op].bitfield.class != Reg)
7310 continue;
7311 /* Reject eight bit registers, except where the template requires
7312 them. (e.g. movzb) */
7313 else if (i.types[op].bitfield.byte
7314 && (i.tm.operand_types[op].bitfield.class == Reg
7315 || i.tm.operand_types[op].bitfield.instance == Accum)
7316 && (i.tm.operand_types[op].bitfield.word
7317 || i.tm.operand_types[op].bitfield.dword))
7318 {
7319 as_bad (_("`%s%s' not allowed with `%s%c'"),
7320 register_prefix,
7321 i.op[op].regs->reg_name,
7322 i.tm.name,
7323 i.suffix);
7324 return 0;
7325 }
7326 /* Error if the e prefix on a general reg is missing. */
7327 else if (i.types[op].bitfield.word
7328 && (i.tm.operand_types[op].bitfield.class == Reg
7329 || i.tm.operand_types[op].bitfield.instance == Accum)
7330 && i.tm.operand_types[op].bitfield.dword)
7331 {
7332 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7333 register_prefix, i.op[op].regs->reg_name,
7334 i.suffix);
7335 return 0;
7336 }
7337 /* Warn if the r prefix on a general reg is present. */
7338 else if (i.types[op].bitfield.qword
7339 && (i.tm.operand_types[op].bitfield.class == Reg
7340 || i.tm.operand_types[op].bitfield.instance == Accum)
7341 && i.tm.operand_types[op].bitfield.dword)
7342 {
7343 if (intel_syntax
7344 && i.tm.opcode_modifier.toqword
7345 && i.types[0].bitfield.class != RegSIMD)
7346 {
7347 /* Convert to QWORD. We want REX byte. */
7348 i.suffix = QWORD_MNEM_SUFFIX;
7349 }
7350 else
7351 {
7352 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7353 register_prefix, i.op[op].regs->reg_name,
7354 i.suffix);
7355 return 0;
7356 }
7357 }
7358 return 1;
7359 }
7360
7361 static int
7362 check_qword_reg (void)
7363 {
7364 int op;
7365
7366 for (op = i.operands; --op >= 0; )
7367 /* Skip non-register operands. */
7368 if (i.types[op].bitfield.class != Reg)
7369 continue;
7370 /* Reject eight bit registers, except where the template requires
7371 them. (e.g. movzb) */
7372 else if (i.types[op].bitfield.byte
7373 && (i.tm.operand_types[op].bitfield.class == Reg
7374 || i.tm.operand_types[op].bitfield.instance == Accum)
7375 && (i.tm.operand_types[op].bitfield.word
7376 || i.tm.operand_types[op].bitfield.dword))
7377 {
7378 as_bad (_("`%s%s' not allowed with `%s%c'"),
7379 register_prefix,
7380 i.op[op].regs->reg_name,
7381 i.tm.name,
7382 i.suffix);
7383 return 0;
7384 }
7385 /* Warn if the r prefix on a general reg is missing. */
7386 else if ((i.types[op].bitfield.word
7387 || i.types[op].bitfield.dword)
7388 && (i.tm.operand_types[op].bitfield.class == Reg
7389 || i.tm.operand_types[op].bitfield.instance == Accum)
7390 && i.tm.operand_types[op].bitfield.qword)
7391 {
7392 /* Prohibit these changes in 64-bit mode, since the
7393 lowering is more complicated. */
7394 if (intel_syntax
7395 && i.tm.opcode_modifier.todword
7396 && i.types[0].bitfield.class != RegSIMD)
7397 {
7398 /* Convert to DWORD. We don't want REX byte. */
7399 i.suffix = LONG_MNEM_SUFFIX;
7400 }
7401 else
7402 {
7403 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7404 register_prefix, i.op[op].regs->reg_name,
7405 i.suffix);
7406 return 0;
7407 }
7408 }
7409 return 1;
7410 }
7411
7412 static int
7413 check_word_reg (void)
7414 {
7415 int op;
7416 for (op = i.operands; --op >= 0;)
7417 /* Skip non-register operands. */
7418 if (i.types[op].bitfield.class != Reg)
7419 continue;
7420 /* Reject eight bit registers, except where the template requires
7421 them. (eg. movzb) */
7422 else if (i.types[op].bitfield.byte
7423 && (i.tm.operand_types[op].bitfield.class == Reg
7424 || i.tm.operand_types[op].bitfield.instance == Accum)
7425 && (i.tm.operand_types[op].bitfield.word
7426 || i.tm.operand_types[op].bitfield.dword))
7427 {
7428 as_bad (_("`%s%s' not allowed with `%s%c'"),
7429 register_prefix,
7430 i.op[op].regs->reg_name,
7431 i.tm.name,
7432 i.suffix);
7433 return 0;
7434 }
7435 /* Error if the e or r prefix on a general reg is present. */
7436 else if ((i.types[op].bitfield.dword
7437 || i.types[op].bitfield.qword)
7438 && (i.tm.operand_types[op].bitfield.class == Reg
7439 || i.tm.operand_types[op].bitfield.instance == Accum)
7440 && i.tm.operand_types[op].bitfield.word)
7441 {
7442 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7443 register_prefix, i.op[op].regs->reg_name,
7444 i.suffix);
7445 return 0;
7446 }
7447 return 1;
7448 }
7449
7450 static int
7451 update_imm (unsigned int j)
7452 {
7453 i386_operand_type overlap = i.types[j];
7454 if ((overlap.bitfield.imm8
7455 || overlap.bitfield.imm8s
7456 || overlap.bitfield.imm16
7457 || overlap.bitfield.imm32
7458 || overlap.bitfield.imm32s
7459 || overlap.bitfield.imm64)
7460 && !operand_type_equal (&overlap, &imm8)
7461 && !operand_type_equal (&overlap, &imm8s)
7462 && !operand_type_equal (&overlap, &imm16)
7463 && !operand_type_equal (&overlap, &imm32)
7464 && !operand_type_equal (&overlap, &imm32s)
7465 && !operand_type_equal (&overlap, &imm64))
7466 {
7467 if (i.suffix)
7468 {
7469 i386_operand_type temp;
7470
7471 operand_type_set (&temp, 0);
7472 if (i.suffix == BYTE_MNEM_SUFFIX)
7473 {
7474 temp.bitfield.imm8 = overlap.bitfield.imm8;
7475 temp.bitfield.imm8s = overlap.bitfield.imm8s;
7476 }
7477 else if (i.suffix == WORD_MNEM_SUFFIX)
7478 temp.bitfield.imm16 = overlap.bitfield.imm16;
7479 else if (i.suffix == QWORD_MNEM_SUFFIX)
7480 {
7481 temp.bitfield.imm64 = overlap.bitfield.imm64;
7482 temp.bitfield.imm32s = overlap.bitfield.imm32s;
7483 }
7484 else
7485 temp.bitfield.imm32 = overlap.bitfield.imm32;
7486 overlap = temp;
7487 }
7488 else if (operand_type_equal (&overlap, &imm16_32_32s)
7489 || operand_type_equal (&overlap, &imm16_32)
7490 || operand_type_equal (&overlap, &imm16_32s))
7491 {
7492 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
7493 overlap = imm16;
7494 else
7495 overlap = imm32s;
7496 }
7497 else if (i.prefix[REX_PREFIX] & REX_W)
7498 overlap = operand_type_and (overlap, imm32s);
7499 else if (i.prefix[DATA_PREFIX])
7500 overlap = operand_type_and (overlap,
7501 flag_code != CODE_16BIT ? imm16 : imm32);
7502 if (!operand_type_equal (&overlap, &imm8)
7503 && !operand_type_equal (&overlap, &imm8s)
7504 && !operand_type_equal (&overlap, &imm16)
7505 && !operand_type_equal (&overlap, &imm32)
7506 && !operand_type_equal (&overlap, &imm32s)
7507 && !operand_type_equal (&overlap, &imm64))
7508 {
7509 as_bad (_("no instruction mnemonic suffix given; "
7510 "can't determine immediate size"));
7511 return 0;
7512 }
7513 }
7514 i.types[j] = overlap;
7515
7516 return 1;
7517 }
7518
7519 static int
7520 finalize_imm (void)
7521 {
7522 unsigned int j, n;
7523
7524 /* Update the first 2 immediate operands. */
7525 n = i.operands > 2 ? 2 : i.operands;
7526 if (n)
7527 {
7528 for (j = 0; j < n; j++)
7529 if (update_imm (j) == 0)
7530 return 0;
7531
7532 /* The 3rd operand can't be an immediate operand. */
7533 gas_assert (operand_type_check (i.types[2], imm) == 0);
7534 }
7535
7536 return 1;
7537 }
7538
7539 static int
7540 process_operands (void)
7541 {
7542 /* Default segment register this instruction will use for memory
7543 accesses. 0 means unknown. This is only for optimizing out
7544 unnecessary segment overrides. */
7545 const seg_entry *default_seg = 0;
7546
7547 if (i.tm.opcode_modifier.sse2avx)
7548 {
7549 /* Legacy encoded insns allow explicit REX prefixes, so these prefixes
7550 need converting. */
7551 i.rex |= i.prefix[REX_PREFIX] & (REX_W | REX_R | REX_X | REX_B);
7552 i.prefix[REX_PREFIX] = 0;
7553 i.rex_encoding = 0;
7554 }
7555 /* ImmExt should be processed after SSE2AVX. */
7556 else if (i.tm.opcode_modifier.immext)
7557 process_immext ();
7558
7559 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
7560 {
7561 unsigned int dupl = i.operands;
7562 unsigned int dest = dupl - 1;
7563 unsigned int j;
7564
7565 /* The destination must be an xmm register. */
7566 gas_assert (i.reg_operands
7567 && MAX_OPERANDS > dupl
7568 && operand_type_equal (&i.types[dest], &regxmm));
7569
7570 if (i.tm.operand_types[0].bitfield.instance == Accum
7571 && i.tm.operand_types[0].bitfield.xmmword)
7572 {
7573 if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
7574 {
7575 /* Keep xmm0 for instructions with VEX prefix and 3
7576 sources. */
7577 i.tm.operand_types[0].bitfield.instance = InstanceNone;
7578 i.tm.operand_types[0].bitfield.class = RegSIMD;
7579 goto duplicate;
7580 }
7581 else
7582 {
7583 /* We remove the first xmm0 and keep the number of
7584 operands unchanged, which in fact duplicates the
7585 destination. */
7586 for (j = 1; j < i.operands; j++)
7587 {
7588 i.op[j - 1] = i.op[j];
7589 i.types[j - 1] = i.types[j];
7590 i.tm.operand_types[j - 1] = i.tm.operand_types[j];
7591 i.flags[j - 1] = i.flags[j];
7592 }
7593 }
7594 }
7595 else if (i.tm.opcode_modifier.implicit1stxmm0)
7596 {
7597 gas_assert ((MAX_OPERANDS - 1) > dupl
7598 && (i.tm.opcode_modifier.vexsources
7599 == VEX3SOURCES));
7600
7601 /* Add the implicit xmm0 for instructions with VEX prefix
7602 and 3 sources. */
7603 for (j = i.operands; j > 0; j--)
7604 {
7605 i.op[j] = i.op[j - 1];
7606 i.types[j] = i.types[j - 1];
7607 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
7608 i.flags[j] = i.flags[j - 1];
7609 }
7610 i.op[0].regs
7611 = (const reg_entry *) str_hash_find (reg_hash, "xmm0");
7612 i.types[0] = regxmm;
7613 i.tm.operand_types[0] = regxmm;
7614
7615 i.operands += 2;
7616 i.reg_operands += 2;
7617 i.tm.operands += 2;
7618
7619 dupl++;
7620 dest++;
7621 i.op[dupl] = i.op[dest];
7622 i.types[dupl] = i.types[dest];
7623 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7624 i.flags[dupl] = i.flags[dest];
7625 }
7626 else
7627 {
7628 duplicate:
7629 i.operands++;
7630 i.reg_operands++;
7631 i.tm.operands++;
7632
7633 i.op[dupl] = i.op[dest];
7634 i.types[dupl] = i.types[dest];
7635 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7636 i.flags[dupl] = i.flags[dest];
7637 }
7638
7639 if (i.tm.opcode_modifier.immext)
7640 process_immext ();
7641 }
7642 else if (i.tm.operand_types[0].bitfield.instance == Accum
7643 && i.tm.operand_types[0].bitfield.xmmword)
7644 {
7645 unsigned int j;
7646
7647 for (j = 1; j < i.operands; j++)
7648 {
7649 i.op[j - 1] = i.op[j];
7650 i.types[j - 1] = i.types[j];
7651
7652 /* We need to adjust fields in i.tm since they are used by
7653 build_modrm_byte. */
7654 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
7655
7656 i.flags[j - 1] = i.flags[j];
7657 }
7658
7659 i.operands--;
7660 i.reg_operands--;
7661 i.tm.operands--;
7662 }
7663 else if (i.tm.opcode_modifier.implicitquadgroup)
7664 {
7665 unsigned int regnum, first_reg_in_group, last_reg_in_group;
7666
7667 /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
7668 gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
7669 regnum = register_number (i.op[1].regs);
7670 first_reg_in_group = regnum & ~3;
7671 last_reg_in_group = first_reg_in_group + 3;
7672 if (regnum != first_reg_in_group)
7673 as_warn (_("source register `%s%s' implicitly denotes"
7674 " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
7675 register_prefix, i.op[1].regs->reg_name,
7676 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
7677 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
7678 i.tm.name);
7679 }
7680 else if (i.tm.opcode_modifier.regkludge)
7681 {
7682 /* The imul $imm, %reg instruction is converted into
7683 imul $imm, %reg, %reg, and the clr %reg instruction
7684 is converted into xor %reg, %reg. */
7685
7686 unsigned int first_reg_op;
7687
7688 if (operand_type_check (i.types[0], reg))
7689 first_reg_op = 0;
7690 else
7691 first_reg_op = 1;
7692 /* Pretend we saw the extra register operand. */
7693 gas_assert (i.reg_operands == 1
7694 && i.op[first_reg_op + 1].regs == 0);
7695 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7696 i.types[first_reg_op + 1] = i.types[first_reg_op];
7697 i.operands++;
7698 i.reg_operands++;
7699 }
7700
7701 if (i.tm.opcode_modifier.modrm)
7702 {
7703 /* The opcode is completed (modulo i.tm.extension_opcode which
7704 must be put into the modrm byte). Now, we make the modrm and
7705 index base bytes based on all the info we've collected. */
7706
7707 default_seg = build_modrm_byte ();
7708 }
7709 else if (i.types[0].bitfield.class == SReg)
7710 {
7711 if (flag_code != CODE_64BIT
7712 ? i.tm.base_opcode == POP_SEG_SHORT
7713 && i.op[0].regs->reg_num == 1
7714 : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
7715 && i.op[0].regs->reg_num < 4)
7716 {
7717 as_bad (_("you can't `%s %s%s'"),
7718 i.tm.name, register_prefix, i.op[0].regs->reg_name);
7719 return 0;
7720 }
7721 	  if (i.op[0].regs->reg_num > 3 && i.tm.opcode_length == 1)
7722 {
7723 i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
7724 i.tm.opcode_length = 2;
7725 }
7726 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
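	  /* Worked example (assumed byte values): with a base opcode of
	     0x07 this yields 0x07 for "pop %es" (reg 0) and 0x1f for
	     "pop %ds" (reg 3, 0x07 | 3 << 3), while %fs/%gs take the
	     two-byte 0f a1 / 0f a9 forms selected just above.  */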
7727 }
7728 else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
7729 {
7730 default_seg = &ds;
7731 }
7732 else if (i.tm.opcode_modifier.isstring)
7733 {
7734 /* For the string instructions that allow a segment override
7735 on one of their operands, the default segment is ds. */
7736 default_seg = &ds;
7737 }
7738 else if (i.short_form)
7739 {
7740 /* The register or float register operand is in operand
7741 0 or 1. */
7742 unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
7743
7744 /* Register goes in low 3 bits of opcode. */
7745 i.tm.base_opcode |= i.op[op].regs->reg_num;
7746 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7747 i.rex |= REX_B;
7748 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7749 {
7750 /* Warn about some common errors, but press on regardless.
7751 The first case can be generated by gcc (<= 2.8.1). */
7752 if (i.operands == 2)
7753 {
7754 /* Reversed arguments on faddp, fsubp, etc. */
7755 as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7756 register_prefix, i.op[!intel_syntax].regs->reg_name,
7757 register_prefix, i.op[intel_syntax].regs->reg_name);
7758 }
7759 else
7760 {
7761 /* Extraneous `l' suffix on fp insn. */
7762 as_warn (_("translating to `%s %s%s'"), i.tm.name,
7763 register_prefix, i.op[0].regs->reg_name);
7764 }
7765 }
7766 }
7767
7768 if ((i.seg[0] || i.prefix[SEG_PREFIX])
7769 && i.tm.base_opcode == 0x8d /* lea */
7770 	  && !is_any_vex_encoding (&i.tm))
7771 {
7772 if (!quiet_warnings)
7773 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7774 if (optimize)
7775 {
7776 i.seg[0] = NULL;
7777 i.prefix[SEG_PREFIX] = 0;
7778 }
7779 }
7780
7781 /* If a segment was explicitly specified, and the specified segment
7782 is neither the default nor the one already recorded from a prefix,
7783 use an opcode prefix to select it. If we never figured out what
7784 the default segment is, then default_seg will be zero at this
7785 point, and the specified segment prefix will always be used. */
7786 if (i.seg[0]
7787 && i.seg[0] != default_seg
7788 && i.seg[0]->seg_prefix != i.prefix[SEG_PREFIX])
7789 {
7790 if (!add_prefix (i.seg[0]->seg_prefix))
7791 return 0;
7792 }
7793 return 1;
7794 }
7795
7796 static INLINE void set_rex_vrex (const reg_entry *r, unsigned int rex_bit,
7797 bfd_boolean do_sse2avx)
7798 {
7799 if (r->reg_flags & RegRex)
7800 {
7801 if (i.rex & rex_bit)
7802 as_bad (_("same type of prefix used twice"));
7803 i.rex |= rex_bit;
7804 }
7805 else if (do_sse2avx && (i.rex & rex_bit) && i.vex.register_specifier)
7806 {
7807 gas_assert (i.vex.register_specifier == r);
7808 i.vex.register_specifier += 8;
7809 }
7810
7811 if (r->reg_flags & RegVRex)
7812 i.vrex |= rex_bit;
7813 }
7814
7815 static const seg_entry *
7816 build_modrm_byte (void)
7817 {
7818 const seg_entry *default_seg = 0;
7819 unsigned int source, dest;
7820 int vex_3_sources;
7821
7822 vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
7823 if (vex_3_sources)
7824 {
7825 unsigned int nds, reg_slot;
7826 expressionS *exp;
7827
7828 dest = i.operands - 1;
7829 nds = dest - 1;
7830
7831 /* There are 2 kinds of instructions:
7832 1. 5 operands: 4 register operands or 3 register operands
7833 plus 1 memory operand plus one Imm4 operand, VexXDS, and
7834 VexW0 or VexW1. The destination must be either XMM, YMM or
7835 ZMM register.
7836 2. 4 operands: 4 register operands or 3 register operands
7837 plus 1 memory operand, with VexXDS. */
7838 gas_assert ((i.reg_operands == 4
7839 || (i.reg_operands == 3 && i.mem_operands == 1))
7840 && i.tm.opcode_modifier.vexvvvv == VEXXDS
7841 && i.tm.opcode_modifier.vexw
7842 && i.tm.operand_types[dest].bitfield.class == RegSIMD);
7843
7844 /* If VexW1 is set, the first non-immediate operand is the source and
7845 the second non-immediate one is encoded in the immediate operand. */
7846 if (i.tm.opcode_modifier.vexw == VEXW1)
7847 {
7848 source = i.imm_operands;
7849 reg_slot = i.imm_operands + 1;
7850 }
7851 else
7852 {
7853 source = i.imm_operands + 1;
7854 reg_slot = i.imm_operands;
7855 }
7856
7857 if (i.imm_operands == 0)
7858 {
7859 /* When there is no immediate operand, generate an 8bit
7860 immediate operand to encode the first operand. */
7861 exp = &im_expressions[i.imm_operands++];
7862 i.op[i.operands].imms = exp;
7863 i.types[i.operands] = imm8;
7864 i.operands++;
7865
7866 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7867 exp->X_op = O_constant;
7868 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
7869 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7870 }
7871 else
7872 {
7873 gas_assert (i.imm_operands == 1);
7874 gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7875 gas_assert (!i.tm.opcode_modifier.immext);
7876
7877 /* Turn on Imm8 again so that output_imm will generate it. */
7878 i.types[0].bitfield.imm8 = 1;
7879
7880 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7881 i.op[0].imms->X_add_number
7882 |= register_number (i.op[reg_slot].regs) << 4;
7883 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7884 }
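      /* Either way, the extra register number lands in bits 7:4 of the
	 immediate byte -- e.g. (assumed example) %xmm5 there would
	 contribute 5 << 4 == 0x50.  */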
7885
7886 gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
7887 i.vex.register_specifier = i.op[nds].regs;
7888 }
7889 else
7890 source = dest = 0;
7891
7892 /* i.reg_operands MUST be the number of real register operands;
7893 implicit registers do not count. If there are 3 register
7894 	 operands, it must be an instruction with VexNDS. For an
7895 	 instruction with VexNDD, the destination register is encoded
7896 	 in the VEX prefix. If there are 4 register operands, it must
7897 	 be an instruction with a VEX prefix and 3 sources. */
7898 if (i.mem_operands == 0
7899 && ((i.reg_operands == 2
7900 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7901 || (i.reg_operands == 3
7902 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7903 || (i.reg_operands == 4 && vex_3_sources)))
7904 {
7905 switch (i.operands)
7906 {
7907 case 2:
7908 source = 0;
7909 break;
7910 case 3:
7911 	  /* When there are 3 operands, one of them may be immediate,
7912 	     which may be the first or the last operand. Otherwise,
7913 	     the first operand must be the shift count register (%cl)
7914 	     or it is an instruction with VexNDS.
7915 gas_assert (i.imm_operands == 1
7916 || (i.imm_operands == 0
7917 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
7918 || (i.types[0].bitfield.instance == RegC
7919 && i.types[0].bitfield.byte))));
7920 if (operand_type_check (i.types[0], imm)
7921 || (i.types[0].bitfield.instance == RegC
7922 && i.types[0].bitfield.byte))
7923 source = 1;
7924 else
7925 source = 0;
7926 break;
7927 case 4:
7928 /* When there are 4 operands, the first two must be 8bit
7929 immediate operands. The source operand will be the 3rd
7930 one.
7931
7932 	     For instructions with VexNDS, if the first operand is
7933 	     an imm8, the source operand is the 2nd one. If the last
7934 operand is imm8, the source operand is the first one. */
7935 gas_assert ((i.imm_operands == 2
7936 && i.types[0].bitfield.imm8
7937 && i.types[1].bitfield.imm8)
7938 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7939 && i.imm_operands == 1
7940 && (i.types[0].bitfield.imm8
7941 || i.types[i.operands - 1].bitfield.imm8
7942 || i.rounding)));
7943 if (i.imm_operands == 2)
7944 source = 2;
7945 else
7946 {
7947 if (i.types[0].bitfield.imm8)
7948 source = 1;
7949 else
7950 source = 0;
7951 }
7952 break;
7953 case 5:
7954 if (is_evex_encoding (&i.tm))
7955 {
7956 	      /* For EVEX instructions, when there are 5 operands, the
7957 		 first one must be an immediate operand. If the second one
7958 		 is an immediate operand, the source operand is the 3rd
7959 		 one. If the last one is an immediate operand, the source
7960 		 operand is the 2nd one. */
7961 gas_assert (i.imm_operands == 2
7962 && i.tm.opcode_modifier.sae
7963 && operand_type_check (i.types[0], imm));
7964 if (operand_type_check (i.types[1], imm))
7965 source = 2;
7966 else if (operand_type_check (i.types[4], imm))
7967 source = 1;
7968 else
7969 abort ();
7970 }
7971 break;
7972 default:
7973 abort ();
7974 }
7975
7976 if (!vex_3_sources)
7977 {
7978 dest = source + 1;
7979
7980 /* RC/SAE operand could be between DEST and SRC. That happens
7981 when one operand is GPR and the other one is XMM/YMM/ZMM
7982 register. */
7983 if (i.rounding && i.rounding->operand == (int) dest)
7984 dest++;
7985
7986 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7987 {
7988 /* For instructions with VexNDS, the register-only source
7989 operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7990 register. It is encoded in VEX prefix. */
7991
7992 i386_operand_type op;
7993 unsigned int vvvv;
7994
7995 /* Swap two source operands if needed. */
7996 if (i.tm.opcode_modifier.swapsources)
7997 {
7998 vvvv = source;
7999 source = dest;
8000 }
8001 else
8002 vvvv = dest;
8003
8004 op = i.tm.operand_types[vvvv];
8005 if ((dest + 1) >= i.operands
8006 || ((op.bitfield.class != Reg
8007 || (!op.bitfield.dword && !op.bitfield.qword))
8008 && op.bitfield.class != RegSIMD
8009 && !operand_type_equal (&op, &regmask)))
8010 abort ();
8011 i.vex.register_specifier = i.op[vvvv].regs;
8012 dest++;
8013 }
8014 }
8015
8016 i.rm.mode = 3;
8017 /* One of the register operands will be encoded in the i.rm.reg
8018 field, the other in the combined i.rm.mode and i.rm.regmem
8019 fields. If no form of this instruction supports a memory
8020 destination operand, then we assume the source operand may
8021 sometimes be a memory operand and so we need to store the
8022 destination in the i.rm.reg field. */
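      /* Illustrative (assumed) encoding: "movl %eax, %ebx" uses opcode
	 0x89 with ModRM 0xc3 -- mode 3, reg 0 (%eax, the source, since
	 a memory-destination form exists) and regmem 3 (%ebx).  */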
8023 if (!i.tm.opcode_modifier.regmem
8024 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
8025 {
8026 i.rm.reg = i.op[dest].regs->reg_num;
8027 i.rm.regmem = i.op[source].regs->reg_num;
8028 set_rex_vrex (i.op[dest].regs, REX_R, i.tm.opcode_modifier.sse2avx);
8029 set_rex_vrex (i.op[source].regs, REX_B, FALSE);
8030 }
8031 else
8032 {
8033 i.rm.reg = i.op[source].regs->reg_num;
8034 i.rm.regmem = i.op[dest].regs->reg_num;
8035 set_rex_vrex (i.op[dest].regs, REX_B, i.tm.opcode_modifier.sse2avx);
8036 set_rex_vrex (i.op[source].regs, REX_R, FALSE);
8037 }
8038 if (flag_code != CODE_64BIT && (i.rex & REX_R))
8039 {
8040 if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
8041 abort ();
8042 i.rex &= ~REX_R;
8043 add_prefix (LOCK_PREFIX_OPCODE);
8044 }
8045 }
8046 else
8047 { /* If it's not 2 reg operands... */
8048 unsigned int mem;
8049
8050 if (i.mem_operands)
8051 {
8052 unsigned int fake_zero_displacement = 0;
8053 unsigned int op;
8054
8055 for (op = 0; op < i.operands; op++)
8056 if (i.flags[op] & Operand_Mem)
8057 break;
8058 gas_assert (op < i.operands);
8059
8060 if (i.tm.opcode_modifier.sib)
8061 {
8062 /* The index register of VSIB shouldn't be RegIZ. */
8063 if (i.tm.opcode_modifier.sib != SIBMEM
8064 && i.index_reg->reg_num == RegIZ)
8065 abort ();
8066
8067 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8068 if (!i.base_reg)
8069 {
8070 i.sib.base = NO_BASE_REGISTER;
8071 i.sib.scale = i.log2_scale_factor;
8072 i.types[op].bitfield.disp8 = 0;
8073 i.types[op].bitfield.disp16 = 0;
8074 i.types[op].bitfield.disp64 = 0;
8075 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
8076 {
8077 /* Must be 32 bit */
8078 i.types[op].bitfield.disp32 = 1;
8079 i.types[op].bitfield.disp32s = 0;
8080 }
8081 else
8082 {
8083 i.types[op].bitfield.disp32 = 0;
8084 i.types[op].bitfield.disp32s = 1;
8085 }
8086 }
8087
8088 	      /* Since the mandatory SIB always has an index register, the
8089 		 code logic remains unchanged. The non-mandatory SIB
8090 		 without an index register is allowed and will be handled
8091 		 later. */
8092 if (i.index_reg)
8093 {
8094 if (i.index_reg->reg_num == RegIZ)
8095 i.sib.index = NO_INDEX_REGISTER;
8096 else
8097 i.sib.index = i.index_reg->reg_num;
8098 set_rex_vrex (i.index_reg, REX_X, FALSE);
8099 }
8100 }
8101
8102 default_seg = &ds;
8103
8104 if (i.base_reg == 0)
8105 {
8106 i.rm.mode = 0;
8107 if (!i.disp_operands)
8108 fake_zero_displacement = 1;
8109 if (i.index_reg == 0)
8110 {
8111 i386_operand_type newdisp;
8112
8113 		  /* Check for both VSIB and the mandatory non-vector SIB. */
8114 gas_assert (!i.tm.opcode_modifier.sib
8115 || i.tm.opcode_modifier.sib == SIBMEM);
8116 /* Operand is just <disp> */
8117 if (flag_code == CODE_64BIT)
8118 {
8119 		      /* 64bit mode replaces 32bit absolute
8120 			 addressing with RIP relative addressing;
8121 			 absolute addressing is encoded by one of the
8122 			 redundant SIB forms. */
8123 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8124 i.sib.base = NO_BASE_REGISTER;
8125 i.sib.index = NO_INDEX_REGISTER;
8126 newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
8127 }
8128 else if ((flag_code == CODE_16BIT)
8129 ^ (i.prefix[ADDR_PREFIX] != 0))
8130 {
8131 i.rm.regmem = NO_BASE_REGISTER_16;
8132 newdisp = disp16;
8133 }
8134 else
8135 {
8136 i.rm.regmem = NO_BASE_REGISTER;
8137 newdisp = disp32;
8138 }
8139 i.types[op] = operand_type_and_not (i.types[op], anydisp);
8140 i.types[op] = operand_type_or (i.types[op], newdisp);
8141 }
8142 else if (!i.tm.opcode_modifier.sib)
8143 {
8144 /* !i.base_reg && i.index_reg */
8145 if (i.index_reg->reg_num == RegIZ)
8146 i.sib.index = NO_INDEX_REGISTER;
8147 else
8148 i.sib.index = i.index_reg->reg_num;
8149 i.sib.base = NO_BASE_REGISTER;
8150 i.sib.scale = i.log2_scale_factor;
8151 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8152 i.types[op].bitfield.disp8 = 0;
8153 i.types[op].bitfield.disp16 = 0;
8154 i.types[op].bitfield.disp64 = 0;
8155 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
8156 {
8157 /* Must be 32 bit */
8158 i.types[op].bitfield.disp32 = 1;
8159 i.types[op].bitfield.disp32s = 0;
8160 }
8161 else
8162 {
8163 i.types[op].bitfield.disp32 = 0;
8164 i.types[op].bitfield.disp32s = 1;
8165 }
8166 if ((i.index_reg->reg_flags & RegRex) != 0)
8167 i.rex |= REX_X;
8168 }
8169 }
8170 /* RIP addressing for 64bit mode. */
8171 else if (i.base_reg->reg_num == RegIP)
8172 {
8173 gas_assert (!i.tm.opcode_modifier.sib);
8174 i.rm.regmem = NO_BASE_REGISTER;
8175 i.types[op].bitfield.disp8 = 0;
8176 i.types[op].bitfield.disp16 = 0;
8177 i.types[op].bitfield.disp32 = 0;
8178 i.types[op].bitfield.disp32s = 1;
8179 i.types[op].bitfield.disp64 = 0;
8180 i.flags[op] |= Operand_PCrel;
8181 if (! i.disp_operands)
8182 fake_zero_displacement = 1;
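	      /* Illustrative (assumed) example: "movq foo(%rip), %rax"
		 encodes as 48 8b 05 <disp32>, ModRM 0x05 selecting
		 mode 0 / regmem 5, i.e. RIP-relative here.  */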
8183 }
8184 else if (i.base_reg->reg_type.bitfield.word)
8185 {
8186 gas_assert (!i.tm.opcode_modifier.sib);
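	      /* For reference, the 16-bit ModRM regmem encodings are:
		 0 (%bx,%si)  1 (%bx,%di)  2 (%bp,%si)  3 (%bp,%di)
		 4 (%si)  5 (%di)  6 (%bp) (or bare disp16 when mode is 0)
		 7 (%bx) -- which is what the cases below compute.  */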
8187 switch (i.base_reg->reg_num)
8188 {
8189 case 3: /* (%bx) */
8190 if (i.index_reg == 0)
8191 i.rm.regmem = 7;
8192 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
8193 i.rm.regmem = i.index_reg->reg_num - 6;
8194 break;
8195 case 5: /* (%bp) */
8196 default_seg = &ss;
8197 if (i.index_reg == 0)
8198 {
8199 i.rm.regmem = 6;
8200 if (operand_type_check (i.types[op], disp) == 0)
8201 {
8202 /* fake (%bp) into 0(%bp) */
8203 if (i.disp_encoding == disp_encoding_16bit)
8204 i.types[op].bitfield.disp16 = 1;
8205 else
8206 i.types[op].bitfield.disp8 = 1;
8207 fake_zero_displacement = 1;
8208 }
8209 }
8210 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
8211 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
8212 break;
8213 default: /* (%si) -> 4 or (%di) -> 5 */
8214 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
8215 }
8216 if (!fake_zero_displacement
8217 && !i.disp_operands
8218 && i.disp_encoding)
8219 {
8220 fake_zero_displacement = 1;
8221 if (i.disp_encoding == disp_encoding_8bit)
8222 i.types[op].bitfield.disp8 = 1;
8223 else
8224 i.types[op].bitfield.disp16 = 1;
8225 }
8226 i.rm.mode = mode_from_disp_size (i.types[op]);
8227 }
8228 else /* i.base_reg and 32/64 bit mode */
8229 {
8230 if (flag_code == CODE_64BIT
8231 && operand_type_check (i.types[op], disp))
8232 {
8233 i.types[op].bitfield.disp16 = 0;
8234 i.types[op].bitfield.disp64 = 0;
8235 if (i.prefix[ADDR_PREFIX] == 0)
8236 {
8237 i.types[op].bitfield.disp32 = 0;
8238 i.types[op].bitfield.disp32s = 1;
8239 }
8240 else
8241 {
8242 i.types[op].bitfield.disp32 = 1;
8243 i.types[op].bitfield.disp32s = 0;
8244 }
8245 }
8246
8247 if (!i.tm.opcode_modifier.sib)
8248 i.rm.regmem = i.base_reg->reg_num;
8249 if ((i.base_reg->reg_flags & RegRex) != 0)
8250 i.rex |= REX_B;
8251 i.sib.base = i.base_reg->reg_num;
8252 /* x86-64 ignores REX prefix bit here to avoid decoder
8253 complications. */
8254 if (!(i.base_reg->reg_flags & RegRex)
8255 && (i.base_reg->reg_num == EBP_REG_NUM
8256 || i.base_reg->reg_num == ESP_REG_NUM))
8257 default_seg = &ss;
8258 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
8259 {
8260 fake_zero_displacement = 1;
8261 if (i.disp_encoding == disp_encoding_32bit)
8262 i.types[op].bitfield.disp32 = 1;
8263 else
8264 i.types[op].bitfield.disp8 = 1;
8265 }
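	      /* E.g. (assumed example) bare "(%ebp)" -- and "(%r13)" in
		 64-bit mode -- cannot use mode 0, so it is assembled as
		 "0x0(%ebp)" with the one-byte displacement faked here.  */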
8266 i.sib.scale = i.log2_scale_factor;
8267 if (i.index_reg == 0)
8268 {
8269 /* Only check for VSIB. */
8270 gas_assert (i.tm.opcode_modifier.sib != VECSIB128
8271 && i.tm.opcode_modifier.sib != VECSIB256
8272 && i.tm.opcode_modifier.sib != VECSIB512);
8273
8274 /* <disp>(%esp) becomes two byte modrm with no index
8275 register. We've already stored the code for esp
8276 		     in i.rm.regmem, i.e. ESCAPE_TO_TWO_BYTE_ADDRESSING.
8277 Any base register besides %esp will not use the
8278 extra modrm byte. */
8279 i.sib.index = NO_INDEX_REGISTER;
8280 }
8281 else if (!i.tm.opcode_modifier.sib)
8282 {
8283 if (i.index_reg->reg_num == RegIZ)
8284 i.sib.index = NO_INDEX_REGISTER;
8285 else
8286 i.sib.index = i.index_reg->reg_num;
8287 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8288 if ((i.index_reg->reg_flags & RegRex) != 0)
8289 i.rex |= REX_X;
8290 }
8291
8292 if (i.disp_operands
8293 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
8294 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
8295 i.rm.mode = 0;
8296 else
8297 {
8298 if (!fake_zero_displacement
8299 && !i.disp_operands
8300 && i.disp_encoding)
8301 {
8302 fake_zero_displacement = 1;
8303 if (i.disp_encoding == disp_encoding_8bit)
8304 i.types[op].bitfield.disp8 = 1;
8305 else
8306 i.types[op].bitfield.disp32 = 1;
8307 }
8308 i.rm.mode = mode_from_disp_size (i.types[op]);
8309 }
8310 }
8311
8312 if (fake_zero_displacement)
8313 {
8314 /* Fakes a zero displacement assuming that i.types[op]
8315 holds the correct displacement size. */
8316 expressionS *exp;
8317
8318 gas_assert (i.op[op].disps == 0);
8319 exp = &disp_expressions[i.disp_operands++];
8320 i.op[op].disps = exp;
8321 exp->X_op = O_constant;
8322 exp->X_add_number = 0;
8323 exp->X_add_symbol = (symbolS *) 0;
8324 exp->X_op_symbol = (symbolS *) 0;
8325 }
8326
8327 mem = op;
8328 }
8329 else
8330 mem = ~0;
8331
8332 if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
8333 {
8334 if (operand_type_check (i.types[0], imm))
8335 i.vex.register_specifier = NULL;
8336 else
8337 {
8338 /* VEX.vvvv encodes one of the sources when the first
8339 operand is not an immediate. */
8340 if (i.tm.opcode_modifier.vexw == VEXW0)
8341 i.vex.register_specifier = i.op[0].regs;
8342 else
8343 i.vex.register_specifier = i.op[1].regs;
8344 }
8345
8346 /* Destination is a XMM register encoded in the ModRM.reg
8347 and VEX.R bit. */
8348 i.rm.reg = i.op[2].regs->reg_num;
8349 if ((i.op[2].regs->reg_flags & RegRex) != 0)
8350 i.rex |= REX_R;
8351
8352 /* ModRM.rm and VEX.B encodes the other source. */
8353 if (!i.mem_operands)
8354 {
8355 i.rm.mode = 3;
8356
8357 if (i.tm.opcode_modifier.vexw == VEXW0)
8358 i.rm.regmem = i.op[1].regs->reg_num;
8359 else
8360 i.rm.regmem = i.op[0].regs->reg_num;
8361
8362 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8363 i.rex |= REX_B;
8364 }
8365 }
8366 else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
8367 {
8368 i.vex.register_specifier = i.op[2].regs;
8369 if (!i.mem_operands)
8370 {
8371 i.rm.mode = 3;
8372 i.rm.regmem = i.op[1].regs->reg_num;
8373 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8374 i.rex |= REX_B;
8375 }
8376 }
8377 /* Fill in i.rm.reg or i.rm.regmem field with register operand
8378 (if any) based on i.tm.extension_opcode. Again, we must be
8379 careful to make sure that segment/control/debug/test/MMX
8380 registers are coded into the i.rm.reg field. */
8381 else if (i.reg_operands)
8382 {
8383 unsigned int op;
8384 unsigned int vex_reg = ~0;
8385
8386 for (op = 0; op < i.operands; op++)
8387 if (i.types[op].bitfield.class == Reg
8388 || i.types[op].bitfield.class == RegBND
8389 || i.types[op].bitfield.class == RegMask
8390 || i.types[op].bitfield.class == SReg
8391 || i.types[op].bitfield.class == RegCR
8392 || i.types[op].bitfield.class == RegDR
8393 || i.types[op].bitfield.class == RegTR
8394 || i.types[op].bitfield.class == RegSIMD
8395 || i.types[op].bitfield.class == RegMMX)
8396 break;
8397
8398 if (vex_3_sources)
8399 op = dest;
8400 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
8401 {
8402 /* For instructions with VexNDS, the register-only
8403 source operand is encoded in VEX prefix. */
8404 gas_assert (mem != (unsigned int) ~0);
8405
8406 if (op > mem)
8407 {
8408 vex_reg = op++;
8409 gas_assert (op < i.operands);
8410 }
8411 else
8412 {
8413 /* Check register-only source operand when two source
8414 operands are swapped. */
8415 if (!i.tm.operand_types[op].bitfield.baseindex
8416 && i.tm.operand_types[op + 1].bitfield.baseindex)
8417 {
8418 vex_reg = op;
8419 op += 2;
8420 gas_assert (mem == (vex_reg + 1)
8421 && op < i.operands);
8422 }
8423 else
8424 {
8425 vex_reg = op + 1;
8426 gas_assert (vex_reg < i.operands);
8427 }
8428 }
8429 }
8430 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
8431 {
8432 /* For instructions with VexNDD, the register destination
8433 is encoded in VEX prefix. */
8434 if (i.mem_operands == 0)
8435 {
8436 /* There is no memory operand. */
8437 gas_assert ((op + 2) == i.operands);
8438 vex_reg = op + 1;
8439 }
8440 else
8441 {
8442 /* There are only 2 non-immediate operands. */
8443 gas_assert (op < i.imm_operands + 2
8444 && i.operands == i.imm_operands + 2);
8445 vex_reg = i.imm_operands + 1;
8446 }
8447 }
8448 else
8449 gas_assert (op < i.operands);
8450
8451 if (vex_reg != (unsigned int) ~0)
8452 {
8453 i386_operand_type *type = &i.tm.operand_types[vex_reg];
8454
8455 if ((type->bitfield.class != Reg
8456 || (!type->bitfield.dword && !type->bitfield.qword))
8457 && type->bitfield.class != RegSIMD
8458 && !operand_type_equal (type, &regmask))
8459 abort ();
8460
8461 i.vex.register_specifier = i.op[vex_reg].regs;
8462 }
8463
8464 /* Don't set OP operand twice. */
8465 if (vex_reg != op)
8466 {
8467 /* If there is an extension opcode to put here, the
8468 register number must be put into the regmem field. */
8469 if (i.tm.extension_opcode != None)
8470 {
8471 i.rm.regmem = i.op[op].regs->reg_num;
8472 set_rex_vrex (i.op[op].regs, REX_B,
8473 i.tm.opcode_modifier.sse2avx);
8474 }
8475 else
8476 {
8477 i.rm.reg = i.op[op].regs->reg_num;
8478 set_rex_vrex (i.op[op].regs, REX_R,
8479 i.tm.opcode_modifier.sse2avx);
8480 }
8481 }
8482
8483 	  /* Now, if no memory operand has set i.rm.mode to 0, 1, or 2,
8484 	     we must set it to 3 to indicate this is a register operand
8485 	     in the regmem field. */
8486 if (!i.mem_operands)
8487 i.rm.mode = 3;
8488 }
8489
8490 /* Fill in i.rm.reg field with extension opcode (if any). */
8491 if (i.tm.extension_opcode != None)
8492 i.rm.reg = i.tm.extension_opcode;
8493 }
8494 return default_seg;
8495 }
8496
8497 static INLINE void
8498 frag_opcode_byte (unsigned char byte)
8499 {
8500 if (now_seg != absolute_section)
8501 FRAG_APPEND_1_CHAR (byte);
8502 else
8503 ++abs_section_offset;
8504 }
8505
8506 static unsigned int
8507 flip_code16 (unsigned int code16)
8508 {
8509 gas_assert (i.tm.operands == 1);
8510
8511 return !(i.prefix[REX_PREFIX] & REX_W)
8512 && (code16 ? i.tm.operand_types[0].bitfield.disp32
8513 || i.tm.operand_types[0].bitfield.disp32s
8514 : i.tm.operand_types[0].bitfield.disp16)
8515 ? CODE16 : 0;
8516 }
8517
8518 static void
8519 output_branch (void)
8520 {
8521 char *p;
8522 int size;
8523 int code16;
8524 int prefix;
8525 relax_substateT subtype;
8526 symbolS *sym;
8527 offsetT off;
8528
8529 if (now_seg == absolute_section)
8530 {
8531 as_bad (_("relaxable branches not supported in absolute section"));
8532 return;
8533 }
8534
8535 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
8536 size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
8537
8538 prefix = 0;
8539 if (i.prefix[DATA_PREFIX] != 0)
8540 {
8541 prefix = 1;
8542 i.prefixes -= 1;
8543       code16 ^= flip_code16 (code16);
8544 }
8545 /* Pentium4 branch hints. */
8546 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8547 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8548 {
8549 prefix++;
8550 i.prefixes--;
8551 }
8552 if (i.prefix[REX_PREFIX] != 0)
8553 {
8554 prefix++;
8555 i.prefixes--;
8556 }
8557
8558 /* BND prefixed jump. */
8559 if (i.prefix[BND_PREFIX] != 0)
8560 {
8561 prefix++;
8562 i.prefixes--;
8563 }
8564
8565 if (i.prefixes != 0)
8566 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8567
8568   /* It's always a symbol; end frag & set up for relax.
8569 Make sure there is enough room in this frag for the largest
8570 instruction we may generate in md_convert_frag. This is 2
8571 bytes for the opcode and room for the prefix and largest
8572 displacement. */
8573 frag_grow (prefix + 2 + 4);
8574 /* Prefix and 1 opcode byte go in fr_fix. */
8575 p = frag_more (prefix + 1);
8576 if (i.prefix[DATA_PREFIX] != 0)
8577 *p++ = DATA_PREFIX_OPCODE;
8578 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
8579 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
8580 *p++ = i.prefix[SEG_PREFIX];
8581 if (i.prefix[BND_PREFIX] != 0)
8582 *p++ = BND_PREFIX_OPCODE;
8583 if (i.prefix[REX_PREFIX] != 0)
8584 *p++ = i.prefix[REX_PREFIX];
8585 *p = i.tm.base_opcode;
8586
8587 if ((unsigned char) *p == JUMP_PC_RELATIVE)
8588 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
8589 else if (cpu_arch_flags.bitfield.cpui386)
8590 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
8591 else
8592 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
8593 subtype |= code16;
8594
8595 sym = i.op[0].disps->X_add_symbol;
8596 off = i.op[0].disps->X_add_number;
8597
8598 if (i.op[0].disps->X_op != O_constant
8599 && i.op[0].disps->X_op != O_symbol)
8600 {
8601 /* Handle complex expressions. */
8602 sym = make_expr_symbol (i.op[0].disps);
8603 off = 0;
8604 }
8605
8606 /* 1 possible extra opcode + 4 byte displacement go in var part.
8607 Pass reloc in fr_var. */
8608 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
8609 }
8610
8611 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8612 /* Return TRUE iff PLT32 relocation should be used for branching to
8613 symbol S. */
8614
8615 static bfd_boolean
8616 need_plt32_p (symbolS *s)
8617 {
8618 /* PLT32 relocation is ELF only. */
8619 if (!IS_ELF)
8620 return FALSE;
8621
8622 #ifdef TE_SOLARIS
8623 /* Don't emit PLT32 relocation on Solaris: neither native linker nor
8624 krtld support it. */
8625 return FALSE;
8626 #endif
8627
8628   /* Since there is no need to prepare for a PLT branch on x86-64, we
8629      can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
8630      be used as a marker for 32-bit PC-relative branches. */
8631 if (!object_64bit)
8632 return FALSE;
8633
8634 if (s == NULL)
8635 return FALSE;
8636
8637   /* Weak or undefined symbols need a PLT32 relocation. */
8638 if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
8639 return TRUE;
8640
8641   /* A non-global symbol doesn't need a PLT32 relocation. */
8642 if (! S_IS_EXTERNAL (s))
8643 return FALSE;
8644
8645   /* Other global symbols need a PLT32 relocation. NB: Symbols with
8646      non-default visibility are treated as normal global symbols
8647      so that the PLT32 relocation can be used as a marker for 32-bit
8648      PC-relative branches. It is useful for linker relaxation. */
8649 return TRUE;
8650 }
8651 #endif
8652
8653 static void
8654 output_jump (void)
8655 {
8656 char *p;
8657 int size;
8658 fixS *fixP;
8659 bfd_reloc_code_real_type jump_reloc = i.reloc[0];
8660
8661 if (i.tm.opcode_modifier.jump == JUMP_BYTE)
8662 {
8663 /* This is a loop or jecxz type instruction. */
8664 size = 1;
8665 if (i.prefix[ADDR_PREFIX] != 0)
8666 {
8667 frag_opcode_byte (ADDR_PREFIX_OPCODE);
8668 i.prefixes -= 1;
8669 }
8670 /* Pentium4 branch hints. */
8671 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8672 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8673 {
8674 frag_opcode_byte (i.prefix[SEG_PREFIX]);
8675 i.prefixes--;
8676 }
8677 }
8678 else
8679 {
8680 int code16;
8681
8682 code16 = 0;
8683 if (flag_code == CODE_16BIT)
8684 code16 = CODE16;
8685
8686 if (i.prefix[DATA_PREFIX] != 0)
8687 {
8688 frag_opcode_byte (DATA_PREFIX_OPCODE);
8689 i.prefixes -= 1;
8690 	  code16 ^= flip_code16 (code16);
8691 }
8692
8693 size = 4;
8694 if (code16)
8695 size = 2;
8696 }
8697
8698 /* BND prefixed jump. */
8699 if (i.prefix[BND_PREFIX] != 0)
8700 {
8701 frag_opcode_byte (i.prefix[BND_PREFIX]);
8702 i.prefixes -= 1;
8703 }
8704
8705 if (i.prefix[REX_PREFIX] != 0)
8706 {
8707 frag_opcode_byte (i.prefix[REX_PREFIX]);
8708 i.prefixes -= 1;
8709 }
8710
8711 if (i.prefixes != 0)
8712 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8713
8714 if (now_seg == absolute_section)
8715 {
8716 abs_section_offset += i.tm.opcode_length + size;
8717 return;
8718 }
8719
8720 p = frag_more (i.tm.opcode_length + size);
8721 switch (i.tm.opcode_length)
8722 {
8723 case 2:
8724 *p++ = i.tm.base_opcode >> 8;
8725 /* Fall through. */
8726 case 1:
8727 *p++ = i.tm.base_opcode;
8728 break;
8729 default:
8730 abort ();
8731 }
8732
8733 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8734 if (size == 4
8735 && jump_reloc == NO_RELOC
8736 && need_plt32_p (i.op[0].disps->X_add_symbol))
8737 jump_reloc = BFD_RELOC_X86_64_PLT32;
8738 #endif
8739
8740 jump_reloc = reloc (size, 1, 1, jump_reloc);
8741
8742 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8743 i.op[0].disps, 1, jump_reloc);
8744
8745 /* All jumps handled here are signed, but don't use a signed limit
8746 check for 32 and 16 bit jumps as we want to allow wrap around at
8747 4G and 64k respectively. */
8748 if (size == 1)
8749 fixP->fx_signed = 1;
8750 }
8751
8752 static void
8753 output_interseg_jump (void)
8754 {
8755 char *p;
8756 int size;
8757 int prefix;
8758 int code16;
8759
8760 code16 = 0;
8761 if (flag_code == CODE_16BIT)
8762 code16 = CODE16;
8763
8764 prefix = 0;
8765 if (i.prefix[DATA_PREFIX] != 0)
8766 {
8767 prefix = 1;
8768 i.prefixes -= 1;
8769 code16 ^= CODE16;
8770 }
8771
8772 gas_assert (!i.prefix[REX_PREFIX]);
8773
8774 size = 4;
8775 if (code16)
8776 size = 2;
8777
8778 if (i.prefixes != 0)
8779 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8780
8781 if (now_seg == absolute_section)
8782 {
8783 abs_section_offset += prefix + 1 + 2 + size;
8784 return;
8785 }
8786
8787 /* 1 opcode; 2 segment; offset */
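  /* Illustrative (assumed) example: in 32-bit code "ljmp $0x8,$0x1000"
     emits ea 00 10 00 00 08 00 -- opcode, 4-byte offset, then the
     2-byte selector, matching the layout below.  */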
8788 p = frag_more (prefix + 1 + 2 + size);
8789
8790 if (i.prefix[DATA_PREFIX] != 0)
8791 *p++ = DATA_PREFIX_OPCODE;
8792
8793 if (i.prefix[REX_PREFIX] != 0)
8794 *p++ = i.prefix[REX_PREFIX];
8795
8796 *p++ = i.tm.base_opcode;
8797 if (i.op[1].imms->X_op == O_constant)
8798 {
8799 offsetT n = i.op[1].imms->X_add_number;
8800
8801 if (size == 2
8802 && !fits_in_unsigned_word (n)
8803 && !fits_in_signed_word (n))
8804 {
8805 as_bad (_("16-bit jump out of range"));
8806 return;
8807 }
8808 md_number_to_chars (p, n, size);
8809 }
8810 else
8811 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8812 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
8813
8814 p += size;
8815 if (i.op[0].imms->X_op == O_constant)
8816 md_number_to_chars (p, (valueT) i.op[0].imms->X_add_number, 2);
8817 else
8818 fix_new_exp (frag_now, p - frag_now->fr_literal, 2,
8819 i.op[0].imms, 0, reloc (2, 0, 0, i.reloc[0]));
8820 }
8821
8822 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8823 void
8824 x86_cleanup (void)
8825 {
8826 char *p;
8827 asection *seg = now_seg;
8828 subsegT subseg = now_subseg;
8829 asection *sec;
8830 unsigned int alignment, align_size_1;
8831 unsigned int isa_1_descsz, feature_2_descsz, descsz;
8832 unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8833 unsigned int padding;
8834
8835 if (!IS_ELF || !x86_used_note)
8836 return;
8837
8838 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8839
8840 /* The .note.gnu.property section layout:
8841
8842 Field Length Contents
8843 ---- ---- ----
8844 n_namsz 4 4
8845 n_descsz 4 The note descriptor size
8846 n_type 4 NT_GNU_PROPERTY_TYPE_0
8847 n_name 4 "GNU"
8848 n_desc n_descsz The program property array
8849 .... .... ....
8850 */
8851
8852 /* Create the .note.gnu.property section. */
8853 sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
8854 bfd_set_section_flags (sec,
8855 (SEC_ALLOC
8856 | SEC_LOAD
8857 | SEC_DATA
8858 | SEC_HAS_CONTENTS
8859 | SEC_READONLY));
8860
8861 if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8862 {
8863 align_size_1 = 7;
8864 alignment = 3;
8865 }
8866 else
8867 {
8868 align_size_1 = 3;
8869 alignment = 2;
8870 }
8871
8872 bfd_set_section_alignment (sec, alignment);
8873 elf_section_type (sec) = SHT_NOTE;
8874
8875 /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8876 + 4-byte data */
8877 isa_1_descsz_raw = 4 + 4 + 4;
8878 /* Align GNU_PROPERTY_X86_ISA_1_USED. */
8879 isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8880
8881 feature_2_descsz_raw = isa_1_descsz;
8882 /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8883 + 4-byte data */
8884 feature_2_descsz_raw += 4 + 4 + 4;
8885 /* Align GNU_PROPERTY_X86_FEATURE_2_USED. */
8886 feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8887 & ~align_size_1);
8888
8889 descsz = feature_2_descsz;
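  /* Worked example under the ELFCLASS64 assumption (align_size_1 == 7):
     each property is 4 + 4 + 4 == 12 bytes raw and pads to 16, so
     isa_1_descsz == 16, feature_2_descsz == 32 (16 + 12 rounded up to a
     multiple of 8), and the note is 16 bytes of header plus descsz.  */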
8890   /* Section size: n_namsz + n_descsz + n_type + n_name + n_desc. */
8891 p = frag_more (4 + 4 + 4 + 4 + descsz);
8892
8893 /* Write n_namsz. */
8894 md_number_to_chars (p, (valueT) 4, 4);
8895
8896 /* Write n_descsz. */
8897 md_number_to_chars (p + 4, (valueT) descsz, 4);
8898
8899 /* Write n_type. */
8900 md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8901
8902 /* Write n_name. */
8903 memcpy (p + 4 * 3, "GNU", 4);
8904
8905 /* Write 4-byte type. */
8906 md_number_to_chars (p + 4 * 4,
8907 (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8908
8909 /* Write 4-byte data size. */
8910 md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8911
8912 /* Write 4-byte data. */
8913 md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8914
8915   /* Zero out padding. */
8916 padding = isa_1_descsz - isa_1_descsz_raw;
8917 if (padding)
8918 memset (p + 4 * 7, 0, padding);
8919
8920 /* Write 4-byte type. */
8921 md_number_to_chars (p + isa_1_descsz + 4 * 4,
8922 (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8923
8924 /* Write 4-byte data size. */
8925 md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8926
8927 /* Write 4-byte data. */
8928 md_number_to_chars (p + isa_1_descsz + 4 * 6,
8929 (valueT) x86_feature_2_used, 4);
8930
8931   /* Zero out padding. */
8932 padding = feature_2_descsz - feature_2_descsz_raw;
8933 if (padding)
8934 memset (p + isa_1_descsz + 4 * 7, 0, padding);
8935
8936 /* We probably can't restore the current segment, for there likely
8937 isn't one yet... */
8938 if (seg && subseg)
8939 subseg_set (seg, subseg);
8940 }
8941 #endif
8942
8943 static unsigned int
8944 encoding_length (const fragS *start_frag, offsetT start_off,
8945 const char *frag_now_ptr)
8946 {
8947 unsigned int len = 0;
8948
8949 if (start_frag != frag_now)
8950 {
8951 const fragS *fr = start_frag;
8952
8953 do {
8954 len += fr->fr_fix;
8955 fr = fr->fr_next;
8956 } while (fr && fr != frag_now);
8957 }
8958
8959 return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8960 }
8961
8962 /* Return 1 for test, and, cmp, add, sub, inc and dec which may
8963 be macro-fused with conditional jumps.
8964    NB: If TEST/AND/CMP/ADD/SUB/INC/DEC uses a RIP-relative address,
8965    or has one of the following formats:
8966
8967 cmp m, imm
8968 add m, imm
8969 sub m, imm
8970 test m, imm
8971 and m, imm
8972 inc m
8973 dec m
8974
8975    it is not fusible. */
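/* For illustration (assumed examples): "cmp %rax,%rbx; jne label" is a
   candidate for macro-fusion, while "cmpl $1,(%rax); jne label" matches
   the "cmp m, imm" pattern above and is not.  */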
8976
8977 static int
8978 maybe_fused_with_jcc_p (enum mf_cmp_kind* mf_cmp_p)
8979 {
8980 /* No RIP address. */
8981 if (i.base_reg && i.base_reg->reg_num == RegIP)
8982 return 0;
8983
8984 /* No VEX/EVEX encoding. */
8985 if (is_any_vex_encoding (&i.tm))
8986 return 0;
8987
8988 /* add, sub without add/sub m, imm. */
8989 if (i.tm.base_opcode <= 5
8990 || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
8991 || ((i.tm.base_opcode | 3) == 0x83
8992 && (i.tm.extension_opcode == 0x5
8993 || i.tm.extension_opcode == 0x0)))
8994 {
8995 *mf_cmp_p = mf_cmp_alu_cmp;
8996 return !(i.mem_operands && i.imm_operands);
8997 }
8998
8999 /* and without and m, imm. */
9000 if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
9001 || ((i.tm.base_opcode | 3) == 0x83
9002 && i.tm.extension_opcode == 0x4))
9003 {
9004 *mf_cmp_p = mf_cmp_test_and;
9005 return !(i.mem_operands && i.imm_operands);
9006 }
9007
9008 /* test without test m imm. */
9009 if ((i.tm.base_opcode | 1) == 0x85
9010 || (i.tm.base_opcode | 1) == 0xa9
9011 || ((i.tm.base_opcode | 1) == 0xf7
9012 && i.tm.extension_opcode == 0))
9013 {
9014 *mf_cmp_p = mf_cmp_test_and;
9015 return !(i.mem_operands && i.imm_operands);
9016 }
9017
9018 /* cmp without cmp m, imm. */
9019 if ((i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
9020 || ((i.tm.base_opcode | 3) == 0x83
9021 && (i.tm.extension_opcode == 0x7)))
9022 {
9023 *mf_cmp_p = mf_cmp_alu_cmp;
9024 return !(i.mem_operands && i.imm_operands);
9025 }
9026
9027 /* inc, dec without inc/dec m. */
9028 if ((i.tm.cpu_flags.bitfield.cpuno64
9029 && (i.tm.base_opcode | 0xf) == 0x4f)
9030 || ((i.tm.base_opcode | 1) == 0xff
9031 && i.tm.extension_opcode <= 0x1))
9032 {
9033 *mf_cmp_p = mf_cmp_incdec;
9034 return !i.mem_operands;
9035 }
9036
9037 return 0;
9038 }
9039
9040 /* Return 1 if a FUSED_JCC_PADDING frag should be generated. */
9041
9042 static int
9043 add_fused_jcc_padding_frag_p (enum mf_cmp_kind* mf_cmp_p)
9044 {
9045   /* NB: This doesn't work with COND_JUMP86 without i386. */
9046 if (!align_branch_power
9047 || now_seg == absolute_section
9048 || !cpu_arch_flags.bitfield.cpui386
9049 || !(align_branch & align_branch_fused_bit))
9050 return 0;
9051
9052 if (maybe_fused_with_jcc_p (mf_cmp_p))
9053 {
9054 if (last_insn.kind == last_insn_other
9055 || last_insn.seg != now_seg)
9056 return 1;
9057 if (flag_debug)
9058 as_warn_where (last_insn.file, last_insn.line,
9059 _("`%s` skips -malign-branch-boundary on `%s`"),
9060 last_insn.name, i.tm.name);
9061 }
9062
9063 return 0;
9064 }
9065
9066 /* Return 1 if a BRANCH_PREFIX frag should be generated. */
9067
9068 static int
9069 add_branch_prefix_frag_p (void)
9070 {
9071   /* NB: This doesn't work with COND_JUMP86 without i386. Don't add a
9072      prefix to PadLock instructions since they include prefixes in the opcode. */
9073 if (!align_branch_power
9074 || !align_branch_prefix_size
9075 || now_seg == absolute_section
9076 || i.tm.cpu_flags.bitfield.cpupadlock
9077 || !cpu_arch_flags.bitfield.cpui386)
9078 return 0;
9079
9080   /* Don't add a prefix if the insn itself is a prefix, or if there is
9081      no operand, in case the segment prefix is special. */
9082 if (!i.operands || i.tm.opcode_modifier.isprefix)
9083 return 0;
9084
9085 if (last_insn.kind == last_insn_other
9086 || last_insn.seg != now_seg)
9087 return 1;
9088
9089 if (flag_debug)
9090 as_warn_where (last_insn.file, last_insn.line,
9091 _("`%s` skips -malign-branch-boundary on `%s`"),
9092 last_insn.name, i.tm.name);
9093
9094 return 0;
9095 }
9096
9097 /* Return 1 if a BRANCH_PADDING frag should be generated. */
9098
9099 static int
9100 add_branch_padding_frag_p (enum align_branch_kind *branch_p,
9101 enum mf_jcc_kind *mf_jcc_p)
9102 {
9103 int add_padding;
9104
9105   /* NB: This doesn't work with COND_JUMP86 without i386. */
9106 if (!align_branch_power
9107 || now_seg == absolute_section
9108 || !cpu_arch_flags.bitfield.cpui386)
9109 return 0;
9110
9111 add_padding = 0;
9112
9113 /* Check for jcc and direct jmp. */
9114 if (i.tm.opcode_modifier.jump == JUMP)
9115 {
9116 if (i.tm.base_opcode == JUMP_PC_RELATIVE)
9117 {
9118 *branch_p = align_branch_jmp;
9119 add_padding = align_branch & align_branch_jmp_bit;
9120 }
9121 else
9122 {
9123 	  /* Because J<cc> and JN<cc> share the same group in the
9124 	     macro-fusible table, ignore the lowest bit. */
9125 *mf_jcc_p = (i.tm.base_opcode & 0x0e) >> 1;
9126 *branch_p = align_branch_jcc;
9127 if ((align_branch & align_branch_jcc_bit))
9128 add_padding = 1;
9129 }
9130 }
9131 else if (is_any_vex_encoding (&i.tm))
9132 return 0;
9133 else if ((i.tm.base_opcode | 1) == 0xc3)
9134 {
9135 /* Near ret. */
9136 *branch_p = align_branch_ret;
9137 if ((align_branch & align_branch_ret_bit))
9138 add_padding = 1;
9139 }
9140 else
9141 {
9142 /* Check for indirect jmp, direct and indirect calls. */
9143 if (i.tm.base_opcode == 0xe8)
9144 {
9145 /* Direct call. */
9146 *branch_p = align_branch_call;
9147 if ((align_branch & align_branch_call_bit))
9148 add_padding = 1;
9149 }
9150 else if (i.tm.base_opcode == 0xff
9151 && (i.tm.extension_opcode == 2
9152 || i.tm.extension_opcode == 4))
9153 {
9154 /* Indirect call and jmp. */
9155 *branch_p = align_branch_indirect;
9156 if ((align_branch & align_branch_indirect_bit))
9157 add_padding = 1;
9158 }
9159
9160 if (add_padding
9161 && i.disp_operands
9162 && tls_get_addr
9163 && (i.op[0].disps->X_op == O_symbol
9164 || (i.op[0].disps->X_op == O_subtract
9165 && i.op[0].disps->X_op_symbol == GOT_symbol)))
9166 {
9167 symbolS *s = i.op[0].disps->X_add_symbol;
9168 /* No padding to call to global or undefined tls_get_addr. */
9169 if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
9170 && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
9171 return 0;
9172 }
9173 }
9174
9175 if (add_padding
9176 && last_insn.kind != last_insn_other
9177 && last_insn.seg == now_seg)
9178 {
9179 if (flag_debug)
9180 as_warn_where (last_insn.file, last_insn.line,
9181 _("`%s` skips -malign-branch-boundary on `%s`"),
9182 last_insn.name, i.tm.name);
9183 return 0;
9184 }
9185
9186 return add_padding;
9187 }
9188
9189 static void
9190 output_insn (void)
9191 {
9192 fragS *insn_start_frag;
9193 offsetT insn_start_off;
9194 fragS *fragP = NULL;
9195 enum align_branch_kind branch = align_branch_none;
9196   /* The initializer is arbitrary, just to avoid an uninitialized-use
9197      warning. It's actually either assigned in add_branch_padding_frag_p
9198      or never used. */
9199 enum mf_jcc_kind mf_jcc = mf_jcc_jo;
9200
9201 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9202 if (IS_ELF && x86_used_note && now_seg != absolute_section)
9203 {
9204 if ((i.xstate & xstate_tmm) == xstate_tmm
9205 || i.tm.cpu_flags.bitfield.cpuamx_tile)
9206 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_TMM;
9207
9208 if (i.tm.cpu_flags.bitfield.cpu8087
9209 || i.tm.cpu_flags.bitfield.cpu287
9210 || i.tm.cpu_flags.bitfield.cpu387
9211 || i.tm.cpu_flags.bitfield.cpu687
9212 || i.tm.cpu_flags.bitfield.cpufisttp)
9213 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
9214
9215 if ((i.xstate & xstate_mmx)
9216 || i.tm.base_opcode == 0xf77 /* emms */
9217 || i.tm.base_opcode == 0xf0e /* femms */)
9218 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
9219
9220 if (i.index_reg)
9221 {
9222 if (i.index_reg->reg_type.bitfield.zmmword)
9223 i.xstate |= xstate_zmm;
9224 else if (i.index_reg->reg_type.bitfield.ymmword)
9225 i.xstate |= xstate_ymm;
9226 else if (i.index_reg->reg_type.bitfield.xmmword)
9227 i.xstate |= xstate_xmm;
9228 }
9229
9230 /* vzeroall / vzeroupper */
9231 if (i.tm.base_opcode == 0x77 && i.tm.cpu_flags.bitfield.cpuavx)
9232 i.xstate |= xstate_ymm;
9233
9234 if ((i.xstate & xstate_xmm)
9235 /* ldmxcsr / stmxcsr */
9236 || (i.tm.base_opcode == 0xfae && i.tm.cpu_flags.bitfield.cpusse)
9237 /* vldmxcsr / vstmxcsr */
9238 || (i.tm.base_opcode == 0xae && i.tm.cpu_flags.bitfield.cpuavx)
9239 || i.tm.cpu_flags.bitfield.cpuwidekl
9240 || i.tm.cpu_flags.bitfield.cpukl)
9241 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
9242
9243 if ((i.xstate & xstate_ymm) == xstate_ymm)
9244 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
9245 if ((i.xstate & xstate_zmm) == xstate_zmm)
9246 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
9247 if (i.mask || (i.xstate & xstate_mask) == xstate_mask)
9248 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MASK;
9249 if (i.tm.cpu_flags.bitfield.cpufxsr)
9250 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
9251 if (i.tm.cpu_flags.bitfield.cpuxsave)
9252 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
9253 if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
9254 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
9255 if (i.tm.cpu_flags.bitfield.cpuxsavec)
9256 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
9257
9258 if (x86_feature_2_used
9259 || i.tm.cpu_flags.bitfield.cpucmov
9260 || i.tm.cpu_flags.bitfield.cpusyscall
9261 || (i.tm.base_opcode == 0xfc7
9262 && i.tm.opcode_modifier.opcodeprefix == 0
9263 && i.tm.extension_opcode == 1) /* cmpxchg8b */)
9264 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_BASELINE;
9265 if (i.tm.cpu_flags.bitfield.cpusse3
9266 || i.tm.cpu_flags.bitfield.cpussse3
9267 || i.tm.cpu_flags.bitfield.cpusse4_1
9268 || i.tm.cpu_flags.bitfield.cpusse4_2
9269 || i.tm.cpu_flags.bitfield.cpucx16
9270 || i.tm.cpu_flags.bitfield.cpupopcnt
9271 /* LAHF-SAHF insns in 64-bit mode. */
9272 || (flag_code == CODE_64BIT
9273 && (i.tm.base_opcode | 1) == 0x9f))
9274 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_V2;
9275 if (i.tm.cpu_flags.bitfield.cpuavx
9276 || i.tm.cpu_flags.bitfield.cpuavx2
9277 	  /* Any VEX encoded insns except for CpuAVX512F, CpuAVX512BW,
9278 	     CpuAVX512DQ, LWP, TBM and AMX. */
9279 || (i.tm.opcode_modifier.vex
9280 && !i.tm.cpu_flags.bitfield.cpuavx512f
9281 && !i.tm.cpu_flags.bitfield.cpuavx512bw
9282 && !i.tm.cpu_flags.bitfield.cpuavx512dq
9283 && !i.tm.cpu_flags.bitfield.cpulwp
9284 && !i.tm.cpu_flags.bitfield.cputbm
9285 && !(x86_feature_2_used & GNU_PROPERTY_X86_FEATURE_2_TMM))
9286 || i.tm.cpu_flags.bitfield.cpuf16c
9287 || i.tm.cpu_flags.bitfield.cpufma
9288 || i.tm.cpu_flags.bitfield.cpulzcnt
9289 || i.tm.cpu_flags.bitfield.cpumovbe
9290 || i.tm.cpu_flags.bitfield.cpuxsaves
9291 || (x86_feature_2_used
9292 & (GNU_PROPERTY_X86_FEATURE_2_XSAVE
9293 | GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT
9294 | GNU_PROPERTY_X86_FEATURE_2_XSAVEC)) != 0)
9295 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_V3;
9296 if (i.tm.cpu_flags.bitfield.cpuavx512f
9297 || i.tm.cpu_flags.bitfield.cpuavx512bw
9298 || i.tm.cpu_flags.bitfield.cpuavx512dq
9299 || i.tm.cpu_flags.bitfield.cpuavx512vl
9300 /* Any EVEX encoded insns except for AVX512ER, AVX512PF and
9301 VNNIW. */
9302 || (i.tm.opcode_modifier.evex
9303 && !i.tm.cpu_flags.bitfield.cpuavx512er
9304 && !i.tm.cpu_flags.bitfield.cpuavx512pf
9305 && !i.tm.cpu_flags.bitfield.cpuavx512_4vnniw))
9306 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_V4;
9307 }
9308 #endif
9309
9310 /* Tie dwarf2 debug info to the address at the start of the insn.
9311 We can't do this after the insn has been output as the current
9312      frag may have been closed off, e.g. by frag_var. */
9313 dwarf2_emit_insn (0);
9314
9315 insn_start_frag = frag_now;
9316 insn_start_off = frag_now_fix ();
9317
9318 if (add_branch_padding_frag_p (&branch, &mf_jcc))
9319 {
9320 char *p;
9321 /* Branch can be 8 bytes. Leave some room for prefixes. */
9322 unsigned int max_branch_padding_size = 14;
9323
9324 /* Align section to boundary. */
9325 record_alignment (now_seg, align_branch_power);
9326
9327 /* Make room for padding. */
9328 frag_grow (max_branch_padding_size);
9329
9330 /* Start of the padding. */
9331 p = frag_more (0);
9332
9333 fragP = frag_now;
9334
9335 frag_var (rs_machine_dependent, max_branch_padding_size, 0,
9336 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
9337 NULL, 0, p);
9338
9339 fragP->tc_frag_data.mf_type = mf_jcc;
9340 fragP->tc_frag_data.branch_type = branch;
9341 fragP->tc_frag_data.max_bytes = max_branch_padding_size;
9342 }
9343
9344 /* Output jumps. */
9345 if (i.tm.opcode_modifier.jump == JUMP)
9346 output_branch ();
9347 else if (i.tm.opcode_modifier.jump == JUMP_BYTE
9348 || i.tm.opcode_modifier.jump == JUMP_DWORD)
9349 output_jump ();
9350 else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
9351 output_interseg_jump ();
9352 else
9353 {
9354 /* Output normal instructions here. */
9355 char *p;
9356 unsigned char *q;
9357 unsigned int j;
9358 enum mf_cmp_kind mf_cmp;
9359
9360 if (avoid_fence
9361 && (i.tm.base_opcode == 0xfaee8
9362 || i.tm.base_opcode == 0xfaef0
9363 || i.tm.base_opcode == 0xfaef8))
9364 {
9365 /* Encode lfence, mfence, and sfence as
9366 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
9367 if (now_seg != absolute_section)
9368 {
9369 offsetT val = 0x240483f0ULL;
9370
9371 p = frag_more (5);
9372 md_number_to_chars (p, val, 5);
9373 }
9374 else
9375 abs_section_offset += 5;
9376 return;
9377 }
9378
9379       /* Some processors fail on the LOCK prefix. This option makes the
9380 	 assembler ignore the LOCK prefix and serves as a workaround. */
9381 if (omit_lock_prefix)
9382 {
9383 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
9384 return;
9385 i.prefix[LOCK_PREFIX] = 0;
9386 }
9387
9388 if (branch)
9389 /* Skip if this is a branch. */
9390 ;
9391 else if (add_fused_jcc_padding_frag_p (&mf_cmp))
9392 {
9393 /* Make room for padding. */
9394 frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
9395 p = frag_more (0);
9396
9397 fragP = frag_now;
9398
9399 frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
9400 ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
9401 NULL, 0, p);
9402
9403 fragP->tc_frag_data.mf_type = mf_cmp;
9404 fragP->tc_frag_data.branch_type = align_branch_fused;
9405 fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
9406 }
9407 else if (add_branch_prefix_frag_p ())
9408 {
9409 unsigned int max_prefix_size = align_branch_prefix_size;
9410
9411 /* Make room for padding. */
9412 frag_grow (max_prefix_size);
9413 p = frag_more (0);
9414
9415 fragP = frag_now;
9416
9417 frag_var (rs_machine_dependent, max_prefix_size, 0,
9418 ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
9419 NULL, 0, p);
9420
9421 fragP->tc_frag_data.max_bytes = max_prefix_size;
9422 }
9423
9424 /* Since the VEX/EVEX prefix contains the implicit prefix, we
9425 don't need the explicit prefix. */
9426 if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
9427 {
9428 switch (i.tm.opcode_modifier.opcodeprefix)
9429 {
9430 case PREFIX_0X66:
9431 add_prefix (0x66);
9432 break;
9433 case PREFIX_0XF2:
9434 add_prefix (0xf2);
9435 break;
9436 case PREFIX_0XF3:
9437 if (!i.tm.cpu_flags.bitfield.cpupadlock
9438 || (i.prefix[REP_PREFIX] != 0xf3))
9439 add_prefix (0xf3);
9440 break;
9441 case PREFIX_NONE:
9442 switch (i.tm.opcode_length)
9443 {
9444 case 3:
9445 case 2:
9446 case 1:
9447 break;
9448 case 0:
9449 /* Check for pseudo prefixes. */
9450 as_bad_where (insn_start_frag->fr_file,
9451 insn_start_frag->fr_line,
9452 _("pseudo prefix without instruction"));
9453 return;
9454 default:
9455 abort ();
9456 }
9457 break;
9458 default:
9459 abort ();
9460 }
9461
9462 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
9463 /* For x32, add a dummy REX_OPCODE prefix for mov/add with
9464 R_X86_64_GOTTPOFF relocation so that linker can safely
9465 perform IE->LE optimization. A dummy REX_OPCODE prefix
9466 is also needed for lea with R_X86_64_GOTPC32_TLSDESC
9467 relocation for GDesc -> IE/LE optimization. */
9468 if (x86_elf_abi == X86_64_X32_ABI
9469 && i.operands == 2
9470 && (i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
9471 || i.reloc[0] == BFD_RELOC_X86_64_GOTPC32_TLSDESC)
9472 && i.prefix[REX_PREFIX] == 0)
9473 add_prefix (REX_OPCODE);
9474 #endif
9475
9476 /* The prefix bytes. */
9477 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
9478 if (*q)
9479 frag_opcode_byte (*q);
9480 }
9481 else
9482 {
9483 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
9484 if (*q)
9485 switch (j)
9486 {
9487 case SEG_PREFIX:
9488 case ADDR_PREFIX:
9489 frag_opcode_byte (*q);
9490 break;
9491 default:
9492 /* There should be no other prefixes for instructions
9493 with VEX prefix. */
9494 abort ();
9495 }
9496
9497 /* For EVEX instructions i.vrex should become 0 after
9498 build_evex_prefix. For VEX instructions upper 16 registers
9499 aren't available, so VREX should be 0. */
9500 if (i.vrex)
9501 abort ();
9502 /* Now the VEX prefix. */
9503 if (now_seg != absolute_section)
9504 {
9505 p = frag_more (i.vex.length);
9506 for (j = 0; j < i.vex.length; j++)
9507 p[j] = i.vex.bytes[j];
9508 }
9509 else
9510 abs_section_offset += i.vex.length;
9511 }
9512
9513 /* Now the opcode; be careful about word order here! */
9514 if (now_seg == absolute_section)
9515 abs_section_offset += i.tm.opcode_length;
9516 else if (i.tm.opcode_length == 1)
9517 {
9518 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
9519 }
9520 else
9521 {
9522 switch (i.tm.opcode_length)
9523 {
9524 case 4:
9525 p = frag_more (4);
9526 *p++ = (i.tm.base_opcode >> 24) & 0xff;
9527 *p++ = (i.tm.base_opcode >> 16) & 0xff;
9528 break;
9529 case 3:
9530 p = frag_more (3);
9531 *p++ = (i.tm.base_opcode >> 16) & 0xff;
9532 break;
9533 case 2:
9534 p = frag_more (2);
9535 break;
9536 default:
9537 abort ();
9538 break;
9539 }
9540
9541 /* Put out high byte first: can't use md_number_to_chars! */
9542 *p++ = (i.tm.base_opcode >> 8) & 0xff;
9543 *p = i.tm.base_opcode & 0xff;
9544 }
9545
9546 /* Now the modrm byte and sib byte (if present). */
9547 if (i.tm.opcode_modifier.modrm)
9548 {
9549 frag_opcode_byte ((i.rm.regmem << 0)
9550 | (i.rm.reg << 3)
9551 | (i.rm.mode << 6));
9552 /* If i.rm.regmem == ESP (4)
9553 && i.rm.mode != (Register mode)
9554 && not 16 bit
9555 ==> need second modrm byte. */
9556 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
9557 && i.rm.mode != 3
9558 && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
9559 frag_opcode_byte ((i.sib.base << 0)
9560 | (i.sib.index << 3)
9561 | (i.sib.scale << 6));
9562 }
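      /* Illustrative (assumed) encoding: "movl %eax, 4(%rbx,%rcx,2)"
	 emits 89 44 4b 04 -- ModRM 0x44 (mode 1, reg 0, regmem 4 ==
	 SIB escape) and SIB 0x4b (scale 1, index 1, base 3), followed
	 by the disp8.  */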
9563
9564 if (i.disp_operands)
9565 output_disp (insn_start_frag, insn_start_off);
9566
9567 if (i.imm_operands)
9568 output_imm (insn_start_frag, insn_start_off);
9569
9570 /*
9571 * frag_now_fix () returning plain abs_section_offset when we're in the
9572 * absolute section, and abs_section_offset not getting updated as data
9573 * gets added to the frag breaks the logic below.
9574 */
9575 if (now_seg != absolute_section)
9576 {
9577 j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
9578 if (j > 15)
9579 as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
9580 j);
9581 else if (fragP)
9582 {
9583 /* NB: Don't add prefix with GOTPC relocation since
9584 output_disp() above depends on the fixed encoding
9585 length. Can't add prefix with TLS relocation since
9586 it breaks TLS linker optimization. */
9587 unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
9588 /* Prefix count on the current instruction. */
9589 unsigned int count = i.vex.length;
9590 unsigned int k;
9591 for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
9592 /* REX byte is encoded in VEX/EVEX prefix. */
9593 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
9594 count++;
9595
9596 /* Count prefixes for extended opcode maps. */
9597 if (!i.vex.length)
9598 switch (i.tm.opcode_length)
9599 {
9600 case 3:
9601 if (((i.tm.base_opcode >> 16) & 0xff) == 0xf)
9602 {
9603 count++;
9604 switch ((i.tm.base_opcode >> 8) & 0xff)
9605 {
9606 case 0x38:
9607 case 0x3a:
9608 count++;
9609 break;
9610 default:
9611 break;
9612 }
9613 }
9614 break;
9615 case 2:
9616 if (((i.tm.base_opcode >> 8) & 0xff) == 0xf)
9617 count++;
9618 break;
9619 case 1:
9620 break;
9621 default:
9622 abort ();
9623 }
9624
9625 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
9626 == BRANCH_PREFIX)
9627 {
9628 /* Set the maximum prefix size in BRANCH_PREFIX
9629 frag. */
9630 if (fragP->tc_frag_data.max_bytes > max)
9631 fragP->tc_frag_data.max_bytes = max;
9632 if (fragP->tc_frag_data.max_bytes > count)
9633 fragP->tc_frag_data.max_bytes -= count;
9634 else
9635 fragP->tc_frag_data.max_bytes = 0;
9636 }
9637 else
9638 {
9639 /* Remember the maximum prefix size in FUSED_JCC_PADDING
9640 frag. */
9641 unsigned int max_prefix_size;
9642 if (align_branch_prefix_size > max)
9643 max_prefix_size = max;
9644 else
9645 max_prefix_size = align_branch_prefix_size;
9646 if (max_prefix_size > count)
9647 fragP->tc_frag_data.max_prefix_length
9648 = max_prefix_size - count;
9649 }
9650
9651 /* Use existing segment prefix if possible. Use CS
9652 segment prefix in 64-bit mode. In 32-bit mode, use SS
9653 segment prefix with ESP/EBP base register and use DS
9654 segment prefix without ESP/EBP base register. */
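/* The prefix bytes in question are 0x2e (CS), 0x36 (SS) and 0x3e
(DS).  In 64-bit mode segment prefixes are ignored for memory
addressing, which makes CS a safe one-byte filler.  */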
9655 if (i.prefix[SEG_PREFIX])
9656 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
9657 else if (flag_code == CODE_64BIT)
9658 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
9659 else if (i.base_reg
9660 && (i.base_reg->reg_num == 4
9661 || i.base_reg->reg_num == 5))
9662 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
9663 else
9664 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
9665 }
9666 }
9667 }
9668
9669 /* NB: Doesn't work with COND_JUMP86 without i386. */
9670 if (align_branch_power
9671 && now_seg != absolute_section
9672 && cpu_arch_flags.bitfield.cpui386)
9673 {
9674 /* Terminate each frag so that we can add prefix and check for
9675 fused jcc. */
9676 frag_wane (frag_now);
9677 frag_new (0);
9678 }
9679
9680 #ifdef DEBUG386
9681 if (flag_debug)
9682 {
9683 pi ("" /*line*/, &i);
9684 }
9685 #endif /* DEBUG386 */
9686 }
9687
9688 /* Return the size of the displacement operand N. */
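/* E.g. the 4 in "movl 4(%ebp), %eax" normally ends up as a Disp8
operand, giving a size of 1; an unannotated 32-bit displacement
gives the default of 4.  */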
9689
9690 static int
9691 disp_size (unsigned int n)
9692 {
9693 int size = 4;
9694
9695 if (i.types[n].bitfield.disp64)
9696 size = 8;
9697 else if (i.types[n].bitfield.disp8)
9698 size = 1;
9699 else if (i.types[n].bitfield.disp16)
9700 size = 2;
9701 return size;
9702 }
9703
9704 /* Return the size of the immediate operand N. */
9705
9706 static int
9707 imm_size (unsigned int n)
9708 {
9709 int size = 4;
9710 if (i.types[n].bitfield.imm64)
9711 size = 8;
9712 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
9713 size = 1;
9714 else if (i.types[n].bitfield.imm16)
9715 size = 2;
9716 return size;
9717 }
9718
9719 static void
9720 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
9721 {
9722 char *p;
9723 unsigned int n;
9724
9725 for (n = 0; n < i.operands; n++)
9726 {
9727 if (operand_type_check (i.types[n], disp))
9728 {
9729 int size = disp_size (n);
9730
9731 if (now_seg == absolute_section)
9732 abs_section_offset += size;
9733 else if (i.op[n].disps->X_op == O_constant)
9734 {
9735 offsetT val = i.op[n].disps->X_add_number;
9736
9737 val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
9738 size);
9739 p = frag_more (size);
9740 md_number_to_chars (p, val, size);
9741 }
9742 else
9743 {
9744 enum bfd_reloc_code_real reloc_type;
9745 int sign = i.types[n].bitfield.disp32s;
9746 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
9747 fixS *fixP;
9748
9749 /* We can't have 8 bit displacement here. */
9750 gas_assert (!i.types[n].bitfield.disp8);
9751
9752 /* The PC relative address is computed relative
9753 to the instruction boundary, so in case immediate
9754 fields follow, we need to adjust the value. */
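/* E.g. for "testl $0x12345678, foo(%rip)" the 4-byte immediate
follows the displacement field, so 4 is subtracted below to make
the displacement relative to the end of the instruction.  */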
9755 if (pcrel && i.imm_operands)
9756 {
9757 unsigned int n1;
9758 int sz = 0;
9759
9760 for (n1 = 0; n1 < i.operands; n1++)
9761 if (operand_type_check (i.types[n1], imm))
9762 {
9763 /* Only one immediate is allowed for PC
9764 relative address. */
9765 gas_assert (sz == 0);
9766 sz = imm_size (n1);
9767 i.op[n].disps->X_add_number -= sz;
9768 }
9769 /* We should find the immediate. */
9770 gas_assert (sz != 0);
9771 }
9772
9773 p = frag_more (size);
9774 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
9775 if (GOT_symbol
9776 && GOT_symbol == i.op[n].disps->X_add_symbol
9777 && (((reloc_type == BFD_RELOC_32
9778 || reloc_type == BFD_RELOC_X86_64_32S
9779 || (reloc_type == BFD_RELOC_64
9780 && object_64bit))
9781 && (i.op[n].disps->X_op == O_symbol
9782 || (i.op[n].disps->X_op == O_add
9783 && ((symbol_get_value_expression
9784 (i.op[n].disps->X_op_symbol)->X_op)
9785 == O_subtract))))
9786 || reloc_type == BFD_RELOC_32_PCREL))
9787 {
9788 if (!object_64bit)
9789 {
9790 reloc_type = BFD_RELOC_386_GOTPC;
9791 i.has_gotpc_tls_reloc = TRUE;
9792 i.op[n].imms->X_add_number +=
9793 encoding_length (insn_start_frag, insn_start_off, p);
9794 }
9795 else if (reloc_type == BFD_RELOC_64)
9796 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9797 else
9798 /* Don't do the adjustment for x86-64, as there
9799 the pcrel addressing is relative to the _next_
9800 insn, and that is taken care of in other code. */
9801 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9802 }
9803 else if (align_branch_power)
9804 {
9805 switch (reloc_type)
9806 {
9807 case BFD_RELOC_386_TLS_GD:
9808 case BFD_RELOC_386_TLS_LDM:
9809 case BFD_RELOC_386_TLS_IE:
9810 case BFD_RELOC_386_TLS_IE_32:
9811 case BFD_RELOC_386_TLS_GOTIE:
9812 case BFD_RELOC_386_TLS_GOTDESC:
9813 case BFD_RELOC_386_TLS_DESC_CALL:
9814 case BFD_RELOC_X86_64_TLSGD:
9815 case BFD_RELOC_X86_64_TLSLD:
9816 case BFD_RELOC_X86_64_GOTTPOFF:
9817 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9818 case BFD_RELOC_X86_64_TLSDESC_CALL:
9819 i.has_gotpc_tls_reloc = TRUE;
9820 default:
9821 break;
9822 }
9823 }
9824 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
9825 size, i.op[n].disps, pcrel,
9826 reloc_type);
9827 /* Check for "call/jmp *mem", "mov mem, %reg",
9828 "test %reg, mem" and "binop mem, %reg" where binop
9829 is one of the adc, add, and, cmp, or, sbb, sub or xor
9830 instructions, without a data prefix. Always generate
9831 R_386_GOT32X for "sym*GOT" operand in 32-bit mode. */
9832 if (i.prefix[DATA_PREFIX] == 0
9833 && (generate_relax_relocations
9834 || (!object_64bit
9835 && i.rm.mode == 0
9836 && i.rm.regmem == 5))
9837 && (i.rm.mode == 2
9838 || (i.rm.mode == 0 && i.rm.regmem == 5))
9839 && !is_any_vex_encoding(&i.tm)
9840 && ((i.operands == 1
9841 && i.tm.base_opcode == 0xff
9842 && (i.rm.reg == 2 || i.rm.reg == 4))
9843 || (i.operands == 2
9844 && (i.tm.base_opcode == 0x8b
9845 || i.tm.base_opcode == 0x85
9846 || (i.tm.base_opcode & ~0x38) == 0x03))))
9847 {
9848 if (object_64bit)
9849 {
9850 fixP->fx_tcbit = i.rex != 0;
9851 if (i.base_reg
9852 && (i.base_reg->reg_num == RegIP))
9853 fixP->fx_tcbit2 = 1;
9854 }
9855 else
9856 fixP->fx_tcbit2 = 1;
9857 }
9858 }
9859 }
9860 }
9861 }
9862
9863 static void
9864 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
9865 {
9866 char *p;
9867 unsigned int n;
9868
9869 for (n = 0; n < i.operands; n++)
9870 {
9871 /* Skip the SAE/RC Imm operand in EVEX. It is already handled. */
9872 if (i.rounding && (int) n == i.rounding->operand)
9873 continue;
9874
9875 if (operand_type_check (i.types[n], imm))
9876 {
9877 int size = imm_size (n);
9878
9879 if (now_seg == absolute_section)
9880 abs_section_offset += size;
9881 else if (i.op[n].imms->X_op == O_constant)
9882 {
9883 offsetT val;
9884
9885 val = offset_in_range (i.op[n].imms->X_add_number,
9886 size);
9887 p = frag_more (size);
9888 md_number_to_chars (p, val, size);
9889 }
9890 else
9891 {
9892 /* Not absolute_section.
9893 Need a 32-bit fixup (don't support 8bit
9894 non-absolute imms). Try to support other
9895 sizes ... */
9896 enum bfd_reloc_code_real reloc_type;
9897 int sign;
9898
9899 if (i.types[n].bitfield.imm32s
9900 && (i.suffix == QWORD_MNEM_SUFFIX
9901 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
9902 sign = 1;
9903 else
9904 sign = 0;
9905
9906 p = frag_more (size);
9907 reloc_type = reloc (size, 0, sign, i.reloc[n]);
9908
9909 /* This is tough to explain. We end up with this one if we
9910 * have operands that look like
9911 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
9912 * obtain the absolute address of the GOT, and it is strongly
9913 * preferable from a performance point of view to avoid using
9914 * a runtime relocation for this. The actual sequence of
9915 * instructions often look something like:
9916 *
9917 * call .L66
9918 * .L66:
9919 * popl %ebx
9920 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
9921 *
9922 * The call and pop essentially return the absolute address
9923 * of the label .L66 and store it in %ebx. The linker itself
9924 * will ultimately change the first operand of the addl so
9925 * that %ebx points to the GOT, but to keep things simple, the
9926 * .o file must have this operand set so that it generates not
9927 * the absolute address of .L66, but the absolute address of
9928 * itself. This allows the linker to simply treat a GOTPC
9929 * relocation as asking for a pcrel offset to the GOT to be
9930 * added in, and the addend of the relocation is stored in the
9931 * operand field for the instruction itself.
9932 *
9933 * Our job here is to fix the operand so that it would add
9934 * the correct offset so that %ebx would point to itself. The
9935 * thing that is tricky is that .-.L66 will point to the
9936 * beginning of the instruction, so we need to further modify
9937 * the operand so that it will point to itself. There are
9938 * other cases where you have something like:
9939 *
9940 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
9941 *
9942 * and here no correction would be required. Internally in
9943 * the assembler we treat operands of this form as not being
9944 * pcrel since the '.' is explicitly mentioned, and I wonder
9945 * whether it would simplify matters to do it this way. Who
9946 * knows. In earlier versions of the PIC patches, the
9947 * pcrel_adjust field was used to store the correction, but
9948 * since the expression is not pcrel, I felt it would be
9949 * confusing to do it this way. */
9950
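/* Illustrative bytes: "addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx"
assembles to 81 c3 <imm32>; the immediate starts 2 bytes into the
instruction, so 2 gets added to the addend below and the operand
then describes the address of the immediate field itself rather
than that of .L66.  */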
9951 if ((reloc_type == BFD_RELOC_32
9952 || reloc_type == BFD_RELOC_X86_64_32S
9953 || reloc_type == BFD_RELOC_64)
9954 && GOT_symbol
9955 && GOT_symbol == i.op[n].imms->X_add_symbol
9956 && (i.op[n].imms->X_op == O_symbol
9957 || (i.op[n].imms->X_op == O_add
9958 && ((symbol_get_value_expression
9959 (i.op[n].imms->X_op_symbol)->X_op)
9960 == O_subtract))))
9961 {
9962 if (!object_64bit)
9963 reloc_type = BFD_RELOC_386_GOTPC;
9964 else if (size == 4)
9965 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9966 else if (size == 8)
9967 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9968 i.has_gotpc_tls_reloc = TRUE;
9969 i.op[n].imms->X_add_number +=
9970 encoding_length (insn_start_frag, insn_start_off, p);
9971 }
9972 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9973 i.op[n].imms, 0, reloc_type);
9974 }
9975 }
9976 }
9977 }
9978 \f
9979 /* x86_cons_fix_new is called via the expression parsing code when a
9980 reloc is needed. We use this hook to get the correct .got reloc. */
9981 static int cons_sign = -1;
9982
9983 void
9984 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
9985 expressionS *exp, bfd_reloc_code_real_type r)
9986 {
9987 r = reloc (len, 0, cons_sign, r);
9988
9989 #ifdef TE_PE
9990 if (exp->X_op == O_secrel)
9991 {
9992 exp->X_op = O_symbol;
9993 r = BFD_RELOC_32_SECREL;
9994 }
9995 #endif
9996
9997 fix_new_exp (frag, off, len, exp, 0, r);
9998 }
9999
10000 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
10001 purpose of the `.dc.a' internal pseudo-op. */
10002
10003 int
10004 x86_address_bytes (void)
10005 {
10006 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
10007 return 4;
10008 return stdoutput->arch_info->bits_per_address / 8;
10009 }
10010
10011 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
10012 || defined (LEX_AT)
10013 # define lex_got(reloc, adjust, types) NULL
10014 #else
10015 /* Parse operands of the form
10016 <symbol>@GOTOFF+<nnn>
10017 and similar .plt or .got references.
10018
10019 If we find one, set up the correct relocation in RELOC and copy the
10020 input string, minus the `@GOTOFF' into a malloc'd buffer for
10021 parsing by the calling routine. Return this buffer, and if ADJUST
10022 is non-null set it to the length of the string we removed from the
10023 input line. Otherwise return NULL. */
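/* For instance, "foo@GOTOFF+4" in 32-bit mode sets
BFD_RELOC_386_GOTOFF, returns the buffer "foo +4" (the reloc
token replaced by a blank) and sets *ADJUST to 6.  */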
10024 static char *
10025 lex_got (enum bfd_reloc_code_real *rel,
10026 int *adjust,
10027 i386_operand_type *types)
10028 {
10029 /* Some of the relocations depend on the size of the field that is
10030 to be relocated. But in our callers i386_immediate and i386_displacement
10031 we don't yet know the operand size (this will be set by insn
10032 matching). Hence we record the word32 relocation here,
10033 and adjust the reloc according to the real size in reloc(). */
10034 static const struct {
10035 const char *str;
10036 int len;
10037 const enum bfd_reloc_code_real rel[2];
10038 const i386_operand_type types64;
10039 bfd_boolean need_GOT_symbol;
10040 } gotrel[] = {
10041 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10042 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
10043 BFD_RELOC_SIZE32 },
10044 OPERAND_TYPE_IMM32_64, FALSE },
10045 #endif
10046 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
10047 BFD_RELOC_X86_64_PLTOFF64 },
10048 OPERAND_TYPE_IMM64, TRUE },
10049 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
10050 BFD_RELOC_X86_64_PLT32 },
10051 OPERAND_TYPE_IMM32_32S_DISP32, FALSE },
10052 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
10053 BFD_RELOC_X86_64_GOTPLT64 },
10054 OPERAND_TYPE_IMM64_DISP64, TRUE },
10055 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
10056 BFD_RELOC_X86_64_GOTOFF64 },
10057 OPERAND_TYPE_IMM64_DISP64, TRUE },
10058 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
10059 BFD_RELOC_X86_64_GOTPCREL },
10060 OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10061 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
10062 BFD_RELOC_X86_64_TLSGD },
10063 OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10064 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
10065 _dummy_first_bfd_reloc_code_real },
10066 OPERAND_TYPE_NONE, TRUE },
10067 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
10068 BFD_RELOC_X86_64_TLSLD },
10069 OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10070 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
10071 BFD_RELOC_X86_64_GOTTPOFF },
10072 OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10073 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
10074 BFD_RELOC_X86_64_TPOFF32 },
10075 OPERAND_TYPE_IMM32_32S_64_DISP32_64, TRUE },
10076 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
10077 _dummy_first_bfd_reloc_code_real },
10078 OPERAND_TYPE_NONE, TRUE },
10079 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
10080 BFD_RELOC_X86_64_DTPOFF32 },
10081 OPERAND_TYPE_IMM32_32S_64_DISP32_64, TRUE },
10082 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
10083 _dummy_first_bfd_reloc_code_real },
10084 OPERAND_TYPE_NONE, TRUE },
10085 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
10086 _dummy_first_bfd_reloc_code_real },
10087 OPERAND_TYPE_NONE, TRUE },
10088 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
10089 BFD_RELOC_X86_64_GOT32 },
10090 OPERAND_TYPE_IMM32_32S_64_DISP32, TRUE },
10091 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
10092 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
10093 OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10094 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
10095 BFD_RELOC_X86_64_TLSDESC_CALL },
10096 OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10097 };
10098 char *cp;
10099 unsigned int j;
10100
10101 #if defined (OBJ_MAYBE_ELF)
10102 if (!IS_ELF)
10103 return NULL;
10104 #endif
10105
10106 for (cp = input_line_pointer; *cp != '@'; cp++)
10107 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
10108 return NULL;
10109
10110 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
10111 {
10112 int len = gotrel[j].len;
10113 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
10114 {
10115 if (gotrel[j].rel[object_64bit] != 0)
10116 {
10117 int first, second;
10118 char *tmpbuf, *past_reloc;
10119
10120 *rel = gotrel[j].rel[object_64bit];
10121
10122 if (types)
10123 {
10124 if (flag_code != CODE_64BIT)
10125 {
10126 types->bitfield.imm32 = 1;
10127 types->bitfield.disp32 = 1;
10128 }
10129 else
10130 *types = gotrel[j].types64;
10131 }
10132
10133 if (gotrel[j].need_GOT_symbol && GOT_symbol == NULL)
10134 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
10135
10136 /* The length of the first part of our input line. */
10137 first = cp - input_line_pointer;
10138
10139 /* The second part goes from after the reloc token until
10140 (and including) an end_of_line char or comma. */
10141 past_reloc = cp + 1 + len;
10142 cp = past_reloc;
10143 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10144 ++cp;
10145 second = cp + 1 - past_reloc;
10146
10147 /* Allocate and copy string. The trailing NUL shouldn't
10148 be necessary, but be safe. */
10149 tmpbuf = XNEWVEC (char, first + second + 2);
10150 memcpy (tmpbuf, input_line_pointer, first);
10151 if (second != 0 && *past_reloc != ' ')
10152 /* Replace the relocation token with ' ', so that
10153 errors like foo@GOTOFF1 will be detected. */
10154 tmpbuf[first++] = ' ';
10155 else
10156 /* Increment length by 1 if the relocation token is
10157 removed. */
10158 len++;
10159 if (adjust)
10160 *adjust = len;
10161 memcpy (tmpbuf + first, past_reloc, second);
10162 tmpbuf[first + second] = '\0';
10163 return tmpbuf;
10164 }
10165
10166 as_bad (_("@%s reloc is not supported with %d-bit output format"),
10167 gotrel[j].str, 1 << (5 + object_64bit));
10168 return NULL;
10169 }
10170 }
10171
10172 /* Might be a symbol version string. Don't as_bad here. */
10173 return NULL;
10174 }
10175 #endif
10176
10177 #ifdef TE_PE
10178 #ifdef lex_got
10179 #undef lex_got
10180 #endif
10181 /* Parse operands of the form
10182 <symbol>@SECREL32+<nnn>
10183
10184 If we find one, set up the correct relocation in RELOC and copy the
10185 input string, minus the `@SECREL32' into a malloc'd buffer for
10186 parsing by the calling routine. Return this buffer, and if ADJUST
10187 is non-null set it to the length of the string we removed from the
10188 input line. Otherwise return NULL.
10189
10190 This function is copied from the ELF version above, adjusted for PE targets. */
10191
10192 static char *
10193 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
10194 int *adjust ATTRIBUTE_UNUSED,
10195 i386_operand_type *types)
10196 {
10197 static const struct
10198 {
10199 const char *str;
10200 int len;
10201 const enum bfd_reloc_code_real rel[2];
10202 const i386_operand_type types64;
10203 }
10204 gotrel[] =
10205 {
10206 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
10207 BFD_RELOC_32_SECREL },
10208 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
10209 };
10210
10211 char *cp;
10212 unsigned j;
10213
10214 for (cp = input_line_pointer; *cp != '@'; cp++)
10215 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
10216 return NULL;
10217
10218 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
10219 {
10220 int len = gotrel[j].len;
10221
10222 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
10223 {
10224 if (gotrel[j].rel[object_64bit] != 0)
10225 {
10226 int first, second;
10227 char *tmpbuf, *past_reloc;
10228
10229 *rel = gotrel[j].rel[object_64bit];
10230 if (adjust)
10231 *adjust = len;
10232
10233 if (types)
10234 {
10235 if (flag_code != CODE_64BIT)
10236 {
10237 types->bitfield.imm32 = 1;
10238 types->bitfield.disp32 = 1;
10239 }
10240 else
10241 *types = gotrel[j].types64;
10242 }
10243
10244 /* The length of the first part of our input line. */
10245 first = cp - input_line_pointer;
10246
10247 /* The second part goes from after the reloc token until
10248 (and including) an end_of_line char or comma. */
10249 past_reloc = cp + 1 + len;
10250 cp = past_reloc;
10251 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10252 ++cp;
10253 second = cp + 1 - past_reloc;
10254
10255 /* Allocate and copy string. The trailing NUL shouldn't
10256 be necessary, but be safe. */
10257 tmpbuf = XNEWVEC (char, first + second + 2);
10258 memcpy (tmpbuf, input_line_pointer, first);
10259 if (second != 0 && *past_reloc != ' ')
10260 /* Replace the relocation token with ' ', so that
10261 errors like foo@SECREL321 will be detected. */
10262 tmpbuf[first++] = ' ';
10263 memcpy (tmpbuf + first, past_reloc, second);
10264 tmpbuf[first + second] = '\0';
10265 return tmpbuf;
10266 }
10267
10268 as_bad (_("@%s reloc is not supported with %d-bit output format"),
10269 gotrel[j].str, 1 << (5 + object_64bit));
10270 return NULL;
10271 }
10272 }
10273
10274 /* Might be a symbol version string. Don't as_bad here. */
10275 return NULL;
10276 }
10277
10278 #endif /* TE_PE */
10279
10280 bfd_reloc_code_real_type
10281 x86_cons (expressionS *exp, int size)
10282 {
10283 bfd_reloc_code_real_type got_reloc = NO_RELOC;
10284
10285 intel_syntax = -intel_syntax;
10286
10287 exp->X_md = 0;
10288 if (size == 4 || (object_64bit && size == 8))
10289 {
10290 /* Handle @GOTOFF and the like in an expression. */
10291 char *save;
10292 char *gotfree_input_line;
10293 int adjust = 0;
10294
10295 save = input_line_pointer;
10296 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
10297 if (gotfree_input_line)
10298 input_line_pointer = gotfree_input_line;
10299
10300 expression (exp);
10301
10302 if (gotfree_input_line)
10303 {
10304 /* expression () has merrily parsed up to the end of line,
10305 or a comma - in the wrong buffer. Transfer how far
10306 input_line_pointer has moved to the right buffer. */
10307 input_line_pointer = (save
10308 + (input_line_pointer - gotfree_input_line)
10309 + adjust);
10310 free (gotfree_input_line);
10311 if (exp->X_op == O_constant
10312 || exp->X_op == O_absent
10313 || exp->X_op == O_illegal
10314 || exp->X_op == O_register
10315 || exp->X_op == O_big)
10316 {
10317 char c = *input_line_pointer;
10318 *input_line_pointer = 0;
10319 as_bad (_("missing or invalid expression `%s'"), save);
10320 *input_line_pointer = c;
10321 }
10322 else if ((got_reloc == BFD_RELOC_386_PLT32
10323 || got_reloc == BFD_RELOC_X86_64_PLT32)
10324 && exp->X_op != O_symbol)
10325 {
10326 char c = *input_line_pointer;
10327 *input_line_pointer = 0;
10328 as_bad (_("invalid PLT expression `%s'"), save);
10329 *input_line_pointer = c;
10330 }
10331 }
10332 }
10333 else
10334 expression (exp);
10335
10336 intel_syntax = -intel_syntax;
10337
10338 if (intel_syntax)
10339 i386_intel_simplify (exp);
10340
10341 return got_reloc;
10342 }
10343
10344 static void
10345 signed_cons (int size)
10346 {
10347 if (flag_code == CODE_64BIT)
10348 cons_sign = 1;
10349 cons (size);
10350 cons_sign = -1;
10351 }
10352
10353 #ifdef TE_PE
10354 static void
10355 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
10356 {
10357 expressionS exp;
10358
10359 do
10360 {
10361 expression (&exp);
10362 if (exp.X_op == O_symbol)
10363 exp.X_op = O_secrel;
10364
10365 emit_expr (&exp, 4);
10366 }
10367 while (*input_line_pointer++ == ',');
10368
10369 input_line_pointer--;
10370 demand_empty_rest_of_line ();
10371 }
10372 #endif
10373
10374 /* Handle Vector operations. */
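/* These are the AVX512-style decorations on an operand, e.g. the
broadcast in "vaddps (%rax){1to16}, %zmm1, %zmm2" or the write
mask plus zeroing in "vmovaps %zmm0, %zmm1{%k1}{z}".  */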
10375
10376 static char *
10377 check_VecOperations (char *op_string, char *op_end)
10378 {
10379 const reg_entry *mask;
10380 const char *saved;
10381 char *end_op;
10382
10383 while (*op_string
10384 && (op_end == NULL || op_string < op_end))
10385 {
10386 saved = op_string;
10387 if (*op_string == '{')
10388 {
10389 op_string++;
10390
10391 /* Check broadcasts. */
10392 if (strncmp (op_string, "1to", 3) == 0)
10393 {
10394 int bcst_type;
10395
10396 if (i.broadcast)
10397 goto duplicated_vec_op;
10398
10399 op_string += 3;
10400 if (*op_string == '8')
10401 bcst_type = 8;
10402 else if (*op_string == '4')
10403 bcst_type = 4;
10404 else if (*op_string == '2')
10405 bcst_type = 2;
10406 else if (*op_string == '1'
10407 && *(op_string+1) == '6')
10408 {
10409 bcst_type = 16;
10410 op_string++;
10411 }
10412 else
10413 {
10414 as_bad (_("Unsupported broadcast: `%s'"), saved);
10415 return NULL;
10416 }
10417 op_string++;
10418
10419 broadcast_op.type = bcst_type;
10420 broadcast_op.operand = this_operand;
10421 broadcast_op.bytes = 0;
10422 i.broadcast = &broadcast_op;
10423 }
10424 /* Check masking operation. */
10425 else if ((mask = parse_register (op_string, &end_op)) != NULL)
10426 {
10427 if (mask == &bad_reg)
10428 return NULL;
10429
10430 /* k0 can't be used for write mask. */
10431 if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
10432 {
10433 as_bad (_("`%s%s' can't be used for write mask"),
10434 register_prefix, mask->reg_name);
10435 return NULL;
10436 }
10437
10438 if (!i.mask)
10439 {
10440 mask_op.mask = mask;
10441 mask_op.zeroing = 0;
10442 mask_op.operand = this_operand;
10443 i.mask = &mask_op;
10444 }
10445 else
10446 {
10447 if (i.mask->mask)
10448 goto duplicated_vec_op;
10449
10450 i.mask->mask = mask;
10451
10452 /* Only "{z}" is allowed here. No need to check
10453 zeroing mask explicitly. */
10454 if (i.mask->operand != this_operand)
10455 {
10456 as_bad (_("invalid write mask `%s'"), saved);
10457 return NULL;
10458 }
10459 }
10460
10461 op_string = end_op;
10462 }
10463 /* Check zeroing-flag for masking operation. */
10464 else if (*op_string == 'z')
10465 {
10466 if (!i.mask)
10467 {
10468 mask_op.mask = NULL;
10469 mask_op.zeroing = 1;
10470 mask_op.operand = this_operand;
10471 i.mask = &mask_op;
10472 }
10473 else
10474 {
10475 if (i.mask->zeroing)
10476 {
10477 duplicated_vec_op:
10478 as_bad (_("duplicated `%s'"), saved);
10479 return NULL;
10480 }
10481
10482 i.mask->zeroing = 1;
10483
10484 /* Only "{%k}" is allowed here. No need to check mask
10485 register explicitly. */
10486 if (i.mask->operand != this_operand)
10487 {
10488 as_bad (_("invalid zeroing-masking `%s'"),
10489 saved);
10490 return NULL;
10491 }
10492 }
10493
10494 op_string++;
10495 }
10496 else
10497 goto unknown_vec_op;
10498
10499 if (*op_string != '}')
10500 {
10501 as_bad (_("missing `}' in `%s'"), saved);
10502 return NULL;
10503 }
10504 op_string++;
10505
10506 /* Strip whitespace since the addition of pseudo prefixes
10507 changed how the scrubber treats '{'. */
10508 if (is_space_char (*op_string))
10509 ++op_string;
10510
10511 continue;
10512 }
10513 unknown_vec_op:
10514 /* We don't know this one. */
10515 as_bad (_("unknown vector operation: `%s'"), saved);
10516 return NULL;
10517 }
10518
10519 if (i.mask && i.mask->zeroing && !i.mask->mask)
10520 {
10521 as_bad (_("zeroing-masking only allowed with write mask"));
10522 return NULL;
10523 }
10524
10525 return op_string;
10526 }
10527
10528 static int
10529 i386_immediate (char *imm_start)
10530 {
10531 char *save_input_line_pointer;
10532 char *gotfree_input_line;
10533 segT exp_seg = 0;
10534 expressionS *exp;
10535 i386_operand_type types;
10536
10537 operand_type_set (&types, ~0);
10538
10539 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
10540 {
10541 as_bad (_("at most %d immediate operands are allowed"),
10542 MAX_IMMEDIATE_OPERANDS);
10543 return 0;
10544 }
10545
10546 exp = &im_expressions[i.imm_operands++];
10547 i.op[this_operand].imms = exp;
10548
10549 if (is_space_char (*imm_start))
10550 ++imm_start;
10551
10552 save_input_line_pointer = input_line_pointer;
10553 input_line_pointer = imm_start;
10554
10555 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10556 if (gotfree_input_line)
10557 input_line_pointer = gotfree_input_line;
10558
10559 exp_seg = expression (exp);
10560
10561 SKIP_WHITESPACE ();
10562
10563 /* Handle vector operations. */
10564 if (*input_line_pointer == '{')
10565 {
10566 input_line_pointer = check_VecOperations (input_line_pointer,
10567 NULL);
10568 if (input_line_pointer == NULL)
10569 return 0;
10570 }
10571
10572 if (*input_line_pointer)
10573 as_bad (_("junk `%s' after expression"), input_line_pointer);
10574
10575 input_line_pointer = save_input_line_pointer;
10576 if (gotfree_input_line)
10577 {
10578 free (gotfree_input_line);
10579
10580 if (exp->X_op == O_constant || exp->X_op == O_register)
10581 exp->X_op = O_illegal;
10582 }
10583
10584 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
10585 }
10586
10587 static int
10588 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10589 i386_operand_type types, const char *imm_start)
10590 {
10591 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
10592 {
10593 if (imm_start)
10594 as_bad (_("missing or invalid immediate expression `%s'"),
10595 imm_start);
10596 return 0;
10597 }
10598 else if (exp->X_op == O_constant)
10599 {
10600 /* Size it properly later. */
10601 i.types[this_operand].bitfield.imm64 = 1;
10602 /* If not 64bit, sign extend val. */
10603 if (flag_code != CODE_64BIT
10604 && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
10605 exp->X_add_number
10606 = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
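/* The XOR/subtract pair sign extends the low 32 bits, e.g.
0xfffffffe -> 0x7ffffffe -> -2.  */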
10607 }
10608 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10609 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
10610 && exp_seg != absolute_section
10611 && exp_seg != text_section
10612 && exp_seg != data_section
10613 && exp_seg != bss_section
10614 && exp_seg != undefined_section
10615 && !bfd_is_com_section (exp_seg))
10616 {
10617 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10618 return 0;
10619 }
10620 #endif
10621 else if (!intel_syntax && exp_seg == reg_section)
10622 {
10623 if (imm_start)
10624 as_bad (_("illegal immediate register operand %s"), imm_start);
10625 return 0;
10626 }
10627 else
10628 {
10629 /* This is an address. The size of the address will be
10630 determined later, depending on destination register,
10631 suffix, or the default for the section. */
10632 i.types[this_operand].bitfield.imm8 = 1;
10633 i.types[this_operand].bitfield.imm16 = 1;
10634 i.types[this_operand].bitfield.imm32 = 1;
10635 i.types[this_operand].bitfield.imm32s = 1;
10636 i.types[this_operand].bitfield.imm64 = 1;
10637 i.types[this_operand] = operand_type_and (i.types[this_operand],
10638 types);
10639 }
10640
10641 return 1;
10642 }
10643
10644 static char *
10645 i386_scale (char *scale)
10646 {
10647 offsetT val;
10648 char *save = input_line_pointer;
10649
10650 input_line_pointer = scale;
10651 val = get_absolute_expression ();
10652
10653 switch (val)
10654 {
10655 case 1:
10656 i.log2_scale_factor = 0;
10657 break;
10658 case 2:
10659 i.log2_scale_factor = 1;
10660 break;
10661 case 4:
10662 i.log2_scale_factor = 2;
10663 break;
10664 case 8:
10665 i.log2_scale_factor = 3;
10666 break;
10667 default:
10668 {
10669 char sep = *input_line_pointer;
10670
10671 *input_line_pointer = '\0';
10672 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
10673 scale);
10674 *input_line_pointer = sep;
10675 input_line_pointer = save;
10676 return NULL;
10677 }
10678 }
10679 if (i.log2_scale_factor != 0 && i.index_reg == 0)
10680 {
10681 as_warn (_("scale factor of %d without an index register"),
10682 1 << i.log2_scale_factor);
10683 i.log2_scale_factor = 0;
10684 }
10685 scale = input_line_pointer;
10686 input_line_pointer = save;
10687 return scale;
10688 }
10689
10690 static int
10691 i386_displacement (char *disp_start, char *disp_end)
10692 {
10693 expressionS *exp;
10694 segT exp_seg = 0;
10695 char *save_input_line_pointer;
10696 char *gotfree_input_line;
10697 int override;
10698 i386_operand_type bigdisp, types = anydisp;
10699 int ret;
10700
10701 if (i.disp_operands == MAX_MEMORY_OPERANDS)
10702 {
10703 as_bad (_("at most %d displacement operands are allowed"),
10704 MAX_MEMORY_OPERANDS);
10705 return 0;
10706 }
10707
10708 operand_type_set (&bigdisp, 0);
10709 if (i.jumpabsolute
10710 || i.types[this_operand].bitfield.baseindex
10711 || (current_templates->start->opcode_modifier.jump != JUMP
10712 && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
10713 {
10714 i386_addressing_mode ();
10715 override = (i.prefix[ADDR_PREFIX] != 0);
10716 if (flag_code == CODE_64BIT)
10717 {
10718 if (!override)
10719 {
10720 bigdisp.bitfield.disp32s = 1;
10721 bigdisp.bitfield.disp64 = 1;
10722 }
10723 else
10724 bigdisp.bitfield.disp32 = 1;
10725 }
10726 else if ((flag_code == CODE_16BIT) ^ override)
10727 bigdisp.bitfield.disp16 = 1;
10728 else
10729 bigdisp.bitfield.disp32 = 1;
10730 }
10731 else
10732 {
10733 /* For PC-relative branches, the width of the displacement may be
10734 dependent upon data size, but is never dependent upon address size.
10735 Also make sure to not unintentionally match against a non-PC-relative
10736 branch template. */
10737 static templates aux_templates;
10738 const insn_template *t = current_templates->start;
10739 bfd_boolean has_intel64 = FALSE;
10740
10741 aux_templates.start = t;
10742 while (++t < current_templates->end)
10743 {
10744 if (t->opcode_modifier.jump
10745 != current_templates->start->opcode_modifier.jump)
10746 break;
10747 if ((t->opcode_modifier.isa64 >= INTEL64))
10748 has_intel64 = TRUE;
10749 }
10750 if (t < current_templates->end)
10751 {
10752 aux_templates.end = t;
10753 current_templates = &aux_templates;
10754 }
10755
10756 override = (i.prefix[DATA_PREFIX] != 0);
10757 if (flag_code == CODE_64BIT)
10758 {
10759 if ((override || i.suffix == WORD_MNEM_SUFFIX)
10760 && (!intel64 || !has_intel64))
10761 bigdisp.bitfield.disp16 = 1;
10762 else
10763 bigdisp.bitfield.disp32s = 1;
10764 }
10765 else
10766 {
10767 if (!override)
10768 override = (i.suffix == (flag_code != CODE_16BIT
10769 ? WORD_MNEM_SUFFIX
10770 : LONG_MNEM_SUFFIX));
10771 bigdisp.bitfield.disp32 = 1;
10772 if ((flag_code == CODE_16BIT) ^ override)
10773 {
10774 bigdisp.bitfield.disp32 = 0;
10775 bigdisp.bitfield.disp16 = 1;
10776 }
10777 }
10778 }
10779 i.types[this_operand] = operand_type_or (i.types[this_operand],
10780 bigdisp);
10781
10782 exp = &disp_expressions[i.disp_operands];
10783 i.op[this_operand].disps = exp;
10784 i.disp_operands++;
10785 save_input_line_pointer = input_line_pointer;
10786 input_line_pointer = disp_start;
10787 END_STRING_AND_SAVE (disp_end);
10788
10789 #ifndef GCC_ASM_O_HACK
10790 #define GCC_ASM_O_HACK 0
10791 #endif
10792 #if GCC_ASM_O_HACK
10793 END_STRING_AND_SAVE (disp_end + 1);
10794 if (i.types[this_operand].bitfield.baseIndex
10795 && displacement_string_end[-1] == '+')
10796 {
10797 /* This hack is to avoid a warning when using the "o"
10798 constraint within gcc asm statements.
10799 For instance:
10800
10801 #define _set_tssldt_desc(n,addr,limit,type) \
10802 __asm__ __volatile__ ( \
10803 "movw %w2,%0\n\t" \
10804 "movw %w1,2+%0\n\t" \
10805 "rorl $16,%1\n\t" \
10806 "movb %b1,4+%0\n\t" \
10807 "movb %4,5+%0\n\t" \
10808 "movb $0,6+%0\n\t" \
10809 "movb %h1,7+%0\n\t" \
10810 "rorl $16,%1" \
10811 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
10812
10813 This works great except that the output assembler ends
10814 up looking a bit weird if it turns out that there is
10815 no offset. You end up producing code that looks like:
10816
10817 #APP
10818 movw $235,(%eax)
10819 movw %dx,2+(%eax)
10820 rorl $16,%edx
10821 movb %dl,4+(%eax)
10822 movb $137,5+(%eax)
10823 movb $0,6+(%eax)
10824 movb %dh,7+(%eax)
10825 rorl $16,%edx
10826 #NO_APP
10827
10828 So here we provide the missing zero. */
10829
10830 *displacement_string_end = '0';
10831 }
10832 #endif
10833 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10834 if (gotfree_input_line)
10835 input_line_pointer = gotfree_input_line;
10836
10837 exp_seg = expression (exp);
10838
10839 SKIP_WHITESPACE ();
10840 if (*input_line_pointer)
10841 as_bad (_("junk `%s' after expression"), input_line_pointer);
10842 #if GCC_ASM_O_HACK
10843 RESTORE_END_STRING (disp_end + 1);
10844 #endif
10845 input_line_pointer = save_input_line_pointer;
10846 if (gotfree_input_line)
10847 {
10848 free (gotfree_input_line);
10849
10850 if (exp->X_op == O_constant || exp->X_op == O_register)
10851 exp->X_op = O_illegal;
10852 }
10853
10854 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
10855
10856 RESTORE_END_STRING (disp_end);
10857
10858 return ret;
10859 }
10860
10861 static int
10862 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10863 i386_operand_type types, const char *disp_start)
10864 {
10865 i386_operand_type bigdisp;
10866 int ret = 1;
10867
10868 /* We do this to make sure that the section symbol is in
10869 the symbol table. We will ultimately change the relocation
10870 to be relative to the beginning of the section. */
10871 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
10872 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
10873 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10874 {
10875 if (exp->X_op != O_symbol)
10876 goto inv_disp;
10877
10878 if (S_IS_LOCAL (exp->X_add_symbol)
10879 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
10880 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
10881 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
10882 exp->X_op = O_subtract;
10883 exp->X_op_symbol = GOT_symbol;
10884 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
10885 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
10886 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10887 i.reloc[this_operand] = BFD_RELOC_64;
10888 else
10889 i.reloc[this_operand] = BFD_RELOC_32;
10890 }
10891
10892 else if (exp->X_op == O_absent
10893 || exp->X_op == O_illegal
10894 || exp->X_op == O_big)
10895 {
10896 inv_disp:
10897 as_bad (_("missing or invalid displacement expression `%s'"),
10898 disp_start);
10899 ret = 0;
10900 }
10901
10902 else if (flag_code == CODE_64BIT
10903 && !i.prefix[ADDR_PREFIX]
10904 && exp->X_op == O_constant)
10905 {
10906 /* Since displacement is sign extended to 64bit, don't allow
10907 disp32 and turn off disp32s if they are out of range. */
10908 i.types[this_operand].bitfield.disp32 = 0;
10909 if (!fits_in_signed_long (exp->X_add_number))
10910 {
10911 i.types[this_operand].bitfield.disp32s = 0;
10912 if (i.types[this_operand].bitfield.baseindex)
10913 {
10914 as_bad (_("0x%lx out range of signed 32bit displacement"),
10915 (long) exp->X_add_number);
10916 ret = 0;
10917 }
10918 }
10919 }
10920
10921 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10922 else if (exp->X_op != O_constant
10923 && OUTPUT_FLAVOR == bfd_target_aout_flavour
10924 && exp_seg != absolute_section
10925 && exp_seg != text_section
10926 && exp_seg != data_section
10927 && exp_seg != bss_section
10928 && exp_seg != undefined_section
10929 && !bfd_is_com_section (exp_seg))
10930 {
10931 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10932 ret = 0;
10933 }
10934 #endif
10935
10936 if (current_templates->start->opcode_modifier.jump == JUMP_BYTE
10937 /* Constants get taken care of by optimize_disp(). */
10938 && exp->X_op != O_constant)
10939 i.types[this_operand].bitfield.disp8 = 1;
10940
10941 /* Check if this is a displacement only operand. */
10942 bigdisp = i.types[this_operand];
10943 bigdisp.bitfield.disp8 = 0;
10944 bigdisp.bitfield.disp16 = 0;
10945 bigdisp.bitfield.disp32 = 0;
10946 bigdisp.bitfield.disp32s = 0;
10947 bigdisp.bitfield.disp64 = 0;
10948 if (operand_type_all_zero (&bigdisp))
10949 i.types[this_operand] = operand_type_and (i.types[this_operand],
10950 types);
10951
10952 return ret;
10953 }
10954
10955 /* Return the active addressing mode, taking address override and
10956 registers forming the address into consideration. Update the
10957 address override prefix if necessary. */
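/* E.g. "movw (%bp,%si), %ax" assembled in 32-bit mode yields
CODE_16BIT here, and a 0x67 address size prefix is emitted.  */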
10958
10959 static enum flag_code
10960 i386_addressing_mode (void)
10961 {
10962 enum flag_code addr_mode;
10963
10964 if (i.prefix[ADDR_PREFIX])
10965 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
10966 else if (flag_code == CODE_16BIT
10967 && current_templates->start->cpu_flags.bitfield.cpumpx
10968 /* Avoid replacing the "16-bit addressing not allowed" diagnostic
10969 from md_assemble() by "is not a valid base/index expression"
10970 when there is a base and/or index. */
10971 && !i.types[this_operand].bitfield.baseindex)
10972 {
10973 /* MPX insn memory operands with neither base nor index must be forced
10974 to use 32-bit addressing in 16-bit mode. */
10975 addr_mode = CODE_32BIT;
10976 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10977 ++i.prefixes;
10978 gas_assert (!i.types[this_operand].bitfield.disp16);
10979 gas_assert (!i.types[this_operand].bitfield.disp32);
10980 }
10981 else
10982 {
10983 addr_mode = flag_code;
10984
10985 #if INFER_ADDR_PREFIX
10986 if (i.mem_operands == 0)
10987 {
10988 /* Infer address prefix from the first memory operand. */
10989 const reg_entry *addr_reg = i.base_reg;
10990
10991 if (addr_reg == NULL)
10992 addr_reg = i.index_reg;
10993
10994 if (addr_reg)
10995 {
10996 if (addr_reg->reg_type.bitfield.dword)
10997 addr_mode = CODE_32BIT;
10998 else if (flag_code != CODE_64BIT
10999 && addr_reg->reg_type.bitfield.word)
11000 addr_mode = CODE_16BIT;
11001
11002 if (addr_mode != flag_code)
11003 {
11004 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
11005 i.prefixes += 1;
11006 /* Change the size of any displacement too. At most one
11007 of Disp16 or Disp32 is set.
11008 FIXME. There doesn't seem to be any real need for
11009 separate Disp16 and Disp32 flags. The same goes for
11010 Imm16 and Imm32. Removing them would probably clean
11011 up the code quite a lot. */
11012 if (flag_code != CODE_64BIT
11013 && (i.types[this_operand].bitfield.disp16
11014 || i.types[this_operand].bitfield.disp32))
11015 i.types[this_operand]
11016 = operand_type_xor (i.types[this_operand], disp16_32);
11017 }
11018 }
11019 }
11020 #endif
11021 }
11022
11023 return addr_mode;
11024 }
11025
11026 /* Make sure the memory operand we've been dealt is valid.
11027 Return 1 on success, 0 on a failure. */
11028
11029 static int
11030 i386_index_check (const char *operand_string)
11031 {
11032 const char *kind = "base/index";
11033 enum flag_code addr_mode = i386_addressing_mode ();
11034
11035 if (current_templates->start->opcode_modifier.isstring
11036 && !current_templates->start->cpu_flags.bitfield.cpupadlock
11037 && (current_templates->end[-1].opcode_modifier.isstring
11038 || i.mem_operands))
11039 {
11040 /* Memory operands of string insns are special in that they only allow
11041 a single register (rDI, rSI, or rBX) as their memory address. */
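/* E.g. "movsb" implicitly uses (%esi) and (%edi) in 32-bit mode,
"stosb" only (%edi), and "xlatb" (%ebx); any other base/index
combination is diagnosed below.  */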
11042 const reg_entry *expected_reg;
11043 static const char *di_si[][2] =
11044 {
11045 { "esi", "edi" },
11046 { "si", "di" },
11047 { "rsi", "rdi" }
11048 };
11049 static const char *bx[] = { "ebx", "bx", "rbx" };
11050
11051 kind = "string address";
11052
11053 if (current_templates->start->opcode_modifier.prefixok == PrefixRep)
11054 {
11055 int es_op = current_templates->end[-1].opcode_modifier.isstring
11056 - IS_STRING_ES_OP0;
11057 int op = 0;
11058
11059 if (!current_templates->end[-1].operand_types[0].bitfield.baseindex
11060 || ((!i.mem_operands != !intel_syntax)
11061 && current_templates->end[-1].operand_types[1]
11062 .bitfield.baseindex))
11063 op = 1;
11064 expected_reg
11065 = (const reg_entry *) str_hash_find (reg_hash,
11066 di_si[addr_mode][op == es_op]);
11067 }
11068 else
11069 expected_reg
11070 = (const reg_entry *)str_hash_find (reg_hash, bx[addr_mode]);
11071
11072 if (i.base_reg != expected_reg
11073 || i.index_reg
11074 || operand_type_check (i.types[this_operand], disp))
11075 {
11076 /* The second memory operand must have the same size as
11077 the first one. */
11078 if (i.mem_operands
11079 && i.base_reg
11080 && !((addr_mode == CODE_64BIT
11081 && i.base_reg->reg_type.bitfield.qword)
11082 || (addr_mode == CODE_32BIT
11083 ? i.base_reg->reg_type.bitfield.dword
11084 : i.base_reg->reg_type.bitfield.word)))
11085 goto bad_address;
11086
11087 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
11088 operand_string,
11089 intel_syntax ? '[' : '(',
11090 register_prefix,
11091 expected_reg->reg_name,
11092 intel_syntax ? ']' : ')');
11093 return 1;
11094 }
11095 else
11096 return 1;
11097
11098 bad_address:
11099 as_bad (_("`%s' is not a valid %s expression"),
11100 operand_string, kind);
11101 return 0;
11102 }
11103 else
11104 {
11105 if (addr_mode != CODE_16BIT)
11106 {
11107 /* 32-bit/64-bit checks. */
11108 if (i.disp_encoding == disp_encoding_16bit)
11109 {
11110 bad_disp:
11111 as_bad (_("invalid `%s' prefix"),
11112 addr_mode == CODE_16BIT ? "{disp32}" : "{disp16}");
11113 return 0;
11114 }
11115
11116 if ((i.base_reg
11117 && ((addr_mode == CODE_64BIT
11118 ? !i.base_reg->reg_type.bitfield.qword
11119 : !i.base_reg->reg_type.bitfield.dword)
11120 || (i.index_reg && i.base_reg->reg_num == RegIP)
11121 || i.base_reg->reg_num == RegIZ))
11122 || (i.index_reg
11123 && !i.index_reg->reg_type.bitfield.xmmword
11124 && !i.index_reg->reg_type.bitfield.ymmword
11125 && !i.index_reg->reg_type.bitfield.zmmword
11126 && ((addr_mode == CODE_64BIT
11127 ? !i.index_reg->reg_type.bitfield.qword
11128 : !i.index_reg->reg_type.bitfield.dword)
11129 || !i.index_reg->reg_type.bitfield.baseindex)))
11130 goto bad_address;
11131
11132 /* bndmk, bndldx, bndstx and mandatory non-vector SIB have special restrictions. */
11133 if (current_templates->start->base_opcode == 0xf30f1b
11134 || (current_templates->start->base_opcode & ~1) == 0x0f1a
11135 || current_templates->start->opcode_modifier.sib == SIBMEM)
11136 {
11137 /* They cannot use RIP-relative addressing. */
11138 if (i.base_reg && i.base_reg->reg_num == RegIP)
11139 {
11140 as_bad (_("`%s' cannot be used here"), operand_string);
11141 return 0;
11142 }
11143
11144 /* bndldx and bndstx ignore their scale factor. */
11145 if ((current_templates->start->base_opcode & ~1) == 0x0f1a
11146 && i.log2_scale_factor)
11147 as_warn (_("register scaling is being ignored here"));
11148 }
11149 }
11150 else
11151 {
11152 /* 16-bit checks. */
11153 if (i.disp_encoding == disp_encoding_32bit)
11154 goto bad_disp;
11155
11156 if ((i.base_reg
11157 && (!i.base_reg->reg_type.bitfield.word
11158 || !i.base_reg->reg_type.bitfield.baseindex))
11159 || (i.index_reg
11160 && (!i.index_reg->reg_type.bitfield.word
11161 || !i.index_reg->reg_type.bitfield.baseindex
11162 || !(i.base_reg
11163 && i.base_reg->reg_num < 6
11164 && i.index_reg->reg_num >= 6
11165 && i.log2_scale_factor == 0))))
11166 goto bad_address;
11167 }
11168 }
11169 return 1;
11170 }
11171
11172 /* Handle vector immediates. */
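/* I.e. the embedded-rounding and suppress-all-exceptions pseudo
operands of AVX512, e.g. "{rn-sae}" in
"vaddps {rn-sae}, %zmm1, %zmm2, %zmm3".  */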
11173
11174 static int
11175 RC_SAE_immediate (const char *imm_start)
11176 {
11177 unsigned int match_found, j;
11178 const char *pstr = imm_start;
11179 expressionS *exp;
11180
11181 if (*pstr != '{')
11182 return 0;
11183
11184 pstr++;
11185 match_found = 0;
11186 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
11187 {
11188 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
11189 {
11190 if (!i.rounding)
11191 {
11192 rc_op.type = RC_NamesTable[j].type;
11193 rc_op.operand = this_operand;
11194 i.rounding = &rc_op;
11195 }
11196 else
11197 {
11198 as_bad (_("duplicated `%s'"), imm_start);
11199 return 0;
11200 }
11201 pstr += RC_NamesTable[j].len;
11202 match_found = 1;
11203 break;
11204 }
11205 }
11206 if (!match_found)
11207 return 0;
11208
11209 if (*pstr++ != '}')
11210 {
11211 as_bad (_("Missing '}': '%s'"), imm_start);
11212 return 0;
11213 }
11214 /* RC/SAE immediate string should contain nothing more. */
11215 if (*pstr != 0)
11216 {
11217 as_bad (_("Junk after '}': '%s'"), imm_start);
11218 return 0;
11219 }
11220
11221 exp = &im_expressions[i.imm_operands++];
11222 i.op[this_operand].imms = exp;
11223
11224 exp->X_op = O_constant;
11225 exp->X_add_number = 0;
11226 exp->X_add_symbol = (symbolS *) 0;
11227 exp->X_op_symbol = (symbolS *) 0;
11228
11229 i.types[this_operand].bitfield.imm8 = 1;
11230 return 1;
11231 }
11232
11233 /* Only string instructions can have a second memory operand, so
11234 reduce current_templates to just those if it contains any. */
11235 static int
11236 maybe_adjust_templates (void)
11237 {
11238 const insn_template *t;
11239
11240 gas_assert (i.mem_operands == 1);
11241
11242 for (t = current_templates->start; t < current_templates->end; ++t)
11243 if (t->opcode_modifier.isstring)
11244 break;
11245
11246 if (t < current_templates->end)
11247 {
11248 static templates aux_templates;
11249 bfd_boolean recheck;
11250
11251 aux_templates.start = t;
11252 for (; t < current_templates->end; ++t)
11253 if (!t->opcode_modifier.isstring)
11254 break;
11255 aux_templates.end = t;
11256
11257 /* Determine whether to re-check the first memory operand. */
11258 recheck = (aux_templates.start != current_templates->start
11259 || t != current_templates->end);
11260
11261 current_templates = &aux_templates;
11262
11263 if (recheck)
11264 {
11265 i.mem_operands = 0;
11266 if (i.memop1_string != NULL
11267 && i386_index_check (i.memop1_string) == 0)
11268 return 0;
11269 i.mem_operands = 1;
11270 }
11271 }
11272
11273 return 1;
11274 }
11275
11276 /* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
11277 on error. */
11278
11279 static int
11280 i386_att_operand (char *operand_string)
11281 {
11282 const reg_entry *r;
11283 char *end_op;
11284 char *op_string = operand_string;
11285
11286 if (is_space_char (*op_string))
11287 ++op_string;
11288
11289 /* We check for an absolute prefix (differentiating,
11290 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'). */
11291 if (*op_string == ABSOLUTE_PREFIX)
11292 {
11293 ++op_string;
11294 if (is_space_char (*op_string))
11295 ++op_string;
11296 i.jumpabsolute = TRUE;
11297 }
11298
11299 /* Check if operand is a register. */
11300 if ((r = parse_register (op_string, &end_op)) != NULL)
11301 {
11302 i386_operand_type temp;
11303
11304 if (r == &bad_reg)
11305 return 0;
11306
11307 /* Check for a segment override by searching for ':' after a
11308 segment register. */
11309 op_string = end_op;
11310 if (is_space_char (*op_string))
11311 ++op_string;
11312 if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
11313 {
11314 switch (r->reg_num)
11315 {
11316 case 0:
11317 i.seg[i.mem_operands] = &es;
11318 break;
11319 case 1:
11320 i.seg[i.mem_operands] = &cs;
11321 break;
11322 case 2:
11323 i.seg[i.mem_operands] = &ss;
11324 break;
11325 case 3:
11326 i.seg[i.mem_operands] = &ds;
11327 break;
11328 case 4:
11329 i.seg[i.mem_operands] = &fs;
11330 break;
11331 case 5:
11332 i.seg[i.mem_operands] = &gs;
11333 break;
11334 }
11335
11336 /* Skip the ':' and whitespace. */
11337 ++op_string;
11338 if (is_space_char (*op_string))
11339 ++op_string;
11340
11341 if (!is_digit_char (*op_string)
11342 && !is_identifier_char (*op_string)
11343 && *op_string != '('
11344 && *op_string != ABSOLUTE_PREFIX)
11345 {
11346 as_bad (_("bad memory operand `%s'"), op_string);
11347 return 0;
11348 }
11349 /* Handle case of %es:*foo. */
11350 if (*op_string == ABSOLUTE_PREFIX)
11351 {
11352 ++op_string;
11353 if (is_space_char (*op_string))
11354 ++op_string;
11355 i.jumpabsolute = TRUE;
11356 }
11357 goto do_memory_reference;
11358 }
11359
11360 /* Handle vector operations. */
11361 if (*op_string == '{')
11362 {
11363 op_string = check_VecOperations (op_string, NULL);
11364 if (op_string == NULL)
11365 return 0;
11366 }
11367
11368 if (*op_string)
11369 {
11370 as_bad (_("junk `%s' after register"), op_string);
11371 return 0;
11372 }
11373 temp = r->reg_type;
11374 temp.bitfield.baseindex = 0;
11375 i.types[this_operand] = operand_type_or (i.types[this_operand],
11376 temp);
11377 i.types[this_operand].bitfield.unspecified = 0;
11378 i.op[this_operand].regs = r;
11379 i.reg_operands++;
11380 }
11381 else if (*op_string == REGISTER_PREFIX)
11382 {
11383 as_bad (_("bad register name `%s'"), op_string);
11384 return 0;
11385 }
11386 else if (*op_string == IMMEDIATE_PREFIX)
11387 {
11388 ++op_string;
11389 if (i.jumpabsolute)
11390 {
11391 as_bad (_("immediate operand illegal with absolute jump"));
11392 return 0;
11393 }
11394 if (!i386_immediate (op_string))
11395 return 0;
11396 }
11397 else if (RC_SAE_immediate (operand_string))
11398 {
11399 /* If it is a RC or SAE immediate, do nothing. */
11400 ;
11401 }
11402 else if (is_digit_char (*op_string)
11403 || is_identifier_char (*op_string)
11404 || *op_string == '"'
11405 || *op_string == '(')
11406 {
11407 /* This is a memory reference of some sort. */
11408 char *base_string;
11409
11410 /* Start and end of displacement string expression (if found). */
11411 char *displacement_string_start;
11412 char *displacement_string_end;
11413 char *vop_start;
11414
11415 do_memory_reference:
11416 if (i.mem_operands == 1 && !maybe_adjust_templates ())
11417 return 0;
11418 if ((i.mem_operands == 1
11419 && !current_templates->start->opcode_modifier.isstring)
11420 || i.mem_operands == 2)
11421 {
11422 as_bad (_("too many memory references for `%s'"),
11423 current_templates->start->name);
11424 return 0;
11425 }
11426
11427 /* Check for base index form. We detect the base index form by
11428 looking for an ')' at the end of the operand, searching
11429 for the '(' matching it, and finding a REGISTER_PREFIX or ','
11430 after the '('. */
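/* E.g. "-4(%ebp,%esi,2)" is split here into the displacement "-4",
base register %ebp, index register %esi and scale factor 2.  */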
11431 base_string = op_string + strlen (op_string);
11432
11433 /* Handle vector operations. */
11434 vop_start = strchr (op_string, '{');
11435 if (vop_start && vop_start < base_string)
11436 {
11437 if (check_VecOperations (vop_start, base_string) == NULL)
11438 return 0;
11439 base_string = vop_start;
11440 }
11441
11442 --base_string;
11443 if (is_space_char (*base_string))
11444 --base_string;
11445
11446 /* If we only have a displacement, set up for it to be parsed later. */
11447 displacement_string_start = op_string;
11448 displacement_string_end = base_string + 1;
11449
11450 if (*base_string == ')')
11451 {
11452 char *temp_string;
11453 unsigned int parens_balanced = 1;
11454 /* We've already checked that the number of left & right ()'s is
11455 equal, so this loop will not be infinite. */
11456 do
11457 {
11458 base_string--;
11459 if (*base_string == ')')
11460 parens_balanced++;
11461 if (*base_string == '(')
11462 parens_balanced--;
11463 }
11464 while (parens_balanced);
11465
11466 temp_string = base_string;
11467
11468 /* Skip past '(' and whitespace. */
11469 ++base_string;
11470 if (is_space_char (*base_string))
11471 ++base_string;
11472
11473 if (*base_string == ','
11474 || ((i.base_reg = parse_register (base_string, &end_op))
11475 != NULL))
11476 {
11477 displacement_string_end = temp_string;
11478
11479 i.types[this_operand].bitfield.baseindex = 1;
11480
11481 if (i.base_reg)
11482 {
11483 if (i.base_reg == &bad_reg)
11484 return 0;
11485 base_string = end_op;
11486 if (is_space_char (*base_string))
11487 ++base_string;
11488 }
11489
11490 /* There may be an index reg or scale factor here. */
11491 if (*base_string == ',')
11492 {
11493 ++base_string;
11494 if (is_space_char (*base_string))
11495 ++base_string;
11496
11497 if ((i.index_reg = parse_register (base_string, &end_op))
11498 != NULL)
11499 {
11500 if (i.index_reg == &bad_reg)
11501 return 0;
11502 base_string = end_op;
11503 if (is_space_char (*base_string))
11504 ++base_string;
11505 if (*base_string == ',')
11506 {
11507 ++base_string;
11508 if (is_space_char (*base_string))
11509 ++base_string;
11510 }
11511 else if (*base_string != ')')
11512 {
11513 as_bad (_("expecting `,' or `)' "
11514 "after index register in `%s'"),
11515 operand_string);
11516 return 0;
11517 }
11518 }
11519 else if (*base_string == REGISTER_PREFIX)
11520 {
11521 end_op = strchr (base_string, ',');
11522 if (end_op)
11523 *end_op = '\0';
11524 as_bad (_("bad register name `%s'"), base_string);
11525 return 0;
11526 }
11527
11528 /* Check for scale factor. */
11529 if (*base_string != ')')
11530 {
11531 char *end_scale = i386_scale (base_string);
11532
11533 if (!end_scale)
11534 return 0;
11535
11536 base_string = end_scale;
11537 if (is_space_char (*base_string))
11538 ++base_string;
11539 if (*base_string != ')')
11540 {
11541 as_bad (_("expecting `)' "
11542 "after scale factor in `%s'"),
11543 operand_string);
11544 return 0;
11545 }
11546 }
11547 else if (!i.index_reg)
11548 {
11549 as_bad (_("expecting index register or scale factor "
11550 "after `,'; got '%c'"),
11551 *base_string);
11552 return 0;
11553 }
11554 }
11555 else if (*base_string != ')')
11556 {
11557 as_bad (_("expecting `,' or `)' "
11558 "after base register in `%s'"),
11559 operand_string);
11560 return 0;
11561 }
11562 }
11563 else if (*base_string == REGISTER_PREFIX)
11564 {
11565 end_op = strchr (base_string, ',');
11566 if (end_op)
11567 *end_op = '\0';
11568 as_bad (_("bad register name `%s'"), base_string);
11569 return 0;
11570 }
11571 }
11572
11573 /* If there's an expression beginning the operand, parse it,
11574 assuming displacement_string_start and
11575 displacement_string_end are meaningful. */
11576 if (displacement_string_start != displacement_string_end)
11577 {
11578 if (!i386_displacement (displacement_string_start,
11579 displacement_string_end))
11580 return 0;
11581 }
11582
11583 /* Special case for (%dx) while doing input/output op. */
11584 if (i.base_reg
11585 && i.base_reg->reg_type.bitfield.instance == RegD
11586 && i.base_reg->reg_type.bitfield.word
11587 && i.index_reg == 0
11588 && i.log2_scale_factor == 0
11589 && i.seg[i.mem_operands] == 0
11590 && !operand_type_check (i.types[this_operand], disp))
11591 {
11592 i.types[this_operand] = i.base_reg->reg_type;
11593 return 1;
11594 }
11595
11596 if (i386_index_check (operand_string) == 0)
11597 return 0;
11598 i.flags[this_operand] |= Operand_Mem;
11599 if (i.mem_operands == 0)
11600 i.memop1_string = xstrdup (operand_string);
11601 i.mem_operands++;
11602 }
11603 else
11604 {
11605 /* It's not a memory operand; argh! */
11606 as_bad (_("invalid char %s beginning operand %d `%s'"),
11607 output_invalid (*op_string),
11608 this_operand + 1,
11609 op_string);
11610 return 0;
11611 }
11612 return 1; /* Normal return. */
11613 }
11614 \f
11615 /* Calculate the maximum variable size (i.e., excluding fr_fix)
11616 that an rs_machine_dependent frag may reach. */
11617
11618 unsigned int
11619 i386_frag_max_var (fragS *frag)
11620 {
11621 /* The only relaxable frags are for jumps.
11622 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
11623 gas_assert (frag->fr_type == rs_machine_dependent);
11624 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
11625 }
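/* Editorial illustration, not from the original source: the variable
   part is everything beyond fr_fix.  An unconditional `jmp' relaxes
   from `EB cb' to `E9 cd', still one opcode byte, so at most the 4
   displacement bytes vary.  A conditional `jcc' relaxes from `7N cb'
   to `0F 8N cd', gaining an extra opcode byte on top of the 4-byte
   displacement, hence 5.  */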
11626
11627 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11628 static int
11629 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
11630 {
11631 /* STT_GNU_IFUNC symbol must go through PLT. */
11632 if ((symbol_get_bfdsym (fr_symbol)->flags
11633 & BSF_GNU_INDIRECT_FUNCTION) != 0)
11634 return 0;
11635
11636 if (!S_IS_EXTERNAL (fr_symbol))
11637 /* Symbol may be weak or local. */
11638 return !S_IS_WEAK (fr_symbol);
11639
11640 /* Global symbols with non-default visibility can't be preempted. */
11641 if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
11642 return 1;
11643
11644 if (fr_var != NO_RELOC)
11645 switch ((enum bfd_reloc_code_real) fr_var)
11646 {
11647 case BFD_RELOC_386_PLT32:
11648 case BFD_RELOC_X86_64_PLT32:
11649 /* Symbol with PLT relocation may be preempted. */
11650 return 0;
11651 default:
11652 abort ();
11653 }
11654
11655 /* Global symbols with default visibility in a shared library may be
11656 preempted by another definition. */
11657 return !shared;
11658 }
11659 #endif
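/* Editorial examples, not from the original source: a jump to a
   non-weak local label in the same section returns 1 (safe to
   relax), while `jmp foo@PLT' carries BFD_RELOC_386_PLT32 or
   BFD_RELOC_X86_64_PLT32 and returns 0, since a PLT-bound symbol
   may be preempted by another definition at runtime.  */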
11660
11661 /* Table 3-2. Macro-Fusible Instructions in Haswell Microarchitecture
11662 Note: this also works for Skylake and Cascadelake.
11663 ---------------------------------------------------------------------
11664 | JCC | ADD/SUB/CMP | INC/DEC | TEST/AND |
11665 | ------ | ----------- | ------- | -------- |
11666 | Jo | N | N | Y |
11667 | Jno | N | N | Y |
11668 | Jc/Jb | Y | N | Y |
11669 | Jae/Jnb | Y | N | Y |
11670 | Je/Jz | Y | Y | Y |
11671 | Jne/Jnz | Y | Y | Y |
11672 | Jna/Jbe | Y | N | Y |
11673 | Ja/Jnbe | Y | N | Y |
11674 | Js | N | N | Y |
11675 | Jns | N | N | Y |
11676 | Jp/Jpe | N | N | Y |
11677 | Jnp/Jpo | N | N | Y |
11678 | Jl/Jnge | Y | Y | Y |
11679 | Jge/Jnl | Y | Y | Y |
11680 | Jle/Jng | Y | Y | Y |
11681 | Jg/Jnle | Y | Y | Y |
11682 --------------------------------------------------------------------- */
11683 static int
11684 i386_macro_fusible_p (enum mf_cmp_kind mf_cmp, enum mf_jcc_kind mf_jcc)
11685 {
11686 if (mf_cmp == mf_cmp_alu_cmp)
11687 return ((mf_jcc >= mf_jcc_jc && mf_jcc <= mf_jcc_jna)
11688 || mf_jcc == mf_jcc_jl || mf_jcc == mf_jcc_jle);
11689 if (mf_cmp == mf_cmp_incdec)
11690 return (mf_jcc == mf_jcc_je || mf_jcc == mf_jcc_jl
11691 || mf_jcc == mf_jcc_jle);
11692 if (mf_cmp == mf_cmp_test_and)
11693 return 1;
11694 return 0;
11695 }
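/* Editorial sketch, not part of the original file: a minimal
   self-check of i386_macro_fusible_p against Table 3-2 above, using
   the mf_* enumerators from tc-i386.h.  The guard macro
   I386_MACRO_FUSION_SELFTEST is hypothetical.  */
#ifdef I386_MACRO_FUSION_SELFTEST
static void
i386_macro_fusion_selftest (void)
{
  /* TEST/AND fuses with every Jcc (last column is all Y).  */
  gas_assert (i386_macro_fusible_p (mf_cmp_test_and, mf_jcc_jo));
  /* INC/DEC fuses only with Je/Jne and the signed compares.  */
  gas_assert (!i386_macro_fusible_p (mf_cmp_incdec, mf_jcc_jc));
  gas_assert (i386_macro_fusible_p (mf_cmp_incdec, mf_jcc_je));
  /* ADD/SUB/CMP does not fuse with Jo/Jno.  */
  gas_assert (!i386_macro_fusible_p (mf_cmp_alu_cmp, mf_jcc_jo));
}
#endif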
11696
11697 /* Return the next non-empty frag. */
11698
11699 static fragS *
11700 i386_next_non_empty_frag (fragS *fragP)
11701 {
11702 /* There may be a frag with a ".fill 0" when there is no room in
11703 the current frag for frag_grow in output_insn. */
11704 for (fragP = fragP->fr_next;
11705 (fragP != NULL
11706 && fragP->fr_type == rs_fill
11707 && fragP->fr_fix == 0);
11708 fragP = fragP->fr_next)
11709 ;
11710 return fragP;
11711 }
11712
11713 /* Return the next jcc frag after BRANCH_PADDING. */
11714
11715 static fragS *
11716 i386_next_fusible_jcc_frag (fragS *maybe_cmp_fragP, fragS *pad_fragP)
11717 {
11718 fragS *branch_fragP;
11719 if (!pad_fragP)
11720 return NULL;
11721
11722 if (pad_fragP->fr_type == rs_machine_dependent
11723 && (TYPE_FROM_RELAX_STATE (pad_fragP->fr_subtype)
11724 == BRANCH_PADDING))
11725 {
11726 branch_fragP = i386_next_non_empty_frag (pad_fragP);
11727 if (branch_fragP->fr_type != rs_machine_dependent)
11728 return NULL;
11729 if (TYPE_FROM_RELAX_STATE (branch_fragP->fr_subtype) == COND_JUMP
11730 && i386_macro_fusible_p (maybe_cmp_fragP->tc_frag_data.mf_type,
11731 pad_fragP->tc_frag_data.mf_type))
11732 return branch_fragP;
11733 }
11734
11735 return NULL;
11736 }
11737
11738 /* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags. */
11739
11740 static void
11741 i386_classify_machine_dependent_frag (fragS *fragP)
11742 {
11743 fragS *cmp_fragP;
11744 fragS *pad_fragP;
11745 fragS *branch_fragP;
11746 fragS *next_fragP;
11747 unsigned int max_prefix_length;
11748
11749 if (fragP->tc_frag_data.classified)
11750 return;
11751
11752 /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING. Convert
11753 FUSED_JCC_PADDING and merge BRANCH_PADDING. */
11754 for (next_fragP = fragP;
11755 next_fragP != NULL;
11756 next_fragP = next_fragP->fr_next)
11757 {
11758 next_fragP->tc_frag_data.classified = 1;
11759 if (next_fragP->fr_type == rs_machine_dependent)
11760 switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
11761 {
11762 case BRANCH_PADDING:
11763 /* The BRANCH_PADDING frag must be followed by a branch
11764 frag. */
11765 branch_fragP = i386_next_non_empty_frag (next_fragP);
11766 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11767 break;
11768 case FUSED_JCC_PADDING:
11769 /* Check if this is a fused jcc:
11770 FUSED_JCC_PADDING
11771 CMP like instruction
11772 BRANCH_PADDING
11773 COND_JUMP
11774 */
11775 cmp_fragP = i386_next_non_empty_frag (next_fragP);
11776 pad_fragP = i386_next_non_empty_frag (cmp_fragP);
11777 branch_fragP = i386_next_fusible_jcc_frag (next_fragP, pad_fragP);
11778 if (branch_fragP)
11779 {
11780 /* The BRANCH_PADDING frag is merged with the
11781 FUSED_JCC_PADDING frag. */
11782 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11783 /* CMP like instruction size. */
11784 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
11785 frag_wane (pad_fragP);
11786 /* Skip to branch_fragP. */
11787 next_fragP = branch_fragP;
11788 }
11789 else if (next_fragP->tc_frag_data.max_prefix_length)
11790 {
11791 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
11792 a fused jcc. */
11793 next_fragP->fr_subtype
11794 = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
11795 next_fragP->tc_frag_data.max_bytes
11796 = next_fragP->tc_frag_data.max_prefix_length;
11797 /* This will be updated in the BRANCH_PREFIX scan. */
11798 next_fragP->tc_frag_data.max_prefix_length = 0;
11799 }
11800 else
11801 frag_wane (next_fragP);
11802 break;
11803 }
11804 }
11805
11806 /* Stop if there is no BRANCH_PREFIX. */
11807 if (!align_branch_prefix_size)
11808 return;
11809
11810 /* Scan for BRANCH_PREFIX. */
11811 for (; fragP != NULL; fragP = fragP->fr_next)
11812 {
11813 if (fragP->fr_type != rs_machine_dependent
11814 || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11815 != BRANCH_PREFIX))
11816 continue;
11817
11818 /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
11819 FUSED_JCC_PADDING. */
11820 max_prefix_length = 0;
11821 for (next_fragP = fragP;
11822 next_fragP != NULL;
11823 next_fragP = next_fragP->fr_next)
11824 {
11825 if (next_fragP->fr_type == rs_fill)
11826 /* Skip rs_fill frags. */
11827 continue;
11828 else if (next_fragP->fr_type != rs_machine_dependent)
11829 /* Stop for all other frags. */
11830 break;
11831
11832 /* rs_machine_dependent frags. */
11833 if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11834 == BRANCH_PREFIX)
11835 {
11836 /* Count BRANCH_PREFIX frags. */
11837 if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
11838 {
11839 max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
11840 frag_wane (next_fragP);
11841 }
11842 else
11843 max_prefix_length
11844 += next_fragP->tc_frag_data.max_bytes;
11845 }
11846 else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11847 == BRANCH_PADDING)
11848 || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11849 == FUSED_JCC_PADDING))
11850 {
11851 /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING. */
11852 fragP->tc_frag_data.u.padding_fragP = next_fragP;
11853 break;
11854 }
11855 else
11856 /* Stop for other rs_machine_dependent frags. */
11857 break;
11858 }
11859
11860 fragP->tc_frag_data.max_prefix_length = max_prefix_length;
11861
11862 /* Skip to the next frag. */
11863 fragP = next_fragP;
11864 }
11865 }
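/* Editorial example, not from the original source: with branch
   alignment enabled (e.g. -mbranches-within-32B-boundaries), a
   fusible pair such as

       cmpl $0, %eax
       je   target

   is emitted as the frag chain
       FUSED_JCC_PADDING -> cmp insn -> BRANCH_PADDING -> jcc insn
   and the scan above wanes the BRANCH_PADDING frag, leaving the
   FUSED_JCC_PADDING frag to pad the cmp+jcc pair as one unit.  */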
11866
11867 /* Compute padding size for
11868
11869 FUSED_JCC_PADDING
11870 CMP like instruction
11871 BRANCH_PADDING
11872 COND_JUMP/UNCOND_JUMP
11873
11874 or
11875
11876 BRANCH_PADDING
11877 COND_JUMP/UNCOND_JUMP
11878 */
11879
11880 static int
11881 i386_branch_padding_size (fragS *fragP, offsetT address)
11882 {
11883 unsigned int offset, size, padding_size;
11884 fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
11885
11886 /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag. */
11887 if (!address)
11888 address = fragP->fr_address;
11889 address += fragP->fr_fix;
11890
11891 /* CMP like instruction size. */
11892 size = fragP->tc_frag_data.cmp_size;
11893
11894 /* The base size of the branch frag. */
11895 size += branch_fragP->fr_fix;
11896
11897 /* Add opcode and displacement bytes for the rs_machine_dependent
11898 branch frag. */
11899 if (branch_fragP->fr_type == rs_machine_dependent)
11900 size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
11901
11902 /* Check that the branch stays within the boundary and doesn't
11903 end at its last byte. */
11904 offset = address & ((1U << align_branch_power) - 1);
11905 if ((offset + size) >= (1U << align_branch_power))
11906 /* Padding needed to avoid crossing boundary. */
11907 padding_size = (1U << align_branch_power) - offset;
11908 else
11909 /* No padding needed. */
11910 padding_size = 0;
11911
11912 /* The return value may be saved in tc_frag_data.length, which is
11913 an unsigned byte. */
11914 if (!fits_in_unsigned_byte (padding_size))
11915 abort ();
11916
11917 return padding_size;
11918 }
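/* Worked example (editorial): with align_branch_power == 5, i.e. a
   32-byte boundary, a 6-byte fused cmp+jcc pair starting at address
   0x3c gives offset = 0x3c & 31 = 28, and 28 + 6 = 34 >= 32, so
   padding_size = 32 - 28 = 4; the pair is pushed to 0x40 instead of
   straddling the boundary.  */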
11919
11920 /* i386_generic_table_relax_frag()
11921
11922 Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
11923 grow/shrink padding to align branch frags. Hand others to
11924 relax_frag(). */
11925
11926 long
11927 i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
11928 {
11929 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11930 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11931 {
11932 long padding_size = i386_branch_padding_size (fragP, 0);
11933 long grow = padding_size - fragP->tc_frag_data.length;
11934
11935 /* When the BRANCH_PREFIX frag is used, the computed address
11936 must match the actual address and there should be no padding. */
11937 if (fragP->tc_frag_data.padding_address
11938 && (fragP->tc_frag_data.padding_address != fragP->fr_address
11939 || padding_size))
11940 abort ();
11941
11942 /* Update the padding size. */
11943 if (grow)
11944 fragP->tc_frag_data.length = padding_size;
11945
11946 return grow;
11947 }
11948 else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11949 {
11950 fragS *padding_fragP, *next_fragP;
11951 long padding_size, left_size, last_size;
11952
11953 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11954 if (!padding_fragP)
11955 /* Use the padding set by the leading BRANCH_PREFIX frag. */
11956 return (fragP->tc_frag_data.length
11957 - fragP->tc_frag_data.last_length);
11958
11959 /* Compute the relative address of the padding frag the very
11960 first time, when the BRANCH_PREFIX frag sizes are all zero. */
11961 if (!fragP->tc_frag_data.padding_address)
11962 fragP->tc_frag_data.padding_address
11963 = padding_fragP->fr_address - (fragP->fr_address - stretch);
11964
11965 /* First update the last length from the previous iteration. */
11966 left_size = fragP->tc_frag_data.prefix_length;
11967 for (next_fragP = fragP;
11968 next_fragP != padding_fragP;
11969 next_fragP = next_fragP->fr_next)
11970 if (next_fragP->fr_type == rs_machine_dependent
11971 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11972 == BRANCH_PREFIX))
11973 {
11974 if (left_size)
11975 {
11976 int max = next_fragP->tc_frag_data.max_bytes;
11977 if (max)
11978 {
11979 int size;
11980 if (max > left_size)
11981 size = left_size;
11982 else
11983 size = max;
11984 left_size -= size;
11985 next_fragP->tc_frag_data.last_length = size;
11986 }
11987 }
11988 else
11989 next_fragP->tc_frag_data.last_length = 0;
11990 }
11991
11992 /* Check the padding size for the padding frag. */
11993 padding_size = i386_branch_padding_size
11994 (padding_fragP, (fragP->fr_address
11995 + fragP->tc_frag_data.padding_address));
11996
11997 last_size = fragP->tc_frag_data.prefix_length;
11998 /* Check if there is any change from the last iteration. */
11999 if (padding_size == last_size)
12000 {
12001 /* Update the expected address of the padding frag. */
12002 padding_fragP->tc_frag_data.padding_address
12003 = (fragP->fr_address + padding_size
12004 + fragP->tc_frag_data.padding_address);
12005 return 0;
12006 }
12007
12008 if (padding_size > fragP->tc_frag_data.max_prefix_length)
12009 {
12010 /* No padding if there is insufficient room. Clear the
12011 expected address of the padding frag. */
12012 padding_fragP->tc_frag_data.padding_address = 0;
12013 padding_size = 0;
12014 }
12015 else
12016 /* Store the expected address of the padding frag. */
12017 padding_fragP->tc_frag_data.padding_address
12018 = (fragP->fr_address + padding_size
12019 + fragP->tc_frag_data.padding_address);
12020
12021 fragP->tc_frag_data.prefix_length = padding_size;
12022
12023 /* Update the length for the current iteration. */
12024 left_size = padding_size;
12025 for (next_fragP = fragP;
12026 next_fragP != padding_fragP;
12027 next_fragP = next_fragP->fr_next)
12028 if (next_fragP->fr_type == rs_machine_dependent
12029 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
12030 == BRANCH_PREFIX))
12031 {
12032 if (left_size)
12033 {
12034 int max = next_fragP->tc_frag_data.max_bytes;
12035 if (max)
12036 {
12037 int size;
12038 if (max > left_size)
12039 size = left_size;
12040 else
12041 size = max;
12042 left_size -= size;
12043 next_fragP->tc_frag_data.length = size;
12044 }
12045 }
12046 else
12047 next_fragP->tc_frag_data.length = 0;
12048 }
12049
12050 return (fragP->tc_frag_data.length
12051 - fragP->tc_frag_data.last_length);
12052 }
12053 return relax_frag (segment, fragP, stretch);
12054 }
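/* Worked example (editorial): if the padding frag needs
   padding_size == 7 and is preceded by three BRANCH_PREFIX frags
   whose max_bytes are 5, 5 and 5, the loop above assigns lengths
   5, 2 and 0; that is, segment prefixes are handed out greedily to
   the earlier instructions until the padding is used up.  */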
12055
12056 /* md_estimate_size_before_relax()
12057
12058 Called just before relax() for rs_machine_dependent frags. The x86
12059 assembler uses these frags to handle variable size jump
12060 instructions.
12061
12062 Any symbol that is now undefined will not become defined.
12063 Return the correct fr_subtype in the frag.
12064 Return the initial "guess for variable size of frag" to caller.
12065 The guess is actually the growth beyond the fixed part. Whatever
12066 we do to grow the fixed or variable part contributes to our
12067 returned value. */
12068
12069 int
12070 md_estimate_size_before_relax (fragS *fragP, segT segment)
12071 {
12072 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12073 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
12074 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
12075 {
12076 i386_classify_machine_dependent_frag (fragP);
12077 return fragP->tc_frag_data.length;
12078 }
12079
12080 /* We've already got fragP->fr_subtype right; all we have to do is
12081 check for un-relaxable symbols. On an ELF system, we can't relax
12082 an externally visible symbol, because it may be overridden by a
12083 shared library. */
12084 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
12085 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12086 || (IS_ELF
12087 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
12088 fragP->fr_var))
12089 #endif
12090 #if defined (OBJ_COFF) && defined (TE_PE)
12091 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
12092 && S_IS_WEAK (fragP->fr_symbol))
12093 #endif
12094 )
12095 {
12096 /* Symbol is undefined in this segment, or we need to keep a
12097 reloc so that weak symbols can be overridden. */
12098 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
12099 enum bfd_reloc_code_real reloc_type;
12100 unsigned char *opcode;
12101 int old_fr_fix;
12102
12103 if (fragP->fr_var != NO_RELOC)
12104 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
12105 else if (size == 2)
12106 reloc_type = BFD_RELOC_16_PCREL;
12107 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12108 else if (need_plt32_p (fragP->fr_symbol))
12109 reloc_type = BFD_RELOC_X86_64_PLT32;
12110 #endif
12111 else
12112 reloc_type = BFD_RELOC_32_PCREL;
12113
12114 old_fr_fix = fragP->fr_fix;
12115 opcode = (unsigned char *) fragP->fr_opcode;
12116
12117 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
12118 {
12119 case UNCOND_JUMP:
12120 /* Make jmp (0xeb) a (d)word displacement jump. */
12121 opcode[0] = 0xe9;
12122 fragP->fr_fix += size;
12123 fix_new (fragP, old_fr_fix, size,
12124 fragP->fr_symbol,
12125 fragP->fr_offset, 1,
12126 reloc_type);
12127 break;
12128
12129 case COND_JUMP86:
12130 if (size == 2
12131 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
12132 {
12133 /* Negate the condition, and branch past an
12134 unconditional jump. */
12135 opcode[0] ^= 1;
12136 opcode[1] = 3;
12137 /* Insert an unconditional jump. */
12138 opcode[2] = 0xe9;
12139 /* We added two extra opcode bytes, and have a two byte
12140 offset. */
12141 fragP->fr_fix += 2 + 2;
12142 fix_new (fragP, old_fr_fix + 2, 2,
12143 fragP->fr_symbol,
12144 fragP->fr_offset, 1,
12145 reloc_type);
12146 break;
12147 }
12148 /* Fall through. */
12149
12150 case COND_JUMP:
12151 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
12152 {
12153 fixS *fixP;
12154
12155 fragP->fr_fix += 1;
12156 fixP = fix_new (fragP, old_fr_fix, 1,
12157 fragP->fr_symbol,
12158 fragP->fr_offset, 1,
12159 BFD_RELOC_8_PCREL);
12160 fixP->fx_signed = 1;
12161 break;
12162 }
12163
12164 /* This changes the byte-displacement jump 0x7N
12165 to the (d)word-displacement jump 0x0f,0x8N. */
12166 opcode[1] = opcode[0] + 0x10;
12167 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12168 /* We've added an opcode byte. */
12169 fragP->fr_fix += 1 + size;
12170 fix_new (fragP, old_fr_fix + 1, size,
12171 fragP->fr_symbol,
12172 fragP->fr_offset, 1,
12173 reloc_type);
12174 break;
12175
12176 default:
12177 BAD_CASE (fragP->fr_subtype);
12178 break;
12179 }
12180 frag_wane (fragP);
12181 return fragP->fr_fix - old_fr_fix;
12182 }
12183
12184 /* Guess size depending on current relax state. Initially the relax
12185 state will correspond to a short jump and we return 1, because
12186 the variable part of the frag (the branch offset) is one byte
12187 long. However, we can relax a section more than once and in that
12188 case we must either set fr_subtype back to the unrelaxed state,
12189 or return the value for the appropriate branch. */
12190 return md_relax_table[fragP->fr_subtype].rlx_length;
12191 }
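/* Editorial byte-level example: a `je' whose target needs more than
   a disp8 and cannot stay relaxable is rewritten above as

       74 cb        je  target     (byte displacement)
   ->  0F 84 cd     je  target     (dword displacement)

   since opcode[1] = 0x74 + 0x10 = 0x84 after the 0x0F escape.  In
   the 16-bit COND_JUMP86 case it instead negates the condition and
   hops over a word-displacement jump:

       75 03        jne .+5        (inverted condition, skip 3 bytes)
       E9 cw        jmp target  */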
12192
12193 /* Called after relax() is finished.
12194
12195 In: Address of frag.
12196 fr_type == rs_machine_dependent.
12197 fr_subtype is what the address relaxed to.
12198
12199 Out: Any fixSs and constants are set up.
12200 Caller will turn frag into a ".space 0". */
12201
12202 void
12203 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
12204 fragS *fragP)
12205 {
12206 unsigned char *opcode;
12207 unsigned char *where_to_put_displacement = NULL;
12208 offsetT target_address;
12209 offsetT opcode_address;
12210 unsigned int extension = 0;
12211 offsetT displacement_from_opcode_start;
12212
12213 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12214 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
12215 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12216 {
12217 /* Generate nop padding. */
12218 unsigned int size = fragP->tc_frag_data.length;
12219 if (size)
12220 {
12221 if (size > fragP->tc_frag_data.max_bytes)
12222 abort ();
12223
12224 if (flag_debug)
12225 {
12226 const char *msg;
12227 const char *branch = "branch";
12228 const char *prefix = "";
12229 fragS *padding_fragP;
12230 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
12231 == BRANCH_PREFIX)
12232 {
12233 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
12234 switch (fragP->tc_frag_data.default_prefix)
12235 {
12236 default:
12237 abort ();
12238 break;
12239 case CS_PREFIX_OPCODE:
12240 prefix = " cs";
12241 break;
12242 case DS_PREFIX_OPCODE:
12243 prefix = " ds";
12244 break;
12245 case ES_PREFIX_OPCODE:
12246 prefix = " es";
12247 break;
12248 case FS_PREFIX_OPCODE:
12249 prefix = " fs";
12250 break;
12251 case GS_PREFIX_OPCODE:
12252 prefix = " gs";
12253 break;
12254 case SS_PREFIX_OPCODE:
12255 prefix = " ss";
12256 break;
12257 }
12258 if (padding_fragP)
12259 msg = _("%s:%u: add %d%s at 0x%llx to align "
12260 "%s within %d-byte boundary\n");
12261 else
12262 msg = _("%s:%u: add additional %d%s at 0x%llx to "
12263 "align %s within %d-byte boundary\n");
12264 }
12265 else
12266 {
12267 padding_fragP = fragP;
12268 msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
12269 "%s within %d-byte boundary\n");
12270 }
12271
12272 if (padding_fragP)
12273 switch (padding_fragP->tc_frag_data.branch_type)
12274 {
12275 case align_branch_jcc:
12276 branch = "jcc";
12277 break;
12278 case align_branch_fused:
12279 branch = "fused jcc";
12280 break;
12281 case align_branch_jmp:
12282 branch = "jmp";
12283 break;
12284 case align_branch_call:
12285 branch = "call";
12286 break;
12287 case align_branch_indirect:
12288 branch = "indiret branch";
12289 break;
12290 case align_branch_ret:
12291 branch = "ret";
12292 break;
12293 default:
12294 break;
12295 }
12296
12297 fprintf (stdout, msg,
12298 fragP->fr_file, fragP->fr_line, size, prefix,
12299 (long long) fragP->fr_address, branch,
12300 1 << align_branch_power);
12301 }
12302 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12303 memset (fragP->fr_opcode,
12304 fragP->tc_frag_data.default_prefix, size);
12305 else
12306 i386_generate_nops (fragP, (char *) fragP->fr_opcode,
12307 size, 0);
12308 fragP->fr_fix += size;
12309 }
12310 return;
12311 }
12312
12313 opcode = (unsigned char *) fragP->fr_opcode;
12314
12315 /* Address we want to reach in file space. */
12316 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
12317
12318 /* Address opcode resides at in file space. */
12319 opcode_address = fragP->fr_address + fragP->fr_fix;
12320
12321 /* Displacement from opcode start to fill into instruction. */
12322 displacement_from_opcode_start = target_address - opcode_address;
12323
12324 if ((fragP->fr_subtype & BIG) == 0)
12325 {
12326 /* Don't have to change opcode. */
12327 extension = 1; /* 1 opcode + 1 displacement */
12328 where_to_put_displacement = &opcode[1];
12329 }
12330 else
12331 {
12332 if (no_cond_jump_promotion
12333 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
12334 as_warn_where (fragP->fr_file, fragP->fr_line,
12335 _("long jump required"));
12336
12337 switch (fragP->fr_subtype)
12338 {
12339 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
12340 extension = 4; /* 1 opcode + 4 displacement */
12341 opcode[0] = 0xe9;
12342 where_to_put_displacement = &opcode[1];
12343 break;
12344
12345 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
12346 extension = 2; /* 1 opcode + 2 displacement */
12347 opcode[0] = 0xe9;
12348 where_to_put_displacement = &opcode[1];
12349 break;
12350
12351 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
12352 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
12353 extension = 5; /* 2 opcode + 4 displacement */
12354 opcode[1] = opcode[0] + 0x10;
12355 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12356 where_to_put_displacement = &opcode[2];
12357 break;
12358
12359 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
12360 extension = 3; /* 2 opcode + 2 displacement */
12361 opcode[1] = opcode[0] + 0x10;
12362 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12363 where_to_put_displacement = &opcode[2];
12364 break;
12365
12366 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
12367 extension = 4;
12368 opcode[0] ^= 1;
12369 opcode[1] = 3;
12370 opcode[2] = 0xe9;
12371 where_to_put_displacement = &opcode[3];
12372 break;
12373
12374 default:
12375 BAD_CASE (fragP->fr_subtype);
12376 break;
12377 }
12378 }
12379
12380 /* If the size is less than four, we are sure that the operand fits,
12381 but if it's 4, then the displacement could be larger
12382 than +/- 2GB. */
12383 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
12384 && object_64bit
12385 && ((addressT) (displacement_from_opcode_start - extension
12386 + ((addressT) 1 << 31))
12387 > (((addressT) 2 << 31) - 1)))
12388 {
12389 as_bad_where (fragP->fr_file, fragP->fr_line,
12390 _("jump target out of range"));
12391 /* Make us emit 0. */
12392 displacement_from_opcode_start = extension;
12393 }
12394 /* Now put displacement after opcode. */
12395 md_number_to_chars ((char *) where_to_put_displacement,
12396 (valueT) (displacement_from_opcode_start - extension),
12397 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
12398 fragP->fr_fix += extension;
12399 }
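/* Worked example (editorial): for a relaxed unconditional jump,
   extension == 4 and opcode_address == fr_address + fr_fix.  With
   opcode_address 0x100 and a target of 0x200:

       displacement_from_opcode_start = 0x100
       stored disp32 = 0x100 - 4 = 0xfc

   and since the instruction ends at 0x104, the CPU computes
   0x104 + 0xfc = 0x200 as intended.  */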
12400 \f
12401 /* Apply a fixup (fixP) to segment data, once it has been determined
12402 by our caller that we have all the info we need to fix it up.
12403
12404 Parameter valP is the pointer to the value of the bits.
12405
12406 On the 386, immediates, displacements, and data pointers are all in
12407 the same (little-endian) format, so we don't need to care about which
12408 we are handling. */
12409
12410 void
12411 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
12412 {
12413 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
12414 valueT value = *valP;
12415
12416 #if !defined (TE_Mach)
12417 if (fixP->fx_pcrel)
12418 {
12419 switch (fixP->fx_r_type)
12420 {
12421 default:
12422 break;
12423
12424 case BFD_RELOC_64:
12425 fixP->fx_r_type = BFD_RELOC_64_PCREL;
12426 break;
12427 case BFD_RELOC_32:
12428 case BFD_RELOC_X86_64_32S:
12429 fixP->fx_r_type = BFD_RELOC_32_PCREL;
12430 break;
12431 case BFD_RELOC_16:
12432 fixP->fx_r_type = BFD_RELOC_16_PCREL;
12433 break;
12434 case BFD_RELOC_8:
12435 fixP->fx_r_type = BFD_RELOC_8_PCREL;
12436 break;
12437 }
12438 }
12439
12440 if (fixP->fx_addsy != NULL
12441 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
12442 || fixP->fx_r_type == BFD_RELOC_64_PCREL
12443 || fixP->fx_r_type == BFD_RELOC_16_PCREL
12444 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
12445 && !use_rela_relocations)
12446 {
12447 /* This is a hack. There should be a better way to handle this.
12448 This covers for the fact that bfd_install_relocation will
12449 subtract the current location (for partial_inplace, PC relative
12450 relocations); see more below. */
12451 #ifndef OBJ_AOUT
12452 if (IS_ELF
12453 #ifdef TE_PE
12454 || OUTPUT_FLAVOR == bfd_target_coff_flavour
12455 #endif
12456 )
12457 value += fixP->fx_where + fixP->fx_frag->fr_address;
12458 #endif
12459 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12460 if (IS_ELF)
12461 {
12462 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
12463
12464 if ((sym_seg == seg
12465 || (symbol_section_p (fixP->fx_addsy)
12466 && sym_seg != absolute_section))
12467 && !generic_force_reloc (fixP))
12468 {
12469 /* Yes, we add the values in twice. This is because
12470 bfd_install_relocation subtracts them out again. I think
12471 bfd_install_relocation is broken, but I don't dare change
12472 it. FIXME. */
12473 value += fixP->fx_where + fixP->fx_frag->fr_address;
12474 }
12475 }
12476 #endif
12477 #if defined (OBJ_COFF) && defined (TE_PE)
12478 /* For some reason, the PE format does not store a
12479 section address offset for a PC relative symbol. */
12480 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
12481 || S_IS_WEAK (fixP->fx_addsy))
12482 value += md_pcrel_from (fixP);
12483 #endif
12484 }
12485 #if defined (OBJ_COFF) && defined (TE_PE)
12486 if (fixP->fx_addsy != NULL
12487 && S_IS_WEAK (fixP->fx_addsy)
12488 /* PR 16858: Do not modify weak function references. */
12489 && ! fixP->fx_pcrel)
12490 {
12491 #if !defined (TE_PEP)
12492 /* For x86 PE weak function symbols are neither PC-relative
12493 nor do they set S_IS_FUNCTION. So the only reliable way
12494 to detect them is to check the flags of their containing
12495 section. */
12496 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
12497 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
12498 ;
12499 else
12500 #endif
12501 value -= S_GET_VALUE (fixP->fx_addsy);
12502 }
12503 #endif
12504
12505 /* Fix a few things - the dynamic linker expects certain values here,
12506 and we must not disappoint it. */
12507 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12508 if (IS_ELF && fixP->fx_addsy)
12509 switch (fixP->fx_r_type)
12510 {
12511 case BFD_RELOC_386_PLT32:
12512 case BFD_RELOC_X86_64_PLT32:
12513 /* Make the jump instruction point to the address of the operand.
12514 At runtime we merely add the offset to the actual PLT entry.
12515 NB: Subtract the offset size only for jump instructions. */
12516 if (fixP->fx_pcrel)
12517 value = -4;
12518 break;
12519
12520 case BFD_RELOC_386_TLS_GD:
12521 case BFD_RELOC_386_TLS_LDM:
12522 case BFD_RELOC_386_TLS_IE_32:
12523 case BFD_RELOC_386_TLS_IE:
12524 case BFD_RELOC_386_TLS_GOTIE:
12525 case BFD_RELOC_386_TLS_GOTDESC:
12526 case BFD_RELOC_X86_64_TLSGD:
12527 case BFD_RELOC_X86_64_TLSLD:
12528 case BFD_RELOC_X86_64_GOTTPOFF:
12529 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
12530 value = 0; /* Fully resolved at runtime. No addend. */
12531 /* Fallthrough */
12532 case BFD_RELOC_386_TLS_LE:
12533 case BFD_RELOC_386_TLS_LDO_32:
12534 case BFD_RELOC_386_TLS_LE_32:
12535 case BFD_RELOC_X86_64_DTPOFF32:
12536 case BFD_RELOC_X86_64_DTPOFF64:
12537 case BFD_RELOC_X86_64_TPOFF32:
12538 case BFD_RELOC_X86_64_TPOFF64:
12539 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12540 break;
12541
12542 case BFD_RELOC_386_TLS_DESC_CALL:
12543 case BFD_RELOC_X86_64_TLSDESC_CALL:
12544 value = 0; /* Fully resolved at runtime. No addend. */
12545 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12546 fixP->fx_done = 0;
12547 return;
12548
12549 case BFD_RELOC_VTABLE_INHERIT:
12550 case BFD_RELOC_VTABLE_ENTRY:
12551 fixP->fx_done = 0;
12552 return;
12553
12554 default:
12555 break;
12556 }
12557 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
12558 *valP = value;
12559 #endif /* !defined (TE_Mach) */
12560
12561 /* Are we finished with this relocation now? */
12562 if (fixP->fx_addsy == NULL)
12563 fixP->fx_done = 1;
12564 #if defined (OBJ_COFF) && defined (TE_PE)
12565 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
12566 {
12567 fixP->fx_done = 0;
12568 /* Remember value for tc_gen_reloc. */
12569 fixP->fx_addnumber = value;
12570 /* Clear out the frag for now. */
12571 value = 0;
12572 }
12573 #endif
12574 else if (use_rela_relocations)
12575 {
12576 fixP->fx_no_overflow = 1;
12577 /* Remember value for tc_gen_reloc. */
12578 fixP->fx_addnumber = value;
12579 value = 0;
12580 }
12581
12582 md_number_to_chars (p, value, fixP->fx_size);
12583 }
12584 \f
12585 const char *
12586 md_atof (int type, char *litP, int *sizeP)
12587 {
12588 /* This outputs the LITTLENUMs in REVERSE order,
12589 in accord with the little-endian 386. */
12590 return ieee_md_atof (type, litP, sizeP, FALSE);
12591 }
12592 \f
12593 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
12594
12595 static char *
12596 output_invalid (int c)
12597 {
12598 if (ISPRINT (c))
12599 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12600 "'%c'", c);
12601 else
12602 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12603 "(0x%x)", (unsigned char) c);
12604 return output_invalid_buf;
12605 }
12606
12607 /* Verify that @r can be used in the current context. */
12608
12609 static bfd_boolean check_register (const reg_entry *r)
12610 {
12611 if (allow_pseudo_reg)
12612 return TRUE;
12613
12614 if (operand_type_all_zero (&r->reg_type))
12615 return FALSE;
12616
12617 if ((r->reg_type.bitfield.dword
12618 || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
12619 || r->reg_type.bitfield.class == RegCR
12620 || r->reg_type.bitfield.class == RegDR)
12621 && !cpu_arch_flags.bitfield.cpui386)
12622 return FALSE;
12623
12624 if (r->reg_type.bitfield.class == RegTR
12625 && (flag_code == CODE_64BIT
12626 || !cpu_arch_flags.bitfield.cpui386
12627 || cpu_arch_isa_flags.bitfield.cpui586
12628 || cpu_arch_isa_flags.bitfield.cpui686))
12629 return FALSE;
12630
12631 if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
12632 return FALSE;
12633
12634 if (!cpu_arch_flags.bitfield.cpuavx512f)
12635 {
12636 if (r->reg_type.bitfield.zmmword
12637 || r->reg_type.bitfield.class == RegMask)
12638 return FALSE;
12639
12640 if (!cpu_arch_flags.bitfield.cpuavx)
12641 {
12642 if (r->reg_type.bitfield.ymmword)
12643 return FALSE;
12644
12645 if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
12646 return FALSE;
12647 }
12648 }
12649
12650 if (r->reg_type.bitfield.tmmword
12651 && (!cpu_arch_flags.bitfield.cpuamx_tile
12652 || flag_code != CODE_64BIT))
12653 return FALSE;
12654
12655 if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
12656 return FALSE;
12657
12658 /* Don't allow the fake index register unless allow_index_reg is non-zero. */
12659 if (!allow_index_reg && r->reg_num == RegIZ)
12660 return FALSE;
12661
12662 /* Upper 16 vector registers are only available with VREX in 64bit
12663 mode, and require EVEX encoding. */
12664 if (r->reg_flags & RegVRex)
12665 {
12666 if (!cpu_arch_flags.bitfield.cpuavx512f
12667 || flag_code != CODE_64BIT)
12668 return FALSE;
12669
12670 if (i.vec_encoding == vex_encoding_default)
12671 i.vec_encoding = vex_encoding_evex;
12672 else if (i.vec_encoding != vex_encoding_evex)
12673 i.vec_encoding = vex_encoding_error;
12674 }
12675
12676 if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
12677 && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
12678 && flag_code != CODE_64BIT)
12679 return FALSE;
12680
12681 if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
12682 && !intel_syntax)
12683 return FALSE;
12684
12685 return TRUE;
12686 }
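/* Editorial sketch, not part of the original file: how the VREX
   rule above plays out for a caller.  Assumes XMM16 is a reg_entry
   with RegVRex set and that i.vec_encoding started out as
   vex_encoding_default; the guard macro is hypothetical.  */
#ifdef CHECK_REGISTER_EXAMPLE
static void
check_register_example (const reg_entry *xmm16)
{
  if (flag_code != CODE_64BIT || !cpu_arch_flags.bitfield.cpuavx512f)
    /* %xmm16..%xmm31 are rejected outside 64-bit AVX512F mode.  */
    gas_assert (!check_register (xmm16));
  else
    {
      /* Accepted, and the default encoding is upgraded to EVEX
	 as a side effect.  */
      gas_assert (check_register (xmm16));
      gas_assert (i.vec_encoding == vex_encoding_evex);
    }
}
#endif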
12687
12688 /* REG_STRING starts *before* REGISTER_PREFIX. */
12689
12690 static const reg_entry *
12691 parse_real_register (char *reg_string, char **end_op)
12692 {
12693 char *s = reg_string;
12694 char *p;
12695 char reg_name_given[MAX_REG_NAME_SIZE + 1];
12696 const reg_entry *r;
12697
12698 /* Skip possible REGISTER_PREFIX and possible whitespace. */
12699 if (*s == REGISTER_PREFIX)
12700 ++s;
12701
12702 if (is_space_char (*s))
12703 ++s;
12704
12705 p = reg_name_given;
12706 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
12707 {
12708 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
12709 return (const reg_entry *) NULL;
12710 s++;
12711 }
12712
12713 /* For naked regs, make sure that we are not dealing with an identifier.
12714 This prevents confusing an identifier like `eax_var' with register
12715 `eax'. */
12716 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
12717 return (const reg_entry *) NULL;
12718
12719 *end_op = s;
12720
12721 r = (const reg_entry *) str_hash_find (reg_hash, reg_name_given);
12722
12723 /* Handle floating point regs, allowing spaces in the (i) part. */
12724 if (r == i386_regtab /* %st is first entry of table */)
12725 {
12726 if (!cpu_arch_flags.bitfield.cpu8087
12727 && !cpu_arch_flags.bitfield.cpu287
12728 && !cpu_arch_flags.bitfield.cpu387
12729 && !allow_pseudo_reg)
12730 return (const reg_entry *) NULL;
12731
12732 if (is_space_char (*s))
12733 ++s;
12734 if (*s == '(')
12735 {
12736 ++s;
12737 if (is_space_char (*s))
12738 ++s;
12739 if (*s >= '0' && *s <= '7')
12740 {
12741 int fpr = *s - '0';
12742 ++s;
12743 if (is_space_char (*s))
12744 ++s;
12745 if (*s == ')')
12746 {
12747 *end_op = s + 1;
12748 r = (const reg_entry *) str_hash_find (reg_hash, "st(0)");
12749 know (r);
12750 return r + fpr;
12751 }
12752 }
12753 /* We have "%st(" then garbage. */
12754 return (const reg_entry *) NULL;
12755 }
12756 }
12757
12758 return r && check_register (r) ? r : NULL;
12759 }
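/* Editorial examples, not from the original source: `%st' alone
   yields the first table entry, while `%st ( 3 )' (spaces are
   allowed around the index) resolves to st(3) by indexing three
   entries past the "st(0)" hash entry.  Malformed forms such as
   `%st(8)' or `%st(x)' take the "garbage" path and return NULL.  */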
12760
12761 /* REG_STRING starts *before* REGISTER_PREFIX. */
12762
12763 static const reg_entry *
12764 parse_register (char *reg_string, char **end_op)
12765 {
12766 const reg_entry *r;
12767
12768 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
12769 r = parse_real_register (reg_string, end_op);
12770 else
12771 r = NULL;
12772 if (!r)
12773 {
12774 char *save = input_line_pointer;
12775 char c;
12776 symbolS *symbolP;
12777
12778 input_line_pointer = reg_string;
12779 c = get_symbol_name (&reg_string);
12780 symbolP = symbol_find (reg_string);
12781 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
12782 {
12783 const expressionS *e = symbol_get_value_expression (symbolP);
12784
12785 know (e->X_op == O_register);
12786 know (e->X_add_number >= 0
12787 && (valueT) e->X_add_number < i386_regtab_size);
12788 r = i386_regtab + e->X_add_number;
12789 if (!check_register (r))
12790 {
12791 as_bad (_("register '%s%s' cannot be used here"),
12792 register_prefix, r->reg_name);
12793 r = &bad_reg;
12794 }
12795 *end_op = input_line_pointer;
12796 }
12797 *input_line_pointer = c;
12798 input_line_pointer = save;
12799 }
12800 return r;
12801 }
12802
12803 int
12804 i386_parse_name (char *name, expressionS *e, char *nextcharP)
12805 {
12806 const reg_entry *r;
12807 char *end = input_line_pointer;
12808
12809 *end = *nextcharP;
12810 r = parse_register (name, &input_line_pointer);
12811 if (r && end <= input_line_pointer)
12812 {
12813 *nextcharP = *input_line_pointer;
12814 *input_line_pointer = 0;
12815 if (r != &bad_reg)
12816 {
12817 e->X_op = O_register;
12818 e->X_add_number = r - i386_regtab;
12819 }
12820 else
12821 e->X_op = O_illegal;
12822 return 1;
12823 }
12824 input_line_pointer = end;
12825 *end = 0;
12826 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
12827 }
12828
12829 void
12830 md_operand (expressionS *e)
12831 {
12832 char *end;
12833 const reg_entry *r;
12834
12835 switch (*input_line_pointer)
12836 {
12837 case REGISTER_PREFIX:
12838 r = parse_real_register (input_line_pointer, &end);
12839 if (r)
12840 {
12841 e->X_op = O_register;
12842 e->X_add_number = r - i386_regtab;
12843 input_line_pointer = end;
12844 }
12845 break;
12846
12847 case '[':
12848 gas_assert (intel_syntax);
12849 end = input_line_pointer++;
12850 expression (e);
12851 if (*input_line_pointer == ']')
12852 {
12853 ++input_line_pointer;
12854 e->X_op_symbol = make_expr_symbol (e);
12855 e->X_add_symbol = NULL;
12856 e->X_add_number = 0;
12857 e->X_op = O_index;
12858 }
12859 else
12860 {
12861 e->X_op = O_absent;
12862 input_line_pointer = end;
12863 }
12864 break;
12865 }
12866 }
12867
12868 \f
12869 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12870 const char *md_shortopts = "kVQ:sqnO::";
12871 #else
12872 const char *md_shortopts = "qnO::";
12873 #endif
12874
12875 #define OPTION_32 (OPTION_MD_BASE + 0)
12876 #define OPTION_64 (OPTION_MD_BASE + 1)
12877 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
12878 #define OPTION_MARCH (OPTION_MD_BASE + 3)
12879 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
12880 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
12881 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
12882 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
12883 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
12884 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
12885 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
12886 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
12887 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
12888 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
12889 #define OPTION_X32 (OPTION_MD_BASE + 14)
12890 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
12891 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
12892 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
12893 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
12894 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
12895 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
12896 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
12897 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
12898 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
12899 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
12900 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
12901 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
12902 #define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
12903 #define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
12904 #define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
12905 #define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
12906 #define OPTION_MLFENCE_AFTER_LOAD (OPTION_MD_BASE + 31)
12907 #define OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH (OPTION_MD_BASE + 32)
12908 #define OPTION_MLFENCE_BEFORE_RET (OPTION_MD_BASE + 33)
12909
12910 struct option md_longopts[] =
12911 {
12912 {"32", no_argument, NULL, OPTION_32},
12913 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12914 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12915 {"64", no_argument, NULL, OPTION_64},
12916 #endif
12917 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12918 {"x32", no_argument, NULL, OPTION_X32},
12919 {"mshared", no_argument, NULL, OPTION_MSHARED},
12920 {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
12921 #endif
12922 {"divide", no_argument, NULL, OPTION_DIVIDE},
12923 {"march", required_argument, NULL, OPTION_MARCH},
12924 {"mtune", required_argument, NULL, OPTION_MTUNE},
12925 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
12926 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
12927 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
12928 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
12929 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
12930 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
12931 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
12932 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
12933 {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
12934 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
12935 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
12936 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
12937 # if defined (TE_PE) || defined (TE_PEP)
12938 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
12939 #endif
12940 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
12941 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
12942 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
12943 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
12944 {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
12945 {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
12946 {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
12947 {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
12948 {"mlfence-after-load", required_argument, NULL, OPTION_MLFENCE_AFTER_LOAD},
12949 {"mlfence-before-indirect-branch", required_argument, NULL,
12950 OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH},
12951 {"mlfence-before-ret", required_argument, NULL, OPTION_MLFENCE_BEFORE_RET},
12952 {"mamd64", no_argument, NULL, OPTION_MAMD64},
12953 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
12954 {NULL, no_argument, NULL, 0}
12955 };
12956 size_t md_longopts_size = sizeof (md_longopts);
12957
12958 int
12959 md_parse_option (int c, const char *arg)
12960 {
12961 unsigned int j;
12962 char *arch, *next, *saved, *type;
12963
12964 switch (c)
12965 {
12966 case 'n':
12967 optimize_align_code = 0;
12968 break;
12969
12970 case 'q':
12971 quiet_warnings = 1;
12972 break;
12973
12974 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12975 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
12976 should be emitted or not. FIXME: Not implemented. */
12977 case 'Q':
12978 if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
12979 return 0;
12980 break;
12981
12982 /* -V: SVR4 argument to print version ID. */
12983 case 'V':
12984 print_version_id ();
12985 break;
12986
12987 /* -k: Ignore for FreeBSD compatibility. */
12988 case 'k':
12989 break;
12990
12991 case 's':
12992 /* -s: On i386 Solaris, this tells the native assembler to use
12993 .stab instead of .stab.excl. We always use .stab anyhow. */
12994 break;
12995
12996 case OPTION_MSHARED:
12997 shared = 1;
12998 break;
12999
13000 case OPTION_X86_USED_NOTE:
13001 if (strcasecmp (arg, "yes") == 0)
13002 x86_used_note = 1;
13003 else if (strcasecmp (arg, "no") == 0)
13004 x86_used_note = 0;
13005 else
13006 as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
13007 break;
13008
13009
13010 #endif
13011 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13012 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
13013 case OPTION_64:
13014 {
13015 const char **list, **l;
13016
13017 list = bfd_target_list ();
13018 for (l = list; *l != NULL; l++)
13019 if (CONST_STRNEQ (*l, "elf64-x86-64")
13020 || strcmp (*l, "coff-x86-64") == 0
13021 || strcmp (*l, "pe-x86-64") == 0
13022 || strcmp (*l, "pei-x86-64") == 0
13023 || strcmp (*l, "mach-o-x86-64") == 0)
13024 {
13025 default_arch = "x86_64";
13026 break;
13027 }
13028 if (*l == NULL)
13029 as_fatal (_("no compiled in support for x86_64"));
13030 free (list);
13031 }
13032 break;
13033 #endif
13034
13035 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13036 case OPTION_X32:
13037 if (IS_ELF)
13038 {
13039 const char **list, **l;
13040
13041 list = bfd_target_list ();
13042 for (l = list; *l != NULL; l++)
13043 if (CONST_STRNEQ (*l, "elf32-x86-64"))
13044 {
13045 default_arch = "x86_64:32";
13046 break;
13047 }
13048 if (*l == NULL)
13049 as_fatal (_("no compiled in support for 32bit x86_64"));
13050 free (list);
13051 }
13052 else
13053 as_fatal (_("32bit x86_64 is only supported for ELF"));
13054 break;
13055 #endif
13056
13057 case OPTION_32:
13058 default_arch = "i386";
13059 break;
13060
13061 case OPTION_DIVIDE:
13062 #ifdef SVR4_COMMENT_CHARS
13063 {
13064 char *n, *t;
13065 const char *s;
13066
13067 n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
13068 t = n;
13069 for (s = i386_comment_chars; *s != '\0'; s++)
13070 if (*s != '/')
13071 *t++ = *s;
13072 *t = '\0';
13073 i386_comment_chars = n;
13074 }
13075 #endif
13076 break;
13077
13078 case OPTION_MARCH:
13079 saved = xstrdup (arg);
13080 arch = saved;
13081 /* Allow -march=+nosse. */
13082 if (*arch == '+')
13083 arch++;
13084 do
13085 {
13086 if (*arch == '.')
13087 as_fatal (_("invalid -march= option: `%s'"), arg);
13088 next = strchr (arch, '+');
13089 if (next)
13090 *next++ = '\0';
13091 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13092 {
13093 if (strcmp (arch, cpu_arch [j].name) == 0)
13094 {
13095 /* Processor. */
13096 if (! cpu_arch[j].flags.bitfield.cpui386)
13097 continue;
13098
13099 cpu_arch_name = cpu_arch[j].name;
13100 cpu_sub_arch_name = NULL;
13101 cpu_arch_flags = cpu_arch[j].flags;
13102 cpu_arch_isa = cpu_arch[j].type;
13103 cpu_arch_isa_flags = cpu_arch[j].flags;
13104 if (!cpu_arch_tune_set)
13105 {
13106 cpu_arch_tune = cpu_arch_isa;
13107 cpu_arch_tune_flags = cpu_arch_isa_flags;
13108 }
13109 break;
13110 }
13111 else if (*cpu_arch [j].name == '.'
13112 && strcmp (arch, cpu_arch [j].name + 1) == 0)
13113 {
13114 /* ISA extension. */
13115 i386_cpu_flags flags;
13116
13117 flags = cpu_flags_or (cpu_arch_flags,
13118 cpu_arch[j].flags);
13119
13120 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
13121 {
13122 if (cpu_sub_arch_name)
13123 {
13124 char *name = cpu_sub_arch_name;
13125 cpu_sub_arch_name = concat (name,
13126 cpu_arch[j].name,
13127 (const char *) NULL);
13128 free (name);
13129 }
13130 else
13131 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
13132 cpu_arch_flags = flags;
13133 cpu_arch_isa_flags = flags;
13134 }
13135 else
13136 cpu_arch_isa_flags
13137 = cpu_flags_or (cpu_arch_isa_flags,
13138 cpu_arch[j].flags);
13139 break;
13140 }
13141 }
13142
13143 if (j >= ARRAY_SIZE (cpu_arch))
13144 {
13145 /* Disable an ISA extension. */
13146 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
13147 if (strcmp (arch, cpu_noarch [j].name) == 0)
13148 {
13149 i386_cpu_flags flags;
13150
13151 flags = cpu_flags_and_not (cpu_arch_flags,
13152 cpu_noarch[j].flags);
13153 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
13154 {
13155 if (cpu_sub_arch_name)
13156 {
13157 char *name = cpu_sub_arch_name;
13158 cpu_sub_arch_name = concat (name, arch,
13159 (const char *) NULL);
13160 free (name);
13161 }
13162 else
13163 cpu_sub_arch_name = xstrdup (arch);
13164 cpu_arch_flags = flags;
13165 cpu_arch_isa_flags = flags;
13166 }
13167 break;
13168 }
13169
13170 if (j >= ARRAY_SIZE (cpu_noarch))
13171 j = ARRAY_SIZE (cpu_arch);
13172 }
13173
13174 if (j >= ARRAY_SIZE (cpu_arch))
13175 as_fatal (_("invalid -march= option: `%s'"), arg);
13176
13177 arch = next;
13178 }
13179 while (next != NULL);
13180 free (saved);
13181 break;
13182
13183 case OPTION_MTUNE:
13184 if (*arg == '.')
13185 as_fatal (_("invalid -mtune= option: `%s'"), arg);
13186 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13187 {
13188 if (strcmp (arg, cpu_arch [j].name) == 0)
13189 {
13190 cpu_arch_tune_set = 1;
13191 cpu_arch_tune = cpu_arch [j].type;
13192 cpu_arch_tune_flags = cpu_arch[j].flags;
13193 break;
13194 }
13195 }
13196 if (j >= ARRAY_SIZE (cpu_arch))
13197 as_fatal (_("invalid -mtune= option: `%s'"), arg);
13198 break;
13199
13200 case OPTION_MMNEMONIC:
13201 if (strcasecmp (arg, "att") == 0)
13202 intel_mnemonic = 0;
13203 else if (strcasecmp (arg, "intel") == 0)
13204 intel_mnemonic = 1;
13205 else
13206 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
13207 break;
13208
13209 case OPTION_MSYNTAX:
13210 if (strcasecmp (arg, "att") == 0)
13211 intel_syntax = 0;
13212 else if (strcasecmp (arg, "intel") == 0)
13213 intel_syntax = 1;
13214 else
13215 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
13216 break;
13217
13218 case OPTION_MINDEX_REG:
13219 allow_index_reg = 1;
13220 break;
13221
13222 case OPTION_MNAKED_REG:
13223 allow_naked_reg = 1;
13224 break;
13225
13226 case OPTION_MSSE2AVX:
13227 sse2avx = 1;
13228 break;
13229
13230 case OPTION_MSSE_CHECK:
13231 if (strcasecmp (arg, "error") == 0)
13232 sse_check = check_error;
13233 else if (strcasecmp (arg, "warning") == 0)
13234 sse_check = check_warning;
13235 else if (strcasecmp (arg, "none") == 0)
13236 sse_check = check_none;
13237 else
13238 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
13239 break;
13240
13241 case OPTION_MOPERAND_CHECK:
13242 if (strcasecmp (arg, "error") == 0)
13243 operand_check = check_error;
13244 else if (strcasecmp (arg, "warning") == 0)
13245 operand_check = check_warning;
13246 else if (strcasecmp (arg, "none") == 0)
13247 operand_check = check_none;
13248 else
13249 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
13250 break;
13251
13252 case OPTION_MAVXSCALAR:
13253 if (strcasecmp (arg, "128") == 0)
13254 avxscalar = vex128;
13255 else if (strcasecmp (arg, "256") == 0)
13256 avxscalar = vex256;
13257 else
13258 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
13259 break;
13260
13261 case OPTION_MVEXWIG:
13262 if (strcmp (arg, "0") == 0)
13263 vexwig = vexw0;
13264 else if (strcmp (arg, "1") == 0)
13265 vexwig = vexw1;
13266 else
13267 as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
13268 break;
13269
13270 case OPTION_MADD_BND_PREFIX:
13271 add_bnd_prefix = 1;
13272 break;
13273
13274 case OPTION_MEVEXLIG:
13275 if (strcmp (arg, "128") == 0)
13276 evexlig = evexl128;
13277 else if (strcmp (arg, "256") == 0)
13278 evexlig = evexl256;
13279 else if (strcmp (arg, "512") == 0)
13280 evexlig = evexl512;
13281 else
13282 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
13283 break;
13284
13285 case OPTION_MEVEXRCIG:
13286 if (strcmp (arg, "rne") == 0)
13287 evexrcig = rne;
13288 else if (strcmp (arg, "rd") == 0)
13289 evexrcig = rd;
13290 else if (strcmp (arg, "ru") == 0)
13291 evexrcig = ru;
13292 else if (strcmp (arg, "rz") == 0)
13293 evexrcig = rz;
13294 else
13295 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
13296 break;
13297
13298 case OPTION_MEVEXWIG:
13299 if (strcmp (arg, "0") == 0)
13300 evexwig = evexw0;
13301 else if (strcmp (arg, "1") == 0)
13302 evexwig = evexw1;
13303 else
13304 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
13305 break;
13306
13307 # if defined (TE_PE) || defined (TE_PEP)
13308 case OPTION_MBIG_OBJ:
13309 use_big_obj = 1;
13310 break;
13311 #endif
13312
13313 case OPTION_MOMIT_LOCK_PREFIX:
13314 if (strcasecmp (arg, "yes") == 0)
13315 omit_lock_prefix = 1;
13316 else if (strcasecmp (arg, "no") == 0)
13317 omit_lock_prefix = 0;
13318 else
13319 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
13320 break;
13321
13322 case OPTION_MFENCE_AS_LOCK_ADD:
13323 if (strcasecmp (arg, "yes") == 0)
13324 avoid_fence = 1;
13325 else if (strcasecmp (arg, "no") == 0)
13326 avoid_fence = 0;
13327 else
13328 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
13329 break;
13330
13331 case OPTION_MLFENCE_AFTER_LOAD:
13332 if (strcasecmp (arg, "yes") == 0)
13333 lfence_after_load = 1;
13334 else if (strcasecmp (arg, "no") == 0)
13335 lfence_after_load = 0;
13336 else
13337 as_fatal (_("invalid -mlfence-after-load= option: `%s'"), arg);
13338 break;
13339
13340 case OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH:
13341 if (strcasecmp (arg, "all") == 0)
13342 {
13343 lfence_before_indirect_branch = lfence_branch_all;
13344 if (lfence_before_ret == lfence_before_ret_none)
13345 lfence_before_ret = lfence_before_ret_shl;
13346 }
13347 else if (strcasecmp (arg, "memory") == 0)
13348 lfence_before_indirect_branch = lfence_branch_memory;
13349 else if (strcasecmp (arg, "register") == 0)
13350 lfence_before_indirect_branch = lfence_branch_register;
13351 else if (strcasecmp (arg, "none") == 0)
13352 lfence_before_indirect_branch = lfence_branch_none;
13353 else
13354 as_fatal (_("invalid -mlfence-before-indirect-branch= option: `%s'"),
13355 arg);
13356 break;
13357
13358 case OPTION_MLFENCE_BEFORE_RET:
13359 if (strcasecmp (arg, "or") == 0)
13360 lfence_before_ret = lfence_before_ret_or;
13361 else if (strcasecmp (arg, "not") == 0)
13362 lfence_before_ret = lfence_before_ret_not;
13363 else if (strcasecmp (arg, "shl") == 0 || strcasecmp (arg, "yes") == 0)
13364 lfence_before_ret = lfence_before_ret_shl;
13365 else if (strcasecmp (arg, "none") == 0)
13366 lfence_before_ret = lfence_before_ret_none;
13367 else
13368 as_fatal (_("invalid -mlfence-before-ret= option: `%s'"),
13369 arg);
13370 break;
13371
13372 case OPTION_MRELAX_RELOCATIONS:
13373 if (strcasecmp (arg, "yes") == 0)
13374 generate_relax_relocations = 1;
13375 else if (strcasecmp (arg, "no") == 0)
13376 generate_relax_relocations = 0;
13377 else
13378 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
13379 break;
13380
13381 case OPTION_MALIGN_BRANCH_BOUNDARY:
13382 {
13383 char *end;
13384 long int align = strtoul (arg, &end, 0);
13385 if (*end == '\0')
13386 {
13387 if (align == 0)
13388 {
13389 align_branch_power = 0;
13390 break;
13391 }
13392 else if (align >= 16)
13393 {
13394 int align_power;
13395 for (align_power = 0;
13396 (align & 1) == 0;
13397 align >>= 1, align_power++)
13398 continue;
13399 /* Limit alignment power to 31. */
13400 if (align == 1 && align_power < 32)
13401 {
13402 align_branch_power = align_power;
13403 break;
13404 }
13405 }
13406 }
13407 as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
13408 }
13409 break;
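/* Worked example (editorial): -malign-branch-boundary=32 shifts 32
   right until the low bit is set (32 -> 16 -> 8 -> 4 -> 2 -> 1),
   ending with align == 1 and align_power == 5, so
   align_branch_power = 5.  A non-power-of-two such as 48 stops at
   align == 3 and is rejected with as_fatal.  */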
13410
13411 case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
13412 {
13413 char *end;
13414 int align = strtoul (arg, &end, 0);
13415 /* Some processors only support 5 prefixes. */
13416 if (*end == '\0' && align >= 0 && align < 6)
13417 {
13418 align_branch_prefix_size = align;
13419 break;
13420 }
13421 as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
13422 arg);
13423 }
13424 break;
13425
13426 case OPTION_MALIGN_BRANCH:
13427 align_branch = 0;
13428 saved = xstrdup (arg);
13429 type = saved;
13430 do
13431 {
13432 next = strchr (type, '+');
13433 if (next)
13434 *next++ = '\0';
13435 if (strcasecmp (type, "jcc") == 0)
13436 align_branch |= align_branch_jcc_bit;
13437 else if (strcasecmp (type, "fused") == 0)
13438 align_branch |= align_branch_fused_bit;
13439 else if (strcasecmp (type, "jmp") == 0)
13440 align_branch |= align_branch_jmp_bit;
13441 else if (strcasecmp (type, "call") == 0)
13442 align_branch |= align_branch_call_bit;
13443 else if (strcasecmp (type, "ret") == 0)
13444 align_branch |= align_branch_ret_bit;
13445 else if (strcasecmp (type, "indirect") == 0)
13446 align_branch |= align_branch_indirect_bit;
13447 else
13448 as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
13449 type = next;
13450 }
13451 while (next != NULL);
13452 free (saved);
13453 break;
13454
13455 case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
13456 align_branch_power = 5;
13457 align_branch_prefix_size = 5;
13458 align_branch = (align_branch_jcc_bit
13459 | align_branch_fused_bit
13460 | align_branch_jmp_bit);
13461 break;
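/* Illustration only: given the three assignments above (2**5 == 32),
   the single option

       -mbranches-within-32B-boundaries

   behaves like the combination
       -malign-branch-boundary=32 -malign-branch=jcc+fused+jmp
       -malign-branch-prefix-size=5.  */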
13462
13463 case OPTION_MAMD64:
13464 isa64 = amd64;
13465 break;
13466
13467 case OPTION_MINTEL64:
13468 isa64 = intel64;
13469 break;
13470
13471 case 'O':
13472 if (arg == NULL)
13473 {
13474 optimize = 1;
13475 /* Turn off -Os. */
13476 optimize_for_space = 0;
13477 }
13478 else if (*arg == 's')
13479 {
13480 optimize_for_space = 1;
13481 /* Turn on all encoding optimizations. */
13482 optimize = INT_MAX;
13483 }
13484 else
13485 {
13486 optimize = atoi (arg);
13487 /* Turn off -Os. */
13488 optimize_for_space = 0;
13489 }
13490 break;
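/* Examples (illustration only): a bare -O sets optimize = 1 with -Os
   turned off; -O2 sets optimize = atoi ("2") == 2; -Os enables every
   encoding optimization (optimize = INT_MAX) and additionally sets
   optimize_for_space so the smaller of equivalent encodings wins.  */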
13491
13492 default:
13493 return 0;
13494 }
13495 return 1;
13496 }
13497
13498 #define MESSAGE_TEMPLATE \
13499 " "
13500
13501 static char *
13502 output_message (FILE *stream, char *p, char *message, char *start,
13503 int *left_p, const char *name, int len)
13504 {
13505 int size = sizeof (MESSAGE_TEMPLATE);
13506 int left = *left_p;
13507
13508 /* Reserve 2 spaces for ", " or ",\0".  */
13509 left -= len + 2;
13510
13511 /* Check if there is any room. */
13512 if (left >= 0)
13513 {
13514 if (p != start)
13515 {
13516 *p++ = ',';
13517 *p++ = ' ';
13518 }
13519 p = mempcpy (p, name, len);
13520 }
13521 else
13522 {
13523 /* Output the current message now and start a new one. */
13524 *p++ = ',';
13525 *p = '\0';
13526 fprintf (stream, "%s\n", message);
13527 p = start;
13528 left = size - (start - message) - len - 2;
13529
13530 gas_assert (left >= 0);
13531
13532 p = mempcpy (p, name, len);
13533 }
13534
13535 *left_p = left;
13536 return p;
13537 }
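/* Sketch of the intended use (hypothetical values): with MESSAGE and
   START set up as in show_arch below, a sequence of calls such as

       p = output_message (stream, p, message, start, &left, "i386", 4);
       p = output_message (stream, p, message, start, &left, "i486", 4);

   appends ", i486" while the current line has room, and otherwise
   flushes the line to STREAM and restarts the message at START.  */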
13538
13539 static void
13540 show_arch (FILE *stream, int ext, int check)
13541 {
13542 static char message[] = MESSAGE_TEMPLATE;
13543 char *start = message + 27;
13544 char *p;
13545 int size = sizeof (MESSAGE_TEMPLATE);
13546 int left;
13547 const char *name;
13548 int len;
13549 unsigned int j;
13550
13551 p = start;
13552 left = size - (start - message);
13553 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13554 {
13555 /* Should it be skipped? */
13556 if (cpu_arch [j].skip)
13557 continue;
13558
13559 name = cpu_arch [j].name;
13560 len = cpu_arch [j].len;
13561 if (*name == '.')
13562 {
13563 /* It is an extension. Skip if we aren't asked to show it. */
13564 if (ext)
13565 {
13566 name++;
13567 len--;
13568 }
13569 else
13570 continue;
13571 }
13572 else if (ext)
13573 {
13574 /* It is a processor.  Skip it if only extensions are to be shown.  */
13575 continue;
13576 }
13577 else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
13578 {
13579 /* It is an impossible processor - skip. */
13580 continue;
13581 }
13582
13583 p = output_message (stream, p, message, start, &left, name, len);
13584 }
13585
13586 /* Display disabled extensions. */
13587 if (ext)
13588 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
13589 {
13590 name = cpu_noarch [j].name;
13591 len = cpu_noarch [j].len;
13592 p = output_message (stream, p, message, start, &left, name,
13593 len);
13594 }
13595
13596 *p = '\0';
13597 fprintf (stream, "%s\n", message);
13598 }
13599
13600 void
13601 md_show_usage (FILE *stream)
13602 {
13603 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13604 fprintf (stream, _("\
13605 -Qy, -Qn ignored\n\
13606 -V print assembler version number\n\
13607 -k ignored\n"));
13608 #endif
13609 fprintf (stream, _("\
13610 -n Do not optimize code alignment\n\
13611 -q quieten some warnings\n"));
13612 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13613 fprintf (stream, _("\
13614 -s ignored\n"));
13615 #endif
13616 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13617 || defined (TE_PE) || defined (TE_PEP))
13618 fprintf (stream, _("\
13619 --32/--64/--x32 generate 32bit/64bit/x32 code\n"));
13620 #endif
13621 #ifdef SVR4_COMMENT_CHARS
13622 fprintf (stream, _("\
13623 --divide do not treat `/' as a comment character\n"));
13624 #else
13625 fprintf (stream, _("\
13626 --divide ignored\n"));
13627 #endif
13628 fprintf (stream, _("\
13629 -march=CPU[,+EXTENSION...]\n\
13630 generate code for CPU and EXTENSION, CPU is one of:\n"));
13631 show_arch (stream, 0, 1);
13632 fprintf (stream, _("\
13633 EXTENSION is combination of:\n"));
13634 show_arch (stream, 1, 0);
13635 fprintf (stream, _("\
13636 -mtune=CPU optimize for CPU, CPU is one of:\n"));
13637 show_arch (stream, 0, 0);
13638 fprintf (stream, _("\
13639 -msse2avx encode SSE instructions with VEX prefix\n"));
13640 fprintf (stream, _("\
13641 -msse-check=[none|error|warning] (default: warning)\n\
13642 check SSE instructions\n"));
13643 fprintf (stream, _("\
13644 -moperand-check=[none|error|warning] (default: warning)\n\
13645 check operand combinations for validity\n"));
13646 fprintf (stream, _("\
13647 -mavxscalar=[128|256] (default: 128)\n\
13648 encode scalar AVX instructions with specific vector\n\
13649 length\n"));
13650 fprintf (stream, _("\
13651 -mvexwig=[0|1] (default: 0)\n\
13652 encode VEX instructions with specific VEX.W value\n\
13653 for VEX.W bit ignored instructions\n"));
13654 fprintf (stream, _("\
13655 -mevexlig=[128|256|512] (default: 128)\n\
13656 encode scalar EVEX instructions with specific vector\n\
13657 length\n"));
13658 fprintf (stream, _("\
13659 -mevexwig=[0|1] (default: 0)\n\
13660 encode EVEX instructions with specific EVEX.W value\n\
13661 for EVEX.W bit ignored instructions\n"));
13662 fprintf (stream, _("\
13663 -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
13664 encode EVEX instructions with specific EVEX.RC value\n\
13665 for SAE-only ignored instructions\n"));
13666 fprintf (stream, _("\
13667 -mmnemonic=[att|intel] "));
13668 if (SYSV386_COMPAT)
13669 fprintf (stream, _("(default: att)\n"));
13670 else
13671 fprintf (stream, _("(default: intel)\n"));
13672 fprintf (stream, _("\
13673 use AT&T/Intel mnemonic\n"));
13674 fprintf (stream, _("\
13675 -msyntax=[att|intel] (default: att)\n\
13676 use AT&T/Intel syntax\n"));
13677 fprintf (stream, _("\
13678 -mindex-reg support pseudo index registers\n"));
13679 fprintf (stream, _("\
13680 -mnaked-reg don't require `%%' prefix for registers\n"));
13681 fprintf (stream, _("\
13682 -madd-bnd-prefix add BND prefix for all valid branches\n"));
13683 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13684 fprintf (stream, _("\
13685 -mshared disable branch optimization for shared code\n"));
13686 fprintf (stream, _("\
13687 -mx86-used-note=[no|yes] "));
13688 if (DEFAULT_X86_USED_NOTE)
13689 fprintf (stream, _("(default: yes)\n"));
13690 else
13691 fprintf (stream, _("(default: no)\n"));
13692 fprintf (stream, _("\
13693 generate x86 used ISA and feature properties\n"));
13694 #endif
13695 #if defined (TE_PE) || defined (TE_PEP)
13696 fprintf (stream, _("\
13697 -mbig-obj generate big object files\n"));
13698 #endif
13699 fprintf (stream, _("\
13700 -momit-lock-prefix=[no|yes] (default: no)\n\
13701 strip all lock prefixes\n"));
13702 fprintf (stream, _("\
13703 -mfence-as-lock-add=[no|yes] (default: no)\n\
13704 encode lfence, mfence and sfence as\n\
13705 lock addl $0x0, (%%{re}sp)\n"));
13706 fprintf (stream, _("\
13707 -mrelax-relocations=[no|yes] "));
13708 if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
13709 fprintf (stream, _("(default: yes)\n"));
13710 else
13711 fprintf (stream, _("(default: no)\n"));
13712 fprintf (stream, _("\
13713 generate relax relocations\n"));
13714 fprintf (stream, _("\
13715 -malign-branch-boundary=NUM (default: 0)\n\
13716 align branches within NUM byte boundary\n"));
13717 fprintf (stream, _("\
13718 -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
13719 TYPE is combination of jcc, fused, jmp, call, ret,\n\
13720 indirect\n\
13721 specify types of branches to align\n"));
13722 fprintf (stream, _("\
13723 -malign-branch-prefix-size=NUM (default: 5)\n\
13724 align branches with NUM prefixes per instruction\n"));
13725 fprintf (stream, _("\
13726 -mbranches-within-32B-boundaries\n\
13727 align branches within 32 byte boundary\n"));
13728 fprintf (stream, _("\
13729 -mlfence-after-load=[no|yes] (default: no)\n\
13730 generate lfence after load\n"));
13731 fprintf (stream, _("\
13732 -mlfence-before-indirect-branch=[none|all|register|memory] (default: none)\n\
13733 generate lfence before indirect near branch\n"));
13734 fprintf (stream, _("\
13735 -mlfence-before-ret=[none|or|not|shl|yes] (default: none)\n\
13736 generate lfence before ret\n"));
13737 fprintf (stream, _("\
13738 -mamd64 accept only AMD64 ISA [default]\n"));
13739 fprintf (stream, _("\
13740 -mintel64 accept only Intel64 ISA\n"));
13741 }
13742
13743 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
13744 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13745 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
13746
13747 /* Pick the target format to use. */
13748
13749 const char *
13750 i386_target_format (void)
13751 {
13752 if (!strncmp (default_arch, "x86_64", 6))
13753 {
13754 update_code_flag (CODE_64BIT, 1);
13755 if (default_arch[6] == '\0')
13756 x86_elf_abi = X86_64_ABI;
13757 else
13758 x86_elf_abi = X86_64_X32_ABI;
13759 }
13760 else if (!strcmp (default_arch, "i386"))
13761 update_code_flag (CODE_32BIT, 1);
13762 else if (!strcmp (default_arch, "iamcu"))
13763 {
13764 update_code_flag (CODE_32BIT, 1);
13765 if (cpu_arch_isa == PROCESSOR_UNKNOWN)
13766 {
13767 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
13768 cpu_arch_name = "iamcu";
13769 cpu_sub_arch_name = NULL;
13770 cpu_arch_flags = iamcu_flags;
13771 cpu_arch_isa = PROCESSOR_IAMCU;
13772 cpu_arch_isa_flags = iamcu_flags;
13773 if (!cpu_arch_tune_set)
13774 {
13775 cpu_arch_tune = cpu_arch_isa;
13776 cpu_arch_tune_flags = cpu_arch_isa_flags;
13777 }
13778 }
13779 else if (cpu_arch_isa != PROCESSOR_IAMCU)
13780 as_fatal (_("Intel MCU doesn't support `%s' architecture"),
13781 cpu_arch_name);
13782 }
13783 else
13784 as_fatal (_("unknown architecture"));
13785
13786 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
13787 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13788 if (cpu_flags_all_zero (&cpu_arch_tune_flags))
13789 cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13790
13791 switch (OUTPUT_FLAVOR)
13792 {
13793 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
13794 case bfd_target_aout_flavour:
13795 return AOUT_TARGET_FORMAT;
13796 #endif
13797 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
13798 # if defined (TE_PE) || defined (TE_PEP)
13799 case bfd_target_coff_flavour:
13800 if (flag_code == CODE_64BIT)
13801 return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
13802 else
13803 return use_big_obj ? "pe-bigobj-i386" : "pe-i386";
13804 # elif defined (TE_GO32)
13805 case bfd_target_coff_flavour:
13806 return "coff-go32";
13807 # else
13808 case bfd_target_coff_flavour:
13809 return "coff-i386";
13810 # endif
13811 #endif
13812 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
13813 case bfd_target_elf_flavour:
13814 {
13815 const char *format;
13816
13817 switch (x86_elf_abi)
13818 {
13819 default:
13820 format = ELF_TARGET_FORMAT;
13821 #ifndef TE_SOLARIS
13822 tls_get_addr = "___tls_get_addr";
13823 #endif
13824 break;
13825 case X86_64_ABI:
13826 use_rela_relocations = 1;
13827 object_64bit = 1;
13828 #ifndef TE_SOLARIS
13829 tls_get_addr = "__tls_get_addr";
13830 #endif
13831 format = ELF_TARGET_FORMAT64;
13832 break;
13833 case X86_64_X32_ABI:
13834 use_rela_relocations = 1;
13835 object_64bit = 1;
13836 #ifndef TE_SOLARIS
13837 tls_get_addr = "__tls_get_addr";
13838 #endif
13839 disallow_64bit_reloc = 1;
13840 format = ELF_TARGET_FORMAT32;
13841 break;
13842 }
13843 if (cpu_arch_isa == PROCESSOR_L1OM)
13844 {
13845 if (x86_elf_abi != X86_64_ABI)
13846 as_fatal (_("Intel L1OM is 64bit only"));
13847 return ELF_TARGET_L1OM_FORMAT;
13848 }
13849 else if (cpu_arch_isa == PROCESSOR_K1OM)
13850 {
13851 if (x86_elf_abi != X86_64_ABI)
13852 as_fatal (_("Intel K1OM is 64bit only"));
13853 return ELF_TARGET_K1OM_FORMAT;
13854 }
13855 else if (cpu_arch_isa == PROCESSOR_IAMCU)
13856 {
13857 if (x86_elf_abi != I386_ABI)
13858 as_fatal (_("Intel MCU is 32bit only"));
13859 return ELF_TARGET_IAMCU_FORMAT;
13860 }
13861 else
13862 return format;
13863 }
13864 #endif
13865 #if defined (OBJ_MACH_O)
13866 case bfd_target_mach_o_flavour:
13867 if (flag_code == CODE_64BIT)
13868 {
13869 use_rela_relocations = 1;
13870 object_64bit = 1;
13871 return "mach-o-x86-64";
13872 }
13873 else
13874 return "mach-o-i386";
13875 #endif
13876 default:
13877 abort ();
13878 return NULL;
13879 }
13880 }
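/* Illustration: the strings returned depend on how the assembler was
   configured; on a typical GNU/Linux configuration the ELF branch above
   resolves to "elf32-i386" for --32, "elf64-x86-64" for --64 and
   "elf32-x86-64" for --x32.  */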
13881
13882 #endif /* OBJ_MAYBE_ more than one */
13883 \f
13884 symbolS *
13885 md_undefined_symbol (char *name)
13886 {
13887 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
13888 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
13889 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
13890 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
13891 {
13892 if (!GOT_symbol)
13893 {
13894 if (symbol_find (name))
13895 as_bad (_("GOT already in symbol table"));
13896 GOT_symbol = symbol_new (name, undefined_section,
13897 &zero_address_frag, 0);
13898 }
13899 return GOT_symbol;
13900 }
13901 return 0;
13902 }
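/* Example: the first reference to _GLOBAL_OFFSET_TABLE_, e.g. in a
   32-bit PIC prologue such as

       addl $_GLOBAL_OFFSET_TABLE_, %ebx

   lands here and creates GOT_symbol on demand; every later reference
   yields that same symbol.  */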
13903
13904 /* Round up a section size to the appropriate boundary. */
13905
13906 valueT
13907 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
13908 {
13909 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
13910 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
13911 {
13912 /* For a.out, force the section size to be aligned. If we don't do
13913 this, BFD will align it for us, but it will not write out the
13914 final bytes of the section. This may be a bug in BFD, but it is
13915 easier to fix it here since that is how the other a.out targets
13916 work. */
13917 int align;
13918
13919 align = bfd_section_alignment (segment);
13920 size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
13921 }
13922 #endif
13923
13924 return size;
13925 }
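/* Worked example for the a.out rounding above: with a section alignment
   of 2 (i.e. 4 bytes), a size of 10 becomes (10 + 4 - 1) & -4 == 12,
   while an already aligned size is returned unchanged.  */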
13926
13927 /* On the i386, PC-relative offsets are relative to the start of the
13928 next instruction. That is, the address of the offset, plus its
13929 size, since the offset is always the last part of the insn. */
13930
13931 long
13932 md_pcrel_from (fixS *fixP)
13933 {
13934 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
13935 }
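/* Example: assuming a frag at address 0x100 holding "call foo" (opcode
   0xe8 followed by a 4-byte displacement), the fixup has fx_where == 1
   and fx_size == 4, so this returns 0x105 -- the address of the next
   instruction, to which the CPU adds the displacement.  */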
13936
13937 #ifndef I386COFF
13938
13939 static void
13940 s_bss (int ignore ATTRIBUTE_UNUSED)
13941 {
13942 int temp;
13943
13944 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13945 if (IS_ELF)
13946 obj_elf_section_change_hook ();
13947 #endif
13948 temp = get_absolute_expression ();
13949 subseg_set (bss_section, (subsegT) temp);
13950 demand_empty_rest_of_line ();
13951 }
13952
13953 #endif
13954
13955 /* Remember constant directive. */
13956
13957 void
13958 i386_cons_align (int ignore ATTRIBUTE_UNUSED)
13959 {
13960 if (last_insn.kind != last_insn_directive
13961 && (bfd_section_flags (now_seg) & SEC_CODE))
13962 {
13963 last_insn.seg = now_seg;
13964 last_insn.kind = last_insn_directive;
13965 last_insn.name = "constant directive";
13966 last_insn.file = as_where (&last_insn.line);
13967 if (lfence_before_ret != lfence_before_ret_none)
13968 {
13969 if (lfence_before_indirect_branch != lfence_branch_none)
13970 as_warn (_("constant directive skips -mlfence-before-ret "
13971 "and -mlfence-before-indirect-branch"));
13972 else
13973 as_warn (_("constant directive skips -mlfence-before-ret"));
13974 }
13975 else if (lfence_before_indirect_branch != lfence_branch_none)
13976 as_warn (_("constant directive skips -mlfence-before-indirect-branch"));
13977 }
13978 }
13979
13980 void
13981 i386_validate_fix (fixS *fixp)
13982 {
13983 if (fixp->fx_subsy)
13984 {
13985 if (fixp->fx_subsy == GOT_symbol)
13986 {
13987 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
13988 {
13989 if (!object_64bit)
13990 abort ();
13991 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13992 if (fixp->fx_tcbit2)
13993 fixp->fx_r_type = (fixp->fx_tcbit
13994 ? BFD_RELOC_X86_64_REX_GOTPCRELX
13995 : BFD_RELOC_X86_64_GOTPCRELX);
13996 else
13997 #endif
13998 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
13999 }
14000 else
14001 {
14002 if (!object_64bit)
14003 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
14004 else
14005 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
14006 }
14007 fixp->fx_subsy = 0;
14008 }
14009 }
14010 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14011 else
14012 {
14013 /* NB: Commit 292676c1 resolved PLT32 relocations against local
14014 symbols to sections.  Since a PLT32 relocation must be against a
14015 symbol, turn such a PLT32 relocation into a PC32 relocation.  */
14016 if (fixp->fx_addsy
14017 && (fixp->fx_r_type == BFD_RELOC_386_PLT32
14018 || fixp->fx_r_type == BFD_RELOC_X86_64_PLT32)
14019 && symbol_section_p (fixp->fx_addsy))
14020 fixp->fx_r_type = BFD_RELOC_32_PCREL;
14021 if (!object_64bit)
14022 {
14023 if (fixp->fx_r_type == BFD_RELOC_386_GOT32
14024 && fixp->fx_tcbit2)
14025 fixp->fx_r_type = BFD_RELOC_386_GOT32X;
14026 }
14027 }
14028 #endif
14029 }
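/* Example for the PLT32 rewrite above: a "call foo@PLT" whose target
   got resolved to a local section symbol means the same thing as a
   direct pc-relative call, so its relocation is demoted to
   BFD_RELOC_32_PCREL instead of leaving a PLT32 against a section.  */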
14030
14031 arelent *
14032 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
14033 {
14034 arelent *rel;
14035 bfd_reloc_code_real_type code;
14036
14037 switch (fixp->fx_r_type)
14038 {
14039 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14040 case BFD_RELOC_SIZE32:
14041 case BFD_RELOC_SIZE64:
14042 if (S_IS_DEFINED (fixp->fx_addsy)
14043 && !S_IS_EXTERNAL (fixp->fx_addsy))
14044 {
14045 /* Resolve a size relocation against a local symbol to the
14046 symbol's size plus the addend.  */
14047 valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
14048 if (fixp->fx_r_type == BFD_RELOC_SIZE32
14049 && !fits_in_unsigned_long (value))
14050 as_bad_where (fixp->fx_file, fixp->fx_line,
14051 _("symbol size computation overflow"));
14052 fixp->fx_addsy = NULL;
14053 fixp->fx_subsy = NULL;
14054 md_apply_fix (fixp, (valueT *) &value, NULL);
14055 return NULL;
14056 }
14057 #endif
14058 /* Fall through. */
14059
14060 case BFD_RELOC_X86_64_PLT32:
14061 case BFD_RELOC_X86_64_GOT32:
14062 case BFD_RELOC_X86_64_GOTPCREL:
14063 case BFD_RELOC_X86_64_GOTPCRELX:
14064 case BFD_RELOC_X86_64_REX_GOTPCRELX:
14065 case BFD_RELOC_386_PLT32:
14066 case BFD_RELOC_386_GOT32:
14067 case BFD_RELOC_386_GOT32X:
14068 case BFD_RELOC_386_GOTOFF:
14069 case BFD_RELOC_386_GOTPC:
14070 case BFD_RELOC_386_TLS_GD:
14071 case BFD_RELOC_386_TLS_LDM:
14072 case BFD_RELOC_386_TLS_LDO_32:
14073 case BFD_RELOC_386_TLS_IE_32:
14074 case BFD_RELOC_386_TLS_IE:
14075 case BFD_RELOC_386_TLS_GOTIE:
14076 case BFD_RELOC_386_TLS_LE_32:
14077 case BFD_RELOC_386_TLS_LE:
14078 case BFD_RELOC_386_TLS_GOTDESC:
14079 case BFD_RELOC_386_TLS_DESC_CALL:
14080 case BFD_RELOC_X86_64_TLSGD:
14081 case BFD_RELOC_X86_64_TLSLD:
14082 case BFD_RELOC_X86_64_DTPOFF32:
14083 case BFD_RELOC_X86_64_DTPOFF64:
14084 case BFD_RELOC_X86_64_GOTTPOFF:
14085 case BFD_RELOC_X86_64_TPOFF32:
14086 case BFD_RELOC_X86_64_TPOFF64:
14087 case BFD_RELOC_X86_64_GOTOFF64:
14088 case BFD_RELOC_X86_64_GOTPC32:
14089 case BFD_RELOC_X86_64_GOT64:
14090 case BFD_RELOC_X86_64_GOTPCREL64:
14091 case BFD_RELOC_X86_64_GOTPC64:
14092 case BFD_RELOC_X86_64_GOTPLT64:
14093 case BFD_RELOC_X86_64_PLTOFF64:
14094 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
14095 case BFD_RELOC_X86_64_TLSDESC_CALL:
14096 case BFD_RELOC_RVA:
14097 case BFD_RELOC_VTABLE_ENTRY:
14098 case BFD_RELOC_VTABLE_INHERIT:
14099 #ifdef TE_PE
14100 case BFD_RELOC_32_SECREL:
14101 #endif
14102 code = fixp->fx_r_type;
14103 break;
14104 case BFD_RELOC_X86_64_32S:
14105 if (!fixp->fx_pcrel)
14106 {
14107 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
14108 code = fixp->fx_r_type;
14109 break;
14110 }
14111 /* Fall through. */
14112 default:
14113 if (fixp->fx_pcrel)
14114 {
14115 switch (fixp->fx_size)
14116 {
14117 default:
14118 as_bad_where (fixp->fx_file, fixp->fx_line,
14119 _("can not do %d byte pc-relative relocation"),
14120 fixp->fx_size);
14121 code = BFD_RELOC_32_PCREL;
14122 break;
14123 case 1: code = BFD_RELOC_8_PCREL; break;
14124 case 2: code = BFD_RELOC_16_PCREL; break;
14125 case 4: code = BFD_RELOC_32_PCREL; break;
14126 #ifdef BFD64
14127 case 8: code = BFD_RELOC_64_PCREL; break;
14128 #endif
14129 }
14130 }
14131 else
14132 {
14133 switch (fixp->fx_size)
14134 {
14135 default:
14136 as_bad_where (fixp->fx_file, fixp->fx_line,
14137 _("can not do %d byte relocation"),
14138 fixp->fx_size);
14139 code = BFD_RELOC_32;
14140 break;
14141 case 1: code = BFD_RELOC_8; break;
14142 case 2: code = BFD_RELOC_16; break;
14143 case 4: code = BFD_RELOC_32; break;
14144 #ifdef BFD64
14145 case 8: code = BFD_RELOC_64; break;
14146 #endif
14147 }
14148 }
14149 break;
14150 }
14151
14152 if ((code == BFD_RELOC_32
14153 || code == BFD_RELOC_32_PCREL
14154 || code == BFD_RELOC_X86_64_32S)
14155 && GOT_symbol
14156 && fixp->fx_addsy == GOT_symbol)
14157 {
14158 if (!object_64bit)
14159 code = BFD_RELOC_386_GOTPC;
14160 else
14161 code = BFD_RELOC_X86_64_GOTPC32;
14162 }
14163 if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
14164 && GOT_symbol
14165 && fixp->fx_addsy == GOT_symbol)
14166 {
14167 code = BFD_RELOC_X86_64_GOTPC64;
14168 }
14169
14170 rel = XNEW (arelent);
14171 rel->sym_ptr_ptr = XNEW (asymbol *);
14172 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
14173
14174 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
14175
14176 if (!use_rela_relocations)
14177 {
14178 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
14179 vtable entry to be used in the relocation's section offset. */
14180 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
14181 rel->address = fixp->fx_offset;
14182 #if defined (OBJ_COFF) && defined (TE_PE)
14183 else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
14184 rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
14185 else
14186 #endif
14187 rel->addend = 0;
14188 }
14189 /* Use RELA relocations in 64-bit mode.  */
14190 else
14191 {
14192 if (disallow_64bit_reloc)
14193 switch (code)
14194 {
14195 case BFD_RELOC_X86_64_DTPOFF64:
14196 case BFD_RELOC_X86_64_TPOFF64:
14197 case BFD_RELOC_64_PCREL:
14198 case BFD_RELOC_X86_64_GOTOFF64:
14199 case BFD_RELOC_X86_64_GOT64:
14200 case BFD_RELOC_X86_64_GOTPCREL64:
14201 case BFD_RELOC_X86_64_GOTPC64:
14202 case BFD_RELOC_X86_64_GOTPLT64:
14203 case BFD_RELOC_X86_64_PLTOFF64:
14204 as_bad_where (fixp->fx_file, fixp->fx_line,
14205 _("cannot represent relocation type %s in x32 mode"),
14206 bfd_get_reloc_code_name (code));
14207 break;
14208 default:
14209 break;
14210 }
14211
14212 if (!fixp->fx_pcrel)
14213 rel->addend = fixp->fx_offset;
14214 else
14215 switch (code)
14216 {
14217 case BFD_RELOC_X86_64_PLT32:
14218 case BFD_RELOC_X86_64_GOT32:
14219 case BFD_RELOC_X86_64_GOTPCREL:
14220 case BFD_RELOC_X86_64_GOTPCRELX:
14221 case BFD_RELOC_X86_64_REX_GOTPCRELX:
14222 case BFD_RELOC_X86_64_TLSGD:
14223 case BFD_RELOC_X86_64_TLSLD:
14224 case BFD_RELOC_X86_64_GOTTPOFF:
14225 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
14226 case BFD_RELOC_X86_64_TLSDESC_CALL:
14227 rel->addend = fixp->fx_offset - fixp->fx_size;
14228 break;
14229 default:
14230 rel->addend = (section->vma
14231 - fixp->fx_size
14232 + fixp->fx_addnumber
14233 + md_pcrel_from (fixp));
14234 break;
14235 }
14236 }
14237
14238 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
14239 if (rel->howto == NULL)
14240 {
14241 as_bad_where (fixp->fx_file, fixp->fx_line,
14242 _("cannot represent relocation type %s"),
14243 bfd_get_reloc_code_name (code));
14244 /* Set howto to a garbage value so that we can keep going. */
14245 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
14246 gas_assert (rel->howto != NULL);
14247 }
14248
14249 return rel;
14250 }
14251
14252 #include "tc-i386-intel.c"
14253
14254 void
14255 tc_x86_parse_to_dw2regnum (expressionS *exp)
14256 {
14257 int saved_naked_reg;
14258 char saved_register_dot;
14259
14260 saved_naked_reg = allow_naked_reg;
14261 allow_naked_reg = 1;
14262 saved_register_dot = register_chars['.'];
14263 register_chars['.'] = '.';
14264 allow_pseudo_reg = 1;
14265 expression_and_evaluate (exp);
14266 allow_pseudo_reg = 0;
14267 register_chars['.'] = saved_register_dot;
14268 allow_naked_reg = saved_naked_reg;
14269
14270 if (exp->X_op == O_register && exp->X_add_number >= 0)
14271 {
14272 if ((addressT) exp->X_add_number < i386_regtab_size)
14273 {
14274 exp->X_op = O_constant;
14275 exp->X_add_number = i386_regtab[exp->X_add_number]
14276 .dw2_regnum[flag_code >> 1];
14277 }
14278 else
14279 exp->X_op = O_illegal;
14280 }
14281 }
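/* Examples (standard psABI DWARF numbering): "esp" resolves to register
   number 4 when assembling 32-bit code and "rsp" to 7 in 64-bit code; a
   register index at or beyond i386_regtab_size is marked O_illegal.  */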
14282
14283 void
14284 tc_x86_frame_initial_instructions (void)
14285 {
14286 static unsigned int sp_regno[2];
14287
14288 if (!sp_regno[flag_code >> 1])
14289 {
14290 char *saved_input = input_line_pointer;
14291 char sp[][4] = {"esp", "rsp"};
14292 expressionS exp;
14293
14294 input_line_pointer = sp[flag_code >> 1];
14295 tc_x86_parse_to_dw2regnum (&exp);
14296 gas_assert (exp.X_op == O_constant);
14297 sp_regno[flag_code >> 1] = exp.X_add_number;
14298 input_line_pointer = saved_input;
14299 }
14300
14301 cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
14302 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
14303 }
14304
14305 int
14306 x86_dwarf2_addr_size (void)
14307 {
14308 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
14309 if (x86_elf_abi == X86_64_X32_ABI)
14310 return 4;
14311 #endif
14312 return bfd_arch_bits_per_address (stdoutput) / 8;
14313 }
14314
14315 int
14316 i386_elf_section_type (const char *str, size_t len)
14317 {
14318 if (flag_code == CODE_64BIT
14319 && len == sizeof ("unwind") - 1
14320 && strncmp (str, "unwind", 6) == 0)
14321 return SHT_X86_64_UNWIND;
14322
14323 return -1;
14324 }
14325
14326 #ifdef TE_SOLARIS
14327 void
14328 i386_solaris_fix_up_eh_frame (segT sec)
14329 {
14330 if (flag_code == CODE_64BIT)
14331 elf_section_type (sec) = SHT_X86_64_UNWIND;
14332 }
14333 #endif
14334
14335 #ifdef TE_PE
14336 void
14337 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
14338 {
14339 expressionS exp;
14340
14341 exp.X_op = O_secrel;
14342 exp.X_add_symbol = symbol;
14343 exp.X_add_number = 0;
14344 emit_expr (&exp, size);
14345 }
14346 #endif
14347
14348 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14349 /* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
14350
14351 bfd_vma
14352 x86_64_section_letter (int letter, const char **ptr_msg)
14353 {
14354 if (flag_code == CODE_64BIT)
14355 {
14356 if (letter == 'l')
14357 return SHF_X86_64_LARGE;
14358
14359 *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
14360 }
14361 else
14362 *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
14363 return -1;
14364 }
14365
14366 bfd_vma
14367 x86_64_section_word (char *str, size_t len)
14368 {
14369 if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
14370 return SHF_X86_64_LARGE;
14371
14372 return -1;
14373 }
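/* Example: in 64-bit mode a directive such as

       .section .ldata,"awl",@progbits

   uses the 'l' flag letter accepted above to set SHF_X86_64_LARGE; in
   32-bit code the same letter draws the "bad .section directive"
   diagnostic.  */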
14374
14375 static void
14376 handle_large_common (int small ATTRIBUTE_UNUSED)
14377 {
14378 if (flag_code != CODE_64BIT)
14379 {
14380 s_comm_internal (0, elf_common_parse);
14381 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
14382 }
14383 else
14384 {
14385 static segT lbss_section;
14386 asection *saved_com_section_ptr = elf_com_section_ptr;
14387 asection *saved_bss_section = bss_section;
14388
14389 if (lbss_section == NULL)
14390 {
14391 flagword applicable;
14392 segT seg = now_seg;
14393 subsegT subseg = now_subseg;
14394
14395 /* The .lbss section is for local .largecomm symbols. */
14396 lbss_section = subseg_new (".lbss", 0);
14397 applicable = bfd_applicable_section_flags (stdoutput);
14398 bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
14399 seg_info (lbss_section)->bss = 1;
14400
14401 subseg_set (seg, subseg);
14402 }
14403
14404 elf_com_section_ptr = &_bfd_elf_large_com_section;
14405 bss_section = lbss_section;
14406
14407 s_comm_internal (0, elf_common_parse);
14408
14409 elf_com_section_ptr = saved_com_section_ptr;
14410 bss_section = saved_bss_section;
14411 }
14412 }
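/* Example: in 64-bit mode

       .largecomm sym, 16, 8

   allocates a 16-byte common symbol with 8-byte alignment against the
   large common section (or locally in the .lbss section set up above);
   in 32-bit mode the directive is handled as a plain .comm plus a
   warning.  */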
14413 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */