gas/config/tc-i386.c

   1 /* tc-i386.c -- Assemble code for the Intel 80386
   2    Copyright (C) 1989-2021 Free Software Foundation, Inc.
   3
   4    This file is part of GAS, the GNU Assembler.
   5
   6    GAS is free software; you can redistribute it and/or modify
   7    it under the terms of the GNU General Public License as published by
   8    the Free Software Foundation; either version 3, or (at your option)
   9    any later version.
  10
  11    GAS is distributed in the hope that it will be useful,
  12    but WITHOUT ANY WARRANTY; without even the implied warranty of
  13    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  14    GNU General Public License for more details.
  15
  16    You should have received a copy of the GNU General Public License
  17    along with GAS; see the file COPYING.  If not, write to the Free
  18    Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
  19    02110-1301, USA.  */
  20
  21 /* Intel 80386 machine specific gas.
  22    Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
  23    x86_64 support by Jan Hubicka (jh@suse.cz)
  24    VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
  25    Bugs & suggestions are completely welcome.  This is free software.
  26    Please help us make it better.  */
  27
  28 #include "as.h"
  29 #include "safe-ctype.h"
  30 #include "subsegs.h"
  31 #include "dwarf2dbg.h"
  32 #include "dw2gencfi.h"
  33 #include "elf/x86-64.h"
  34 #include "opcodes/i386-init.h"
  35
  36 #ifdef HAVE_LIMITS_H
  37 #include <limits.h>
  38 #else
  39 #ifdef HAVE_SYS_PARAM_H
  40 #include <sys/param.h>
  41 #endif
  42 #ifndef INT_MAX
  43 #define INT_MAX (int) (((unsigned) (-1)) >> 1)
  44 #endif
  45 #endif
  46
  47 #ifndef INFER_ADDR_PREFIX
  48 #define INFER_ADDR_PREFIX 1
  49 #endif
  50
  51 #ifndef DEFAULT_ARCH
  52 #define DEFAULT_ARCH "i386"
  53 #endif
  54
  55 #ifndef INLINE
  56 #if __GNUC__ >= 2
  57 #define INLINE __inline__
  58 #else
  59 #define INLINE
  60 #endif
  61 #endif
  62
  63 /* Prefixes will be emitted in the order defined below.
  64    WAIT_PREFIX must be the first prefix since FWAIT is really is an
  65    instruction, and so must come before any prefixes.
  66    The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
  67    REP_PREFIX/HLE_PREFIX, LOCK_PREFIX.  */
  68 #define WAIT_PREFIX     0
  69 #define SEG_PREFIX      1
  70 #define ADDR_PREFIX     2
  71 #define DATA_PREFIX     3
  72 #define REP_PREFIX      4
  73 #define HLE_PREFIX      REP_PREFIX
  74 #define BND_PREFIX      REP_PREFIX
  75 #define LOCK_PREFIX     5
  76 #define REX_PREFIX      6       /* must come last.  */
  77 #define MAX_PREFIXES    7       /* max prefixes per opcode */
  78
  79 /* we define the syntax here (modulo base,index,scale syntax) */
  80 #define REGISTER_PREFIX '%'
  81 #define IMMEDIATE_PREFIX '$'
  82 #define ABSOLUTE_PREFIX '*'
  83
  84 /* these are the instruction mnemonic suffixes in AT&T syntax or
  85    memory operand size in Intel syntax.  */
  86 #define WORD_MNEM_SUFFIX  'w'
  87 #define BYTE_MNEM_SUFFIX  'b'
  88 #define SHORT_MNEM_SUFFIX 's'
  89 #define LONG_MNEM_SUFFIX  'l'
  90 #define QWORD_MNEM_SUFFIX  'q'
  91 /* Intel Syntax.  Use a non-ascii letter since since it never appears
  92    in instructions.  */
  93 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
  94
  95 #define END_OF_INSN '\0'
  96
  97 /* This matches the C -> StaticRounding alias in the opcode table.  */
  98 #define commutative staticrounding
  99
 100 /*
 101   'templates' is for grouping together 'template' structures for opcodes
 102   of the same name.  This is only used for storing the insns in the grand
 103   ole hash table of insns.
 104   The templates themselves start at START and range up to (but not including)
 105   END.
 106   */
 107 typedef struct
 108 {
 109   const insn_template *start;
 110   const insn_template *end;
 111 }
 112 templates;
 113
 114 /* 386 operand encoding bytes:  see 386 book for details of this.  */
 115 typedef struct
 116 {
 117   unsigned int regmem;  /* codes register or memory operand */
 118   unsigned int reg;     /* codes register operand (or extended opcode) */
 119   unsigned int mode;    /* how to interpret regmem & reg */
 120 }
 121 modrm_byte;
 122
 123 /* x86-64 extension prefix.  */
 124 typedef int rex_byte;
 125
 126 /* 386 opcode byte to code indirect addressing.  */
 127 typedef struct
 128 {
 129   unsigned base;
 130   unsigned index;
 131   unsigned scale;
 132 }
 133 sib_byte;
 134
 135 /* x86 arch names, types and features */
 136 typedef struct
 137 {
 138   const char *name;             /* arch name */
 139   unsigned int len;             /* arch string length */
 140   enum processor_type type;     /* arch type */
 141   i386_cpu_flags flags;         /* cpu feature flags */
 142   unsigned int skip;            /* show_arch should skip this. */
 143 }
 144 arch_entry;
 145
 146 /* Used to turn off indicated flags.  */
 147 typedef struct
 148 {
 149   const char *name;             /* arch name */
 150   unsigned int len;             /* arch string length */
 151   i386_cpu_flags flags;         /* cpu feature flags */
 152 }
 153 noarch_entry;
 154
 155 static void update_code_flag (int, int);
 156 static void set_code_flag (int);
 157 static void set_16bit_gcc_code_flag (int);
 158 static void set_intel_syntax (int);
 159 static void set_intel_mnemonic (int);
 160 static void set_allow_index_reg (int);
 161 static void set_check (int);
 162 static void set_cpu_arch (int);
 163 #ifdef TE_PE
 164 static void pe_directive_secrel (int);
 165 #endif
 166 static void signed_cons (int);
 167 static char *output_invalid (int c);
 168 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
 169                                     const char *);
 170 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
 171                                        const char *);
 172 static int i386_att_operand (char *);
 173 static int i386_intel_operand (char *, int);
 174 static int i386_intel_simplify (expressionS *);
 175 static int i386_intel_parse_name (const char *, expressionS *);
 176 static const reg_entry *parse_register (char *, char **);
 177 static char *parse_insn (char *, char *);
 178 static char *parse_operands (char *, const char *);
 179 static void swap_operands (void);
 180 static void swap_2_operands (int, int);
 181 static enum flag_code i386_addressing_mode (void);
 182 static void optimize_imm (void);
 183 static void optimize_disp (void);
 184 static const insn_template *match_template (char);
 185 static int check_string (void);
 186 static int process_suffix (void);
 187 static int check_byte_reg (void);
 188 static int check_long_reg (void);
 189 static int check_qword_reg (void);
 190 static int check_word_reg (void);
 191 static int finalize_imm (void);
 192 static int process_operands (void);
 193 static const seg_entry *build_modrm_byte (void);
 194 static void output_insn (void);
 195 static void output_imm (fragS *, offsetT);
 196 static void output_disp (fragS *, offsetT);
 197 #ifndef I386COFF
 198 static void s_bss (int);
 199 #endif
 200 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
 201 static void handle_large_common (int small ATTRIBUTE_UNUSED);
 202
 203 /* GNU_PROPERTY_X86_ISA_1_USED.  */
 204 static unsigned int x86_isa_1_used;
 205 /* GNU_PROPERTY_X86_FEATURE_2_USED.  */
 206 static unsigned int x86_feature_2_used;
 207 /* Generate x86 used ISA and feature properties.  */
 208 static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
 209 #endif
 210
 211 static const char *default_arch = DEFAULT_ARCH;
 212
 213 /* parse_register() returns this when a register alias cannot be used.  */
 214 static const reg_entry bad_reg = { "<bad>", OPERAND_TYPE_NONE, 0, 0,
 215                                    { Dw2Inval, Dw2Inval } };
 216
 217 /* This struct describes rounding control and SAE in the instruction.  */
 218 struct RC_Operation
 219 {
 220   enum rc_type
 221     {
 222       rne = 0,
 223       rd,
 224       ru,
 225       rz,
 226       saeonly
 227     } type;
 228   int operand;
 229 };
 230
 231 static struct RC_Operation rc_op;
 232
 233 /* The struct describes masking, applied to OPERAND in the instruction.
 234    MASK is a pointer to the corresponding mask register.  ZEROING tells
 235    whether merging or zeroing mask is used.  */
 236 struct Mask_Operation
 237 {
 238   const reg_entry *mask;
 239   unsigned int zeroing;
 240   /* The operand where this operation is associated.  */
 241   int operand;
 242 };
 243
 244 static struct Mask_Operation mask_op;
 245
 246 /* The struct describes broadcasting, applied to OPERAND.  FACTOR is
 247    broadcast factor.  */
 248 struct Broadcast_Operation
 249 {
 250   /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}.  */
 251   int type;
 252
 253   /* Index of broadcasted operand.  */
 254   int operand;
 255
 256   /* Number of bytes to broadcast.  */
 257   int bytes;
 258 };
 259
 260 static struct Broadcast_Operation broadcast_op;
 261
 262 /* VEX prefix.  */
 263 typedef struct
 264 {
 265   /* VEX prefix is either 2 byte or 3 byte.  EVEX is 4 byte.  */
 266   unsigned char bytes[4];
 267   unsigned int length;
 268   /* Destination or source register specifier.  */
 269   const reg_entry *register_specifier;
 270 } vex_prefix;
 271
 272 /* 'md_assemble ()' gathers together information and puts it into a
 273    i386_insn.  */
 274
 275 union i386_op
 276   {
 277     expressionS *disps;
 278     expressionS *imms;
 279     const reg_entry *regs;
 280   };
 281
 282 enum i386_error
 283   {
 284     operand_size_mismatch,
 285     operand_type_mismatch,
 286     register_type_mismatch,
 287     number_of_operands_mismatch,
 288     invalid_instruction_suffix,
 289     bad_imm4,
 290     unsupported_with_intel_mnemonic,
 291     unsupported_syntax,
 292     unsupported,
 293     invalid_sib_address,
 294     invalid_vsib_address,
 295     invalid_vector_register_set,
 296     invalid_tmm_register_set,
 297     unsupported_vector_index_register,
 298     unsupported_broadcast,
 299     broadcast_needed,
 300     unsupported_masking,
 301     mask_not_on_destination,
 302     no_default_mask,
 303     unsupported_rc_sae,
 304     rc_sae_operand_not_last_imm,
 305     invalid_register_operand,
 306   };
 307
 308 struct _i386_insn
 309   {
 310     /* TM holds the template for the insn were currently assembling.  */
 311     insn_template tm;
 312
 313     /* SUFFIX holds the instruction size suffix for byte, word, dword
 314        or qword, if given.  */
 315     char suffix;
 316
 317     /* OPERANDS gives the number of given operands.  */
 318     unsigned int operands;
 319
 320     /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
 321        of given register, displacement, memory operands and immediate
 322        operands.  */
 323     unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
 324
 325     /* TYPES [i] is the type (see above #defines) which tells us how to
 326        use OP[i] for the corresponding operand.  */
 327     i386_operand_type types[MAX_OPERANDS];
 328
 329     /* Displacement expression, immediate expression, or register for each
 330        operand.  */
 331     union i386_op op[MAX_OPERANDS];
 332
 333     /* Flags for operands.  */
 334     unsigned int flags[MAX_OPERANDS];
 335 #define Operand_PCrel 1
 336 #define Operand_Mem   2
 337
 338     /* Relocation type for operand */
 339     enum bfd_reloc_code_real reloc[MAX_OPERANDS];
 340
 341     /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
 342        the base index byte below.  */
 343     const reg_entry *base_reg;
 344     const reg_entry *index_reg;
 345     unsigned int log2_scale_factor;
 346
 347     /* SEG gives the seg_entries of this insn.  They are zero unless
 348        explicit segment overrides are given.  */
 349     const seg_entry *seg[2];
 350
 351     /* Copied first memory operand string, for re-checking.  */
 352     char *memop1_string;
 353
 354     /* PREFIX holds all the given prefix opcodes (usually null).
 355        PREFIXES is the number of prefix opcodes.  */
 356     unsigned int prefixes;
 357     unsigned char prefix[MAX_PREFIXES];
 358
 359     /* Register is in low 3 bits of opcode.  */
 360     bfd_boolean short_form;
 361
 362     /* The operand to a branch insn indicates an absolute branch.  */
 363     bfd_boolean jumpabsolute;
 364
 365     /* Extended states.  */
 366     enum
 367       {
 368         /* Use MMX state.  */
 369         xstate_mmx = 1 << 0,
 370         /* Use XMM state.  */
 371         xstate_xmm = 1 << 1,
 372         /* Use YMM state.  */
 373         xstate_ymm = 1 << 2 | xstate_xmm,
 374         /* Use ZMM state.  */
 375         xstate_zmm = 1 << 3 | xstate_ymm,
 376         /* Use TMM state.  */
 377         xstate_tmm = 1 << 4,
 378         /* Use MASK state.  */
 379         xstate_mask = 1 << 5
 380       } xstate;
 381
 382     /* Has GOTPC or TLS relocation.  */
 383     bfd_boolean has_gotpc_tls_reloc;
 384
 385     /* RM and SIB are the modrm byte and the sib byte where the
 386        addressing modes of this insn are encoded.  */
 387     modrm_byte rm;
 388     rex_byte rex;
 389     rex_byte vrex;
 390     sib_byte sib;
 391     vex_prefix vex;
 392
 393     /* Masking attributes.  */
 394     struct Mask_Operation *mask;
 395
 396     /* Rounding control and SAE attributes.  */
 397     struct RC_Operation *rounding;
 398
 399     /* Broadcasting attributes.  */
 400     struct Broadcast_Operation *broadcast;
 401
 402     /* Compressed disp8*N attribute.  */
 403     unsigned int memshift;
 404
 405     /* Prefer load or store in encoding.  */
 406     enum
 407       {
 408         dir_encoding_default = 0,
 409         dir_encoding_load,
 410         dir_encoding_store,
 411         dir_encoding_swap
 412       } dir_encoding;
 413
 414     /* Prefer 8bit, 16bit, 32bit displacement in encoding.  */
 415     enum
 416       {
 417         disp_encoding_default = 0,
 418         disp_encoding_8bit,
 419         disp_encoding_16bit,
 420         disp_encoding_32bit
 421       } disp_encoding;
 422
 423     /* Prefer the REX byte in encoding.  */
 424     bfd_boolean rex_encoding;
 425
 426     /* Disable instruction size optimization.  */
 427     bfd_boolean no_optimize;
 428
 429     /* How to encode vector instructions.  */
 430     enum
 431       {
 432         vex_encoding_default = 0,
 433         vex_encoding_vex,
 434         vex_encoding_vex3,
 435         vex_encoding_evex,
 436         vex_encoding_error
 437       } vec_encoding;
 438
 439     /* REP prefix.  */
 440     const char *rep_prefix;
 441
 442     /* HLE prefix.  */
 443     const char *hle_prefix;
 444
 445     /* Have BND prefix.  */
 446     const char *bnd_prefix;
 447
 448     /* Have NOTRACK prefix.  */
 449     const char *notrack_prefix;
 450
 451     /* Error message.  */
 452     enum i386_error error;
 453   };
 454
 455 typedef struct _i386_insn i386_insn;
 456
 457 /* Link RC type with corresponding string, that'll be looked for in
 458    asm.  */
 459 struct RC_name
 460 {
 461   enum rc_type type;
 462   const char *name;
 463   unsigned int len;
 464 };
 465
 466 static const struct RC_name RC_NamesTable[] =
 467 {
 468   {  rne, STRING_COMMA_LEN ("rn-sae") },
 469   {  rd,  STRING_COMMA_LEN ("rd-sae") },
 470   {  ru,  STRING_COMMA_LEN ("ru-sae") },
 471   {  rz,  STRING_COMMA_LEN ("rz-sae") },
 472   {  saeonly,  STRING_COMMA_LEN ("sae") },
 473 };
 474
 475 /* List of chars besides those in app.c:symbol_chars that can start an
 476    operand.  Used to prevent the scrubber eating vital white-space.  */
 477 const char extra_symbol_chars[] = "*%-([{}"
 478 #ifdef LEX_AT
 479         "@"
 480 #endif
 481 #ifdef LEX_QM
 482         "?"
 483 #endif
 484         ;
 485
 486 #if ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF))     \
 487      && !defined (TE_GNU)                               \
 488      && !defined (TE_LINUX)                             \
 489      && !defined (TE_FreeBSD)                           \
 490      && !defined (TE_DragonFly)                         \
 491      && !defined (TE_NetBSD))
 492 /* This array holds the chars that always start a comment.  If the
 493    pre-processor is disabled, these aren't very useful.  The option
 494    --divide will remove '/' from this list.  */
 495 const char *i386_comment_chars = "#/";
 496 #define SVR4_COMMENT_CHARS 1
 497 #define PREFIX_SEPARATOR '\\'
 498
 499 #else
 500 const char *i386_comment_chars = "#";
 501 #define PREFIX_SEPARATOR '/'
 502 #endif
 503
 504 /* This array holds the chars that only start a comment at the beginning of
 505    a line.  If the line seems to have the form '# 123 filename'
 506    .line and .file directives will appear in the pre-processed output.
 507    Note that input_file.c hand checks for '#' at the beginning of the
 508    first line of the input file.  This is because the compiler outputs
 509    #NO_APP at the beginning of its output.
 510    Also note that comments started like this one will always work if
 511    '/' isn't otherwise defined.  */
 512 const char line_comment_chars[] = "#/";
 513
 514 const char line_separator_chars[] = ";";
 515
 516 /* Chars that can be used to separate mant from exp in floating point
 517    nums.  */
 518 const char EXP_CHARS[] = "eE";
 519
 520 /* Chars that mean this number is a floating point constant
 521    As in 0f12.456
 522    or    0d1.2345e12.  */
 523 const char FLT_CHARS[] = "fFdDxX";
 524
 525 /* Tables for lexical analysis.  */
 526 static char mnemonic_chars[256];
 527 static char register_chars[256];
 528 static char operand_chars[256];
 529 static char identifier_chars[256];
 530 static char digit_chars[256];
 531
 532 /* Lexical macros.  */
 533 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
 534 #define is_operand_char(x) (operand_chars[(unsigned char) x])
 535 #define is_register_char(x) (register_chars[(unsigned char) x])
 536 #define is_space_char(x) ((x) == ' ')
 537 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
 538 #define is_digit_char(x) (digit_chars[(unsigned char) x])
 539
 540 /* All non-digit non-letter characters that may occur in an operand.  */
 541 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
 542
 543 /* md_assemble() always leaves the strings it's passed unaltered.  To
 544    effect this we maintain a stack of saved characters that we've smashed
 545    with '\0's (indicating end of strings for various sub-fields of the
 546    assembler instruction).  */
 547 static char save_stack[32];
 548 static char *save_stack_p;
 549 #define END_STRING_AND_SAVE(s) \
 550         do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
 551 #define RESTORE_END_STRING(s) \
 552         do { *(s) = *--save_stack_p; } while (0)
 553
 554 /* The instruction we're assembling.  */
 555 static i386_insn i;
 556
 557 /* Possible templates for current insn.  */
 558 static const templates *current_templates;
 559
 560 /* Per instruction expressionS buffers: max displacements & immediates.  */
 561 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
 562 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
 563
 564 /* Current operand we are working on.  */
 565 static int this_operand = -1;
 566
 567 /* We support four different modes.  FLAG_CODE variable is used to distinguish
 568    these.  */
 569
 570 enum flag_code {
 571         CODE_32BIT,
 572         CODE_16BIT,
 573         CODE_64BIT };
 574
 575 static enum flag_code flag_code;
 576 static unsigned int object_64bit;
 577 static unsigned int disallow_64bit_reloc;
 578 static int use_rela_relocations = 0;
 579 /* __tls_get_addr/___tls_get_addr symbol for TLS.  */
 580 static const char *tls_get_addr;
 581
 582 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
 583      || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
 584      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
 585
 586 /* The ELF ABI to use.  */
 587 enum x86_elf_abi
 588 {
 589   I386_ABI,
 590   X86_64_ABI,
 591   X86_64_X32_ABI
 592 };
 593
 594 static enum x86_elf_abi x86_elf_abi = I386_ABI;
 595 #endif
 596
 597 #if defined (TE_PE) || defined (TE_PEP)
 598 /* Use big object file format.  */
 599 static int use_big_obj = 0;
 600 #endif
 601
 602 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
 603 /* 1 if generating code for a shared library.  */
 604 static int shared = 0;
 605 #endif
 606
 607 /* 1 for intel syntax,
 608    0 if att syntax.  */
 609 static int intel_syntax = 0;
 610
 611 static enum x86_64_isa
 612 {
 613   amd64 = 1,    /* AMD64 ISA.  */
 614   intel64       /* Intel64 ISA.  */
 615 } isa64;
 616
 617 /* 1 for intel mnemonic,
 618    0 if att mnemonic.  */
 619 static int intel_mnemonic = !SYSV386_COMPAT;
 620
 621 /* 1 if pseudo registers are permitted.  */
 622 static int allow_pseudo_reg = 0;
 623
 624 /* 1 if register prefix % not required.  */
 625 static int allow_naked_reg = 0;
 626
 627 /* 1 if the assembler should add BND prefix for all control-transferring
 628    instructions supporting it, even if this prefix wasn't specified
 629    explicitly.  */
 630 static int add_bnd_prefix = 0;
 631
 632 /* 1 if pseudo index register, eiz/riz, is allowed .  */
 633 static int allow_index_reg = 0;
 634
 635 /* 1 if the assembler should ignore LOCK prefix, even if it was
 636    specified explicitly.  */
 637 static int omit_lock_prefix = 0;
 638
 639 /* 1 if the assembler should encode lfence, mfence, and sfence as
 640    "lock addl $0, (%{re}sp)".  */
 641 static int avoid_fence = 0;
 642
 643 /* 1 if lfence should be inserted after every load.  */
 644 static int lfence_after_load = 0;
 645
 646 /* Non-zero if lfence should be inserted before indirect branch.  */
 647 static enum lfence_before_indirect_branch_kind
 648   {
 649     lfence_branch_none = 0,
 650     lfence_branch_register,
 651     lfence_branch_memory,
 652     lfence_branch_all
 653   }
 654 lfence_before_indirect_branch;
 655
 656 /* Non-zero if lfence should be inserted before ret.  */
 657 static enum lfence_before_ret_kind
 658   {
 659     lfence_before_ret_none = 0,
 660     lfence_before_ret_not,
 661     lfence_before_ret_or,
 662     lfence_before_ret_shl
 663   }
 664 lfence_before_ret;
 665
 666 /* Types of previous instruction is .byte or prefix.  */
 667 static struct
 668   {
 669     segT seg;
 670     const char *file;
 671     const char *name;
 672     unsigned int line;
 673     enum last_insn_kind
 674       {
 675         last_insn_other = 0,
 676         last_insn_directive,
 677         last_insn_prefix
 678       } kind;
 679   } last_insn;
 680
 681 /* 1 if the assembler should generate relax relocations.  */
 682
 683 static int generate_relax_relocations
 684   = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
 685
 686 static enum check_kind
 687   {
 688     check_none = 0,
 689     check_warning,
 690     check_error
 691   }
 692 sse_check, operand_check = check_warning;
 693
 694 /* Non-zero if branches should be aligned within power of 2 boundary.  */
 695 static int align_branch_power = 0;
 696
 697 /* Types of branches to align.  */
 698 enum align_branch_kind
 699   {
 700     align_branch_none = 0,
 701     align_branch_jcc = 1,
 702     align_branch_fused = 2,
 703     align_branch_jmp = 3,
 704     align_branch_call = 4,
 705     align_branch_indirect = 5,
 706     align_branch_ret = 6
 707   };
 708
 709 /* Type bits of branches to align.  */
 710 enum align_branch_bit
 711   {
 712     align_branch_jcc_bit = 1 << align_branch_jcc,
 713     align_branch_fused_bit = 1 << align_branch_fused,
 714     align_branch_jmp_bit = 1 << align_branch_jmp,
 715     align_branch_call_bit = 1 << align_branch_call,
 716     align_branch_indirect_bit = 1 << align_branch_indirect,
 717     align_branch_ret_bit = 1 << align_branch_ret
 718   };
 719
 720 static unsigned int align_branch = (align_branch_jcc_bit
 721                                     | align_branch_fused_bit
 722                                     | align_branch_jmp_bit);
 723
 724 /* Types of condition jump used by macro-fusion.  */
 725 enum mf_jcc_kind
 726   {
 727     mf_jcc_jo = 0,  /* base opcode 0x70  */
 728     mf_jcc_jc,      /* base opcode 0x72  */
 729     mf_jcc_je,      /* base opcode 0x74  */
 730     mf_jcc_jna,     /* base opcode 0x76  */
 731     mf_jcc_js,      /* base opcode 0x78  */
 732     mf_jcc_jp,      /* base opcode 0x7a  */
 733     mf_jcc_jl,      /* base opcode 0x7c  */
 734     mf_jcc_jle,     /* base opcode 0x7e  */
 735   };
 736
 737 /* Types of compare flag-modifying insntructions used by macro-fusion.  */
 738 enum mf_cmp_kind
 739   {
 740     mf_cmp_test_and,  /* test/cmp */
 741     mf_cmp_alu_cmp,  /* add/sub/cmp */
 742     mf_cmp_incdec  /* inc/dec */
 743   };
 744
 745 /* The maximum padding size for fused jcc.  CMP like instruction can
 746    be 9 bytes and jcc can be 6 bytes.  Leave room just in case for
 747    prefixes.   */
 748 #define MAX_FUSED_JCC_PADDING_SIZE 20
 749
 750 /* The maximum number of prefixes added for an instruction.  */
 751 static unsigned int align_branch_prefix_size = 5;
 752
 753 /* Optimization:
 754    1. Clear the REX_W bit with register operand if possible.
 755    2. Above plus use 128bit vector instruction to clear the full vector
 756       register.
 757  */
 758 static int optimize = 0;
 759
 760 /* Optimization:
 761    1. Clear the REX_W bit with register operand if possible.
 762    2. Above plus use 128bit vector instruction to clear the full vector
 763       register.
 764    3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
 765       "testb $imm7,%r8".
 766  */
 767 static int optimize_for_space = 0;
 768
 769 /* Register prefix used for error message.  */
 770 static const char *register_prefix = "%";
 771
 772 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
 773    leave, push, and pop instructions so that gcc has the same stack
 774    frame as in 32 bit mode.  */
 775 static char stackop_size = '\0';
 776
 777 /* Non-zero to optimize code alignment.  */
 778 int optimize_align_code = 1;
 779
 780 /* Non-zero to quieten some warnings.  */
 781 static int quiet_warnings = 0;
 782
 783 /* CPU name.  */
 784 static const char *cpu_arch_name = NULL;
 785 static char *cpu_sub_arch_name = NULL;
 786
 787 /* CPU feature flags.  */
 788 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
 789
 790 /* If we have selected a cpu we are generating instructions for.  */
 791 static int cpu_arch_tune_set = 0;
 792
 793 /* Cpu we are generating instructions for.  */
 794 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
 795
 796 /* CPU feature flags of cpu we are generating instructions for.  */
 797 static i386_cpu_flags cpu_arch_tune_flags;
 798
 799 /* CPU instruction set architecture used.  */
 800 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
 801
 802 /* CPU feature flags of instruction set architecture used.  */
 803 i386_cpu_flags cpu_arch_isa_flags;
 804
 805 /* If set, conditional jumps are not automatically promoted to handle
 806    larger than a byte offset.  */
 807 static unsigned int no_cond_jump_promotion = 0;
 808
 809 /* Encode SSE instructions with VEX prefix.  */
 810 static unsigned int sse2avx;
 811
 812 /* Encode scalar AVX instructions with specific vector length.  */
 813 static enum
 814   {
 815     vex128 = 0,
 816     vex256
 817   } avxscalar;
 818
 819 /* Encode VEX WIG instructions with specific vex.w.  */
 820 static enum
 821   {
 822     vexw0 = 0,
 823     vexw1
 824   } vexwig;
 825
 826 /* Encode scalar EVEX LIG instructions with specific vector length.  */
 827 static enum
 828   {
 829     evexl128 = 0,
 830     evexl256,
 831     evexl512
 832   } evexlig;
 833
 834 /* Encode EVEX WIG instructions with specific evex.w.  */
 835 static enum
 836   {
 837     evexw0 = 0,
 838     evexw1
 839   } evexwig;
 840
 841 /* Value to encode in EVEX RC bits, for SAE-only instructions.  */
 842 static enum rc_type evexrcig = rne;
 843
 844 /* Pre-defined "_GLOBAL_OFFSET_TABLE_".  */
 845 static symbolS *GOT_symbol;
 846
 847 /* The dwarf2 return column, adjusted for 32 or 64 bit.  */
 848 unsigned int x86_dwarf2_return_column;
 849
 850 /* The dwarf2 data alignment, adjusted for 32 or 64 bit.  */
 851 int x86_cie_data_alignment;
 852
 853 /* Interface to relax_segment.
 854    There are 3 major relax states for 386 jump insns because the
 855    different types of jumps add different sizes to frags when we're
 856    figuring out what sort of jump to choose to reach a given label.
 857
 858    BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
 859    branches which are handled by md_estimate_size_before_relax() and
 860    i386_generic_table_relax_frag().  */
 861
 862 /* Types.  */
 863 #define UNCOND_JUMP 0
 864 #define COND_JUMP 1
 865 #define COND_JUMP86 2
 866 #define BRANCH_PADDING 3
 867 #define BRANCH_PREFIX 4
 868 #define FUSED_JCC_PADDING 5
 869
 870 /* Sizes.  */
 871 #define CODE16  1
 872 #define SMALL   0
 873 #define SMALL16 (SMALL | CODE16)
 874 #define BIG     2
 875 #define BIG16   (BIG | CODE16)
 876
 877 #ifndef INLINE
 878 #ifdef __GNUC__
 879 #define INLINE __inline__
 880 #else
 881 #define INLINE
 882 #endif
 883 #endif
 884
 885 #define ENCODE_RELAX_STATE(type, size) \
 886   ((relax_substateT) (((type) << 2) | (size)))
 887 #define TYPE_FROM_RELAX_STATE(s) \
 888   ((s) >> 2)
 889 #define DISP_SIZE_FROM_RELAX_STATE(s) \
 890     ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
 891
 892 /* This table is used by relax_frag to promote short jumps to long
 893    ones where necessary.  SMALL (short) jumps may be promoted to BIG
 894    (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long).  We
 895    don't allow a short jump in a 32 bit code segment to be promoted to
 896    a 16 bit offset jump because it's slower (requires data size
 897    prefix), and doesn't work, unless the destination is in the bottom
 898    64k of the code segment (The top 16 bits of eip are zeroed).  */
 899
 900 const relax_typeS md_relax_table[] =
 901 {
 902   /* The fields are:
 903      1) most positive reach of this state,
 904      2) most negative reach of this state,
 905      3) how many bytes this mode will have in the variable part of the frag
 906      4) which index into the table to try if we can't fit into this one.  */
 907
 908   /* UNCOND_JUMP states.  */
 909   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
 910   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
 911   /* dword jmp adds 4 bytes to frag:
 912      0 extra opcode bytes, 4 displacement bytes.  */
 913   {0, 0, 4, 0},
 914   /* word jmp adds 2 byte2 to frag:
 915      0 extra opcode bytes, 2 displacement bytes.  */
 916   {0, 0, 2, 0},
 917
 918   /* COND_JUMP states.  */
 919   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
 920   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
 921   /* dword conditionals adds 5 bytes to frag:
 922      1 extra opcode byte, 4 displacement bytes.  */
 923   {0, 0, 5, 0},
 924   /* word conditionals add 3 bytes to frag:
 925      1 extra opcode byte, 2 displacement bytes.  */
 926   {0, 0, 3, 0},
 927
 928   /* COND_JUMP86 states.  */
 929   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
 930   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
 931   /* dword conditionals adds 5 bytes to frag:
 932      1 extra opcode byte, 4 displacement bytes.  */
 933   {0, 0, 5, 0},
 934   /* word conditionals add 4 bytes to frag:
 935      1 displacement byte and a 3 byte long branch insn.  */
 936   {0, 0, 4, 0}
 937 };
 938
 939 static const arch_entry cpu_arch[] =
 940 {
 941   /* Do not replace the first two entries - i386_target_format()
 942      relies on them being there in this order.  */
 943   { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
 944     CPU_GENERIC32_FLAGS, 0 },
 945   { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
 946     CPU_GENERIC64_FLAGS, 0 },
 947   { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
 948     CPU_NONE_FLAGS, 0 },
 949   { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
 950     CPU_I186_FLAGS, 0 },
 951   { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
 952     CPU_I286_FLAGS, 0 },
 953   { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
 954     CPU_I386_FLAGS, 0 },
 955   { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
 956     CPU_I486_FLAGS, 0 },
 957   { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
 958     CPU_I586_FLAGS, 0 },
 959   { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
 960     CPU_I686_FLAGS, 0 },
 961   { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
 962     CPU_I586_FLAGS, 0 },
 963   { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
 964     CPU_PENTIUMPRO_FLAGS, 0 },
 965   { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
 966     CPU_P2_FLAGS, 0 },
 967   { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
 968     CPU_P3_FLAGS, 0 },
 969   { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
 970     CPU_P4_FLAGS, 0 },
 971   { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
 972     CPU_CORE_FLAGS, 0 },
 973   { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
 974     CPU_NOCONA_FLAGS, 0 },
 975   { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
 976     CPU_CORE_FLAGS, 1 },
 977   { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
 978     CPU_CORE_FLAGS, 0 },
 979   { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
 980     CPU_CORE2_FLAGS, 1 },
 981   { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
 982     CPU_CORE2_FLAGS, 0 },
 983   { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
 984     CPU_COREI7_FLAGS, 0 },
 985   { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
 986     CPU_L1OM_FLAGS, 0 },
 987   { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
 988     CPU_K1OM_FLAGS, 0 },
 989   { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
 990     CPU_IAMCU_FLAGS, 0 },
 991   { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
 992     CPU_K6_FLAGS, 0 },
 993   { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
 994     CPU_K6_2_FLAGS, 0 },
 995   { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
 996     CPU_ATHLON_FLAGS, 0 },
 997   { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
 998     CPU_K8_FLAGS, 1 },
 999   { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
1000     CPU_K8_FLAGS, 0 },
1001   { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
1002     CPU_K8_FLAGS, 0 },
1003   { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
1004     CPU_AMDFAM10_FLAGS, 0 },
1005   { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
1006     CPU_BDVER1_FLAGS, 0 },
1007   { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
1008     CPU_BDVER2_FLAGS, 0 },
1009   { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
1010     CPU_BDVER3_FLAGS, 0 },
1011   { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
1012     CPU_BDVER4_FLAGS, 0 },
1013   { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
1014     CPU_ZNVER1_FLAGS, 0 },
1015   { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
1016     CPU_ZNVER2_FLAGS, 0 },
1017   { STRING_COMMA_LEN ("znver3"), PROCESSOR_ZNVER,
1018     CPU_ZNVER3_FLAGS, 0 },
1019   { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
1020     CPU_BTVER1_FLAGS, 0 },
1021   { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
1022     CPU_BTVER2_FLAGS, 0 },
1023   { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
1024     CPU_8087_FLAGS, 0 },
1025   { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
1026     CPU_287_FLAGS, 0 },
1027   { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
1028     CPU_387_FLAGS, 0 },
1029   { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
1030     CPU_687_FLAGS, 0 },
1031   { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
1032     CPU_CMOV_FLAGS, 0 },
1033   { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
1034     CPU_FXSR_FLAGS, 0 },
1035   { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
1036     CPU_MMX_FLAGS, 0 },
1037   { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
1038     CPU_SSE_FLAGS, 0 },
1039   { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
1040     CPU_SSE2_FLAGS, 0 },
1041   { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
1042     CPU_SSE3_FLAGS, 0 },
1043   { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1044     CPU_SSE4A_FLAGS, 0 },
1045   { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
1046     CPU_SSSE3_FLAGS, 0 },
1047   { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
1048     CPU_SSE4_1_FLAGS, 0 },
1049   { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
1050     CPU_SSE4_2_FLAGS, 0 },
1051   { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
1052     CPU_SSE4_2_FLAGS, 0 },
1053   { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
1054     CPU_AVX_FLAGS, 0 },
1055   { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
1056     CPU_AVX2_FLAGS, 0 },
1057   { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
1058     CPU_AVX512F_FLAGS, 0 },
1059   { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
1060     CPU_AVX512CD_FLAGS, 0 },
1061   { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
1062     CPU_AVX512ER_FLAGS, 0 },
1063   { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
1064     CPU_AVX512PF_FLAGS, 0 },
1065   { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
1066     CPU_AVX512DQ_FLAGS, 0 },
1067   { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
1068     CPU_AVX512BW_FLAGS, 0 },
1069   { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
1070     CPU_AVX512VL_FLAGS, 0 },
1071   { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
1072     CPU_VMX_FLAGS, 0 },
1073   { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
1074     CPU_VMFUNC_FLAGS, 0 },
1075   { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
1076     CPU_SMX_FLAGS, 0 },
1077   { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
1078     CPU_XSAVE_FLAGS, 0 },
1079   { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
1080     CPU_XSAVEOPT_FLAGS, 0 },
1081   { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
1082     CPU_XSAVEC_FLAGS, 0 },
1083   { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
1084     CPU_XSAVES_FLAGS, 0 },
1085   { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
1086     CPU_AES_FLAGS, 0 },
1087   { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
1088     CPU_PCLMUL_FLAGS, 0 },
1089   { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
1090     CPU_PCLMUL_FLAGS, 1 },
1091   { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
1092     CPU_FSGSBASE_FLAGS, 0 },
1093   { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
1094     CPU_RDRND_FLAGS, 0 },
1095   { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
1096     CPU_F16C_FLAGS, 0 },
1097   { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
1098     CPU_BMI2_FLAGS, 0 },
1099   { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
1100     CPU_FMA_FLAGS, 0 },
1101   { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
1102     CPU_FMA4_FLAGS, 0 },
1103   { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
1104     CPU_XOP_FLAGS, 0 },
1105   { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
1106     CPU_LWP_FLAGS, 0 },
1107   { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
1108     CPU_MOVBE_FLAGS, 0 },
1109   { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
1110     CPU_CX16_FLAGS, 0 },
1111   { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
1112     CPU_EPT_FLAGS, 0 },
1113   { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
1114     CPU_LZCNT_FLAGS, 0 },
1115   { STRING_COMMA_LEN (".popcnt"), PROCESSOR_UNKNOWN,
1116     CPU_POPCNT_FLAGS, 0 },
1117   { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
1118     CPU_HLE_FLAGS, 0 },
1119   { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
1120     CPU_RTM_FLAGS, 0 },
1121   { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
1122     CPU_INVPCID_FLAGS, 0 },
1123   { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
1124     CPU_CLFLUSH_FLAGS, 0 },
1125   { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
1126     CPU_NOP_FLAGS, 0 },
1127   { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
1128     CPU_SYSCALL_FLAGS, 0 },
1129   { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
1130     CPU_RDTSCP_FLAGS, 0 },
1131   { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
1132     CPU_3DNOW_FLAGS, 0 },
1133   { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
1134     CPU_3DNOWA_FLAGS, 0 },
1135   { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
1136     CPU_PADLOCK_FLAGS, 0 },
1137   { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
1138     CPU_SVME_FLAGS, 1 },
1139   { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
1140     CPU_SVME_FLAGS, 0 },
1141   { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1142     CPU_SSE4A_FLAGS, 0 },
1143   { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
1144     CPU_ABM_FLAGS, 0 },
1145   { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
1146     CPU_BMI_FLAGS, 0 },
1147   { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
1148     CPU_TBM_FLAGS, 0 },
1149   { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
1150     CPU_ADX_FLAGS, 0 },
1151   { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
1152     CPU_RDSEED_FLAGS, 0 },
1153   { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
1154     CPU_PRFCHW_FLAGS, 0 },
1155   { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
1156     CPU_SMAP_FLAGS, 0 },
1157   { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
1158     CPU_MPX_FLAGS, 0 },
1159   { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
1160     CPU_SHA_FLAGS, 0 },
1161   { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
1162     CPU_CLFLUSHOPT_FLAGS, 0 },
1163   { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
1164     CPU_PREFETCHWT1_FLAGS, 0 },
1165   { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
1166     CPU_SE1_FLAGS, 0 },
1167   { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
1168     CPU_CLWB_FLAGS, 0 },
1169   { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
1170     CPU_AVX512IFMA_FLAGS, 0 },
1171   { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
1172     CPU_AVX512VBMI_FLAGS, 0 },
1173   { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1174     CPU_AVX512_4FMAPS_FLAGS, 0 },
1175   { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1176     CPU_AVX512_4VNNIW_FLAGS, 0 },
1177   { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1178     CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
1179   { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1180     CPU_AVX512_VBMI2_FLAGS, 0 },
1181   { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1182     CPU_AVX512_VNNI_FLAGS, 0 },
1183   { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1184     CPU_AVX512_BITALG_FLAGS, 0 },
1185   { STRING_COMMA_LEN (".avx_vnni"), PROCESSOR_UNKNOWN,
1186     CPU_AVX_VNNI_FLAGS, 0 },
1187   { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
1188     CPU_CLZERO_FLAGS, 0 },
1189   { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
1190     CPU_MWAITX_FLAGS, 0 },
1191   { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
1192     CPU_OSPKE_FLAGS, 0 },
1193   { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
1194     CPU_RDPID_FLAGS, 0 },
1195   { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1196     CPU_PTWRITE_FLAGS, 0 },
1197   { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1198     CPU_IBT_FLAGS, 0 },
1199   { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1200     CPU_SHSTK_FLAGS, 0 },
1201   { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1202     CPU_GFNI_FLAGS, 0 },
1203   { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1204     CPU_VAES_FLAGS, 0 },
1205   { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1206     CPU_VPCLMULQDQ_FLAGS, 0 },
1207   { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1208     CPU_WBNOINVD_FLAGS, 0 },
1209   { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1210     CPU_PCONFIG_FLAGS, 0 },
1211   { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1212     CPU_WAITPKG_FLAGS, 0 },
1213   { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1214     CPU_CLDEMOTE_FLAGS, 0 },
1215   { STRING_COMMA_LEN (".amx_int8"), PROCESSOR_UNKNOWN,
1216     CPU_AMX_INT8_FLAGS, 0 },
1217   { STRING_COMMA_LEN (".amx_bf16"), PROCESSOR_UNKNOWN,
1218     CPU_AMX_BF16_FLAGS, 0 },
1219   { STRING_COMMA_LEN (".amx_tile"), PROCESSOR_UNKNOWN,
1220     CPU_AMX_TILE_FLAGS, 0 },
1221   { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1222     CPU_MOVDIRI_FLAGS, 0 },
1223   { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1224     CPU_MOVDIR64B_FLAGS, 0 },
1225   { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1226     CPU_AVX512_BF16_FLAGS, 0 },
1227   { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
1228     CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
1229   { STRING_COMMA_LEN (".tdx"), PROCESSOR_UNKNOWN,
1230     CPU_TDX_FLAGS, 0 },
1231   { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
1232     CPU_ENQCMD_FLAGS, 0 },
1233   { STRING_COMMA_LEN (".serialize"), PROCESSOR_UNKNOWN,
1234     CPU_SERIALIZE_FLAGS, 0 },
1235   { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
1236     CPU_RDPRU_FLAGS, 0 },
1237   { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
1238     CPU_MCOMMIT_FLAGS, 0 },
1239   { STRING_COMMA_LEN (".sev_es"), PROCESSOR_UNKNOWN,
1240     CPU_SEV_ES_FLAGS, 0 },
1241   { STRING_COMMA_LEN (".tsxldtrk"), PROCESSOR_UNKNOWN,
1242     CPU_TSXLDTRK_FLAGS, 0 },
1243   { STRING_COMMA_LEN (".kl"), PROCESSOR_UNKNOWN,
1244     CPU_KL_FLAGS, 0 },
1245   { STRING_COMMA_LEN (".widekl"), PROCESSOR_UNKNOWN,
1246     CPU_WIDEKL_FLAGS, 0 },
1247   { STRING_COMMA_LEN (".uintr"), PROCESSOR_UNKNOWN,
1248     CPU_UINTR_FLAGS, 0 },
1249   { STRING_COMMA_LEN (".hreset"), PROCESSOR_UNKNOWN,
1250     CPU_HRESET_FLAGS, 0 },
1251 };
1252
1253 static const noarch_entry cpu_noarch[] =
1254 {
1255   { STRING_COMMA_LEN ("no87"),  CPU_ANY_X87_FLAGS },
1256   { STRING_COMMA_LEN ("no287"),  CPU_ANY_287_FLAGS },
1257   { STRING_COMMA_LEN ("no387"),  CPU_ANY_387_FLAGS },
1258   { STRING_COMMA_LEN ("no687"),  CPU_ANY_687_FLAGS },
1259   { STRING_COMMA_LEN ("nocmov"),  CPU_ANY_CMOV_FLAGS },
1260   { STRING_COMMA_LEN ("nofxsr"),  CPU_ANY_FXSR_FLAGS },
1261   { STRING_COMMA_LEN ("nommx"),  CPU_ANY_MMX_FLAGS },
1262   { STRING_COMMA_LEN ("nosse"),  CPU_ANY_SSE_FLAGS },
1263   { STRING_COMMA_LEN ("nosse2"),  CPU_ANY_SSE2_FLAGS },
1264   { STRING_COMMA_LEN ("nosse3"),  CPU_ANY_SSE3_FLAGS },
1265   { STRING_COMMA_LEN ("nosse4a"),  CPU_ANY_SSE4A_FLAGS },
1266   { STRING_COMMA_LEN ("nossse3"),  CPU_ANY_SSSE3_FLAGS },
1267   { STRING_COMMA_LEN ("nosse4.1"),  CPU_ANY_SSE4_1_FLAGS },
1268   { STRING_COMMA_LEN ("nosse4.2"),  CPU_ANY_SSE4_2_FLAGS },
1269   { STRING_COMMA_LEN ("nosse4"),  CPU_ANY_SSE4_1_FLAGS },
1270   { STRING_COMMA_LEN ("noavx"),  CPU_ANY_AVX_FLAGS },
1271   { STRING_COMMA_LEN ("noavx2"),  CPU_ANY_AVX2_FLAGS },
1272   { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1273   { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1274   { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1275   { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1276   { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1277   { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1278   { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1279   { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1280   { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
1281   { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
1282   { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
1283   { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
1284   { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
1285   { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
1286   { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
1287   { STRING_COMMA_LEN ("noavx_vnni"), CPU_ANY_AVX_VNNI_FLAGS },
1288   { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1289   { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
1290   { STRING_COMMA_LEN ("noamx_int8"), CPU_ANY_AMX_INT8_FLAGS },
1291   { STRING_COMMA_LEN ("noamx_bf16"), CPU_ANY_AMX_BF16_FLAGS },
1292   { STRING_COMMA_LEN ("noamx_tile"), CPU_ANY_AMX_TILE_FLAGS },
1293   { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1294   { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
1295   { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
1296   { STRING_COMMA_LEN ("noavx512_vp2intersect"),
1297     CPU_ANY_AVX512_VP2INTERSECT_FLAGS },
1298   { STRING_COMMA_LEN ("notdx"), CPU_ANY_TDX_FLAGS },
1299   { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
1300   { STRING_COMMA_LEN ("noserialize"), CPU_ANY_SERIALIZE_FLAGS },
1301   { STRING_COMMA_LEN ("notsxldtrk"), CPU_ANY_TSXLDTRK_FLAGS },
1302   { STRING_COMMA_LEN ("nokl"), CPU_ANY_KL_FLAGS },
1303   { STRING_COMMA_LEN ("nowidekl"), CPU_ANY_WIDEKL_FLAGS },
1304   { STRING_COMMA_LEN ("nouintr"), CPU_ANY_UINTR_FLAGS },
1305   { STRING_COMMA_LEN ("nohreset"), CPU_ANY_HRESET_FLAGS },
1306 };
1307
1308 #ifdef I386COFF
1309 /* Like s_lcomm_internal in gas/read.c but the alignment string
1310    is allowed to be optional.  */
1311
1312 static symbolS *
1313 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1314 {
1315   addressT align = 0;
1316
1317   SKIP_WHITESPACE ();
1318
1319   if (needs_align
1320       && *input_line_pointer == ',')
1321     {
1322       align = parse_align (needs_align - 1);
1323
1324       if (align == (addressT) -1)
1325         return NULL;
1326     }
1327   else
1328     {
1329       if (size >= 8)
1330         align = 3;
1331       else if (size >= 4)
1332         align = 2;
1333       else if (size >= 2)
1334         align = 1;
1335       else
1336         align = 0;
1337     }
1338
1339   bss_alloc (symbolP, size, align);
1340   return symbolP;
1341 }
1342
1343 static void
1344 pe_lcomm (int needs_align)
1345 {
1346   s_comm_internal (needs_align * 2, pe_lcomm_internal);
1347 }
1348 #endif
1349
1350 const pseudo_typeS md_pseudo_table[] =
1351 {
1352 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1353   {"align", s_align_bytes, 0},
1354 #else
1355   {"align", s_align_ptwo, 0},
1356 #endif
1357   {"arch", set_cpu_arch, 0},
1358 #ifndef I386COFF
1359   {"bss", s_bss, 0},
1360 #else
1361   {"lcomm", pe_lcomm, 1},
1362 #endif
1363   {"ffloat", float_cons, 'f'},
1364   {"dfloat", float_cons, 'd'},
1365   {"tfloat", float_cons, 'x'},
1366   {"value", cons, 2},
1367   {"slong", signed_cons, 4},
1368   {"noopt", s_ignore, 0},
1369   {"optim", s_ignore, 0},
1370   {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1371   {"code16", set_code_flag, CODE_16BIT},
1372   {"code32", set_code_flag, CODE_32BIT},
1373 #ifdef BFD64
1374   {"code64", set_code_flag, CODE_64BIT},
1375 #endif
1376   {"intel_syntax", set_intel_syntax, 1},
1377   {"att_syntax", set_intel_syntax, 0},
1378   {"intel_mnemonic", set_intel_mnemonic, 1},
1379   {"att_mnemonic", set_intel_mnemonic, 0},
1380   {"allow_index_reg", set_allow_index_reg, 1},
1381   {"disallow_index_reg", set_allow_index_reg, 0},
1382   {"sse_check", set_check, 0},
1383   {"operand_check", set_check, 1},
1384 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1385   {"largecomm", handle_large_common, 0},
1386 #else
1387   {"file", dwarf2_directive_file, 0},
1388   {"loc", dwarf2_directive_loc, 0},
1389   {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1390 #endif
1391 #ifdef TE_PE
1392   {"secrel32", pe_directive_secrel, 0},
1393 #endif
1394   {0, 0, 0}
1395 };
1396
1397 /* For interface with expression ().  */
1398 extern char *input_line_pointer;
1399
1400 /* Hash table for instruction mnemonic lookup.  */
1401 static htab_t op_hash;
1402
1403 /* Hash table for register lookup.  */
1404 static htab_t reg_hash;
1405 \f
1406   /* Various efficient no-op patterns for aligning code labels.
1407      Note: Don't try to assemble the instructions in the comments.
1408      0L and 0w are not legal.  */
1409 static const unsigned char f32_1[] =
1410   {0x90};                               /* nop                  */
1411 static const unsigned char f32_2[] =
1412   {0x66,0x90};                          /* xchg %ax,%ax         */
1413 static const unsigned char f32_3[] =
1414   {0x8d,0x76,0x00};                     /* leal 0(%esi),%esi    */
1415 static const unsigned char f32_4[] =
1416   {0x8d,0x74,0x26,0x00};                /* leal 0(%esi,1),%esi  */
1417 static const unsigned char f32_6[] =
1418   {0x8d,0xb6,0x00,0x00,0x00,0x00};      /* leal 0L(%esi),%esi   */
1419 static const unsigned char f32_7[] =
1420   {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1421 static const unsigned char f16_3[] =
1422   {0x8d,0x74,0x00};                     /* lea 0(%si),%si       */
1423 static const unsigned char f16_4[] =
1424   {0x8d,0xb4,0x00,0x00};                /* lea 0W(%si),%si      */
1425 static const unsigned char jump_disp8[] =
1426   {0xeb};                               /* jmp disp8           */
1427 static const unsigned char jump32_disp32[] =
1428   {0xe9};                               /* jmp disp32          */
1429 static const unsigned char jump16_disp32[] =
1430   {0x66,0xe9};                          /* jmp disp32          */
1431 /* 32-bit NOPs patterns.  */
1432 static const unsigned char *const f32_patt[] = {
1433   f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
1434 };
1435 /* 16-bit NOPs patterns.  */
1436 static const unsigned char *const f16_patt[] = {
1437   f32_1, f32_2, f16_3, f16_4
1438 };
1439 /* nopl (%[re]ax) */
1440 static const unsigned char alt_3[] =
1441   {0x0f,0x1f,0x00};
1442 /* nopl 0(%[re]ax) */
1443 static const unsigned char alt_4[] =
1444   {0x0f,0x1f,0x40,0x00};
1445 /* nopl 0(%[re]ax,%[re]ax,1) */
1446 static const unsigned char alt_5[] =
1447   {0x0f,0x1f,0x44,0x00,0x00};
1448 /* nopw 0(%[re]ax,%[re]ax,1) */
1449 static const unsigned char alt_6[] =
1450   {0x66,0x0f,0x1f,0x44,0x00,0x00};
1451 /* nopl 0L(%[re]ax) */
1452 static const unsigned char alt_7[] =
1453   {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1454 /* nopl 0L(%[re]ax,%[re]ax,1) */
1455 static const unsigned char alt_8[] =
1456   {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1457 /* nopw 0L(%[re]ax,%[re]ax,1) */
1458 static const unsigned char alt_9[] =
1459   {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1460 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1461 static const unsigned char alt_10[] =
1462   {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1463 /* data16 nopw %cs:0L(%eax,%eax,1) */
1464 static const unsigned char alt_11[] =
1465   {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1466 /* 32-bit and 64-bit NOPs patterns.  */
1467 static const unsigned char *const alt_patt[] = {
1468   f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1469   alt_9, alt_10, alt_11
1470 };
1471
1472 /* Genenerate COUNT bytes of NOPs to WHERE from PATT with the maximum
1473    size of a single NOP instruction MAX_SINGLE_NOP_SIZE.  */
1474
1475 static void
1476 i386_output_nops (char *where, const unsigned char *const *patt,
1477                   int count, int max_single_nop_size)
1478
1479 {
1480   /* Place the longer NOP first.  */
1481   int last;
1482   int offset;
1483   const unsigned char *nops;
1484
1485   if (max_single_nop_size < 1)
1486     {
1487       as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1488                 max_single_nop_size);
1489       return;
1490     }
1491
1492   nops = patt[max_single_nop_size - 1];
1493
1494   /* Use the smaller one if the requsted one isn't available.  */
1495   if (nops == NULL)
1496     {
1497       max_single_nop_size--;
1498       nops = patt[max_single_nop_size - 1];
1499     }
1500
1501   last = count % max_single_nop_size;
1502
1503   count -= last;
1504   for (offset = 0; offset < count; offset += max_single_nop_size)
1505     memcpy (where + offset, nops, max_single_nop_size);
1506
1507   if (last)
1508     {
1509       nops = patt[last - 1];
1510       if (nops == NULL)
1511         {
1512           /* Use the smaller one plus one-byte NOP if the needed one
1513              isn't available.  */
1514           last--;
1515           nops = patt[last - 1];
1516           memcpy (where + offset, nops, last);
1517           where[offset + last] = *patt[0];
1518         }
1519       else
1520         memcpy (where + offset, nops, last);
1521     }
1522 }
1523
1524 static INLINE int
1525 fits_in_imm7 (offsetT num)
1526 {
1527   return (num & 0x7f) == num;
1528 }
1529
1530 static INLINE int
1531 fits_in_imm31 (offsetT num)
1532 {
1533   return (num & 0x7fffffff) == num;
1534 }
1535
1536 /* Genenerate COUNT bytes of NOPs to WHERE with the maximum size of a
1537    single NOP instruction LIMIT.  */
1538
1539 void
1540 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1541 {
1542   const unsigned char *const *patt = NULL;
1543   int max_single_nop_size;
1544   /* Maximum number of NOPs before switching to jump over NOPs.  */
1545   int max_number_of_nops;
1546
1547   switch (fragP->fr_type)
1548     {
1549     case rs_fill_nop:
1550     case rs_align_code:
1551       break;
1552     case rs_machine_dependent:
1553       /* Allow NOP padding for jumps and calls.  */
1554       if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
1555           || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
1556         break;
1557       /* Fall through.  */
1558     default:
1559       return;
1560     }
1561
1562   /* We need to decide which NOP sequence to use for 32bit and
1563      64bit. When -mtune= is used:
1564
1565      1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1566      PROCESSOR_GENERIC32, f32_patt will be used.
1567      2. For the rest, alt_patt will be used.
1568
1569      When -mtune= isn't used, alt_patt will be used if
1570      cpu_arch_isa_flags has CpuNop.  Otherwise, f32_patt will
1571      be used.
1572
1573      When -march= or .arch is used, we can't use anything beyond
1574      cpu_arch_isa_flags.   */
1575
1576   if (flag_code == CODE_16BIT)
1577     {
1578       patt = f16_patt;
1579       max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1580       /* Limit number of NOPs to 2 in 16-bit mode.  */
1581       max_number_of_nops = 2;
1582     }
1583   else
1584     {
1585       if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1586         {
1587           /* PROCESSOR_UNKNOWN means that all ISAs may be used.  */
1588           switch (cpu_arch_tune)
1589             {
1590             case PROCESSOR_UNKNOWN:
1591               /* We use cpu_arch_isa_flags to check if we SHOULD
1592                  optimize with nops.  */
1593               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1594                 patt = alt_patt;
1595               else
1596                 patt = f32_patt;
1597               break;
1598             case PROCESSOR_PENTIUM4:
1599             case PROCESSOR_NOCONA:
1600             case PROCESSOR_CORE:
1601             case PROCESSOR_CORE2:
1602             case PROCESSOR_COREI7:
1603             case PROCESSOR_L1OM:
1604             case PROCESSOR_K1OM:
1605             case PROCESSOR_GENERIC64:
1606             case PROCESSOR_K6:
1607             case PROCESSOR_ATHLON:
1608             case PROCESSOR_K8:
1609             case PROCESSOR_AMDFAM10:
1610             case PROCESSOR_BD:
1611             case PROCESSOR_ZNVER:
1612             case PROCESSOR_BT:
1613               patt = alt_patt;
1614               break;
1615             case PROCESSOR_I386:
1616             case PROCESSOR_I486:
1617             case PROCESSOR_PENTIUM:
1618             case PROCESSOR_PENTIUMPRO:
1619             case PROCESSOR_IAMCU:
1620             case PROCESSOR_GENERIC32:
1621               patt = f32_patt;
1622               break;
1623             }
1624         }
1625       else
1626         {
1627           switch (fragP->tc_frag_data.tune)
1628             {
1629             case PROCESSOR_UNKNOWN:
1630               /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1631                  PROCESSOR_UNKNOWN.  */
1632               abort ();
1633               break;
1634
1635             case PROCESSOR_I386:
1636             case PROCESSOR_I486:
1637             case PROCESSOR_PENTIUM:
1638             case PROCESSOR_IAMCU:
1639             case PROCESSOR_K6:
1640             case PROCESSOR_ATHLON:
1641             case PROCESSOR_K8:
1642             case PROCESSOR_AMDFAM10:
1643             case PROCESSOR_BD:
1644             case PROCESSOR_ZNVER:
1645             case PROCESSOR_BT:
1646             case PROCESSOR_GENERIC32:
1647               /* We use cpu_arch_isa_flags to check if we CAN optimize
1648                  with nops.  */
1649               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1650                 patt = alt_patt;
1651               else
1652                 patt = f32_patt;
1653               break;
1654             case PROCESSOR_PENTIUMPRO:
1655             case PROCESSOR_PENTIUM4:
1656             case PROCESSOR_NOCONA:
1657             case PROCESSOR_CORE:
1658             case PROCESSOR_CORE2:
1659             case PROCESSOR_COREI7:
1660             case PROCESSOR_L1OM:
1661             case PROCESSOR_K1OM:
1662               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1663                 patt = alt_patt;
1664               else
1665                 patt = f32_patt;
1666               break;
1667             case PROCESSOR_GENERIC64:
1668               patt = alt_patt;
1669               break;
1670             }
1671         }
1672
1673       if (patt == f32_patt)
1674         {
1675           max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1676           /* Limit number of NOPs to 2 for older processors.  */
1677           max_number_of_nops = 2;
1678         }
1679       else
1680         {
1681           max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1682           /* Limit number of NOPs to 7 for newer processors.  */
1683           max_number_of_nops = 7;
1684         }
1685     }
1686
1687   if (limit == 0)
1688     limit = max_single_nop_size;
1689
1690   if (fragP->fr_type == rs_fill_nop)
1691     {
1692       /* Output NOPs for .nop directive.  */
1693       if (limit > max_single_nop_size)
1694         {
1695           as_bad_where (fragP->fr_file, fragP->fr_line,
1696                         _("invalid single nop size: %d "
1697                           "(expect within [0, %d])"),
1698                         limit, max_single_nop_size);
1699           return;
1700         }
1701     }
1702   else if (fragP->fr_type != rs_machine_dependent)
1703     fragP->fr_var = count;
1704
1705   if ((count / max_single_nop_size) > max_number_of_nops)
1706     {
1707       /* Generate jump over NOPs.  */
1708       offsetT disp = count - 2;
1709       if (fits_in_imm7 (disp))
1710         {
1711           /* Use "jmp disp8" if possible.  */
1712           count = disp;
1713           where[0] = jump_disp8[0];
1714           where[1] = count;
1715           where += 2;
1716         }
1717       else
1718         {
1719           unsigned int size_of_jump;
1720
1721           if (flag_code == CODE_16BIT)
1722             {
1723               where[0] = jump16_disp32[0];
1724               where[1] = jump16_disp32[1];
1725               size_of_jump = 2;
1726             }
1727           else
1728             {
1729               where[0] = jump32_disp32[0];
1730               size_of_jump = 1;
1731             }
1732
1733           count -= size_of_jump + 4;
1734           if (!fits_in_imm31 (count))
1735             {
1736               as_bad_where (fragP->fr_file, fragP->fr_line,
1737                             _("jump over nop padding out of range"));
1738               return;
1739             }
1740
1741           md_number_to_chars (where + size_of_jump, count, 4);
1742           where += size_of_jump + 4;
1743         }
1744     }
1745
1746   /* Generate multiple NOPs.  */
1747   i386_output_nops (where, patt, count, limit);
1748 }
1749
1750 static INLINE int
1751 operand_type_all_zero (const union i386_operand_type *x)
1752 {
1753   switch (ARRAY_SIZE(x->array))
1754     {
1755     case 3:
1756       if (x->array[2])
1757         return 0;
1758       /* Fall through.  */
1759     case 2:
1760       if (x->array[1])
1761         return 0;
1762       /* Fall through.  */
1763     case 1:
1764       return !x->array[0];
1765     default:
1766       abort ();
1767     }
1768 }
1769
1770 static INLINE void
1771 operand_type_set (union i386_operand_type *x, unsigned int v)
1772 {
1773   switch (ARRAY_SIZE(x->array))
1774     {
1775     case 3:
1776       x->array[2] = v;
1777       /* Fall through.  */
1778     case 2:
1779       x->array[1] = v;
1780       /* Fall through.  */
1781     case 1:
1782       x->array[0] = v;
1783       /* Fall through.  */
1784       break;
1785     default:
1786       abort ();
1787     }
1788
1789   x->bitfield.class = ClassNone;
1790   x->bitfield.instance = InstanceNone;
1791 }
1792
1793 static INLINE int
1794 operand_type_equal (const union i386_operand_type *x,
1795                     const union i386_operand_type *y)
1796 {
1797   switch (ARRAY_SIZE(x->array))
1798     {
1799     case 3:
1800       if (x->array[2] != y->array[2])
1801         return 0;
1802       /* Fall through.  */
1803     case 2:
1804       if (x->array[1] != y->array[1])
1805         return 0;
1806       /* Fall through.  */
1807     case 1:
1808       return x->array[0] == y->array[0];
1809       break;
1810     default:
1811       abort ();
1812     }
1813 }
1814
1815 static INLINE int
1816 cpu_flags_all_zero (const union i386_cpu_flags *x)
1817 {
1818   switch (ARRAY_SIZE(x->array))
1819     {
1820     case 4:
1821       if (x->array[3])
1822         return 0;
1823       /* Fall through.  */
1824     case 3:
1825       if (x->array[2])
1826         return 0;
1827       /* Fall through.  */
1828     case 2:
1829       if (x->array[1])
1830         return 0;
1831       /* Fall through.  */
1832     case 1:
1833       return !x->array[0];
1834     default:
1835       abort ();
1836     }
1837 }
1838
1839 static INLINE int
1840 cpu_flags_equal (const union i386_cpu_flags *x,
1841                  const union i386_cpu_flags *y)
1842 {
1843   switch (ARRAY_SIZE(x->array))
1844     {
1845     case 4:
1846       if (x->array[3] != y->array[3])
1847         return 0;
1848       /* Fall through.  */
1849     case 3:
1850       if (x->array[2] != y->array[2])
1851         return 0;
1852       /* Fall through.  */
1853     case 2:
1854       if (x->array[1] != y->array[1])
1855         return 0;
1856       /* Fall through.  */
1857     case 1:
1858       return x->array[0] == y->array[0];
1859       break;
1860     default:
1861       abort ();
1862     }
1863 }
1864
1865 static INLINE int
1866 cpu_flags_check_cpu64 (i386_cpu_flags f)
1867 {
1868   return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1869            || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1870 }
1871
1872 static INLINE i386_cpu_flags
1873 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1874 {
1875   switch (ARRAY_SIZE (x.array))
1876     {
1877     case 4:
1878       x.array [3] &= y.array [3];
1879       /* Fall through.  */
1880     case 3:
1881       x.array [2] &= y.array [2];
1882       /* Fall through.  */
1883     case 2:
1884       x.array [1] &= y.array [1];
1885       /* Fall through.  */
1886     case 1:
1887       x.array [0] &= y.array [0];
1888       break;
1889     default:
1890       abort ();
1891     }
1892   return x;
1893 }
1894
1895 static INLINE i386_cpu_flags
1896 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1897 {
1898   switch (ARRAY_SIZE (x.array))
1899     {
1900     case 4:
1901       x.array [3] |= y.array [3];
1902       /* Fall through.  */
1903     case 3:
1904       x.array [2] |= y.array [2];
1905       /* Fall through.  */
1906     case 2:
1907       x.array [1] |= y.array [1];
1908       /* Fall through.  */
1909     case 1:
1910       x.array [0] |= y.array [0];
1911       break;
1912     default:
1913       abort ();
1914     }
1915   return x;
1916 }
1917
1918 static INLINE i386_cpu_flags
1919 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1920 {
1921   switch (ARRAY_SIZE (x.array))
1922     {
1923     case 4:
1924       x.array [3] &= ~y.array [3];
1925       /* Fall through.  */
1926     case 3:
1927       x.array [2] &= ~y.array [2];
1928       /* Fall through.  */
1929     case 2:
1930       x.array [1] &= ~y.array [1];
1931       /* Fall through.  */
1932     case 1:
1933       x.array [0] &= ~y.array [0];
1934       break;
1935     default:
1936       abort ();
1937     }
1938   return x;
1939 }
1940
1941 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
1942
1943 #define CPU_FLAGS_ARCH_MATCH            0x1
1944 #define CPU_FLAGS_64BIT_MATCH           0x2
1945
1946 #define CPU_FLAGS_PERFECT_MATCH \
1947   (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1948
1949 /* Return CPU flags match bits. */
1950
1951 static int
1952 cpu_flags_match (const insn_template *t)
1953 {
1954   i386_cpu_flags x = t->cpu_flags;
1955   int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1956
1957   x.bitfield.cpu64 = 0;
1958   x.bitfield.cpuno64 = 0;
1959
1960   if (cpu_flags_all_zero (&x))
1961     {
1962       /* This instruction is available on all archs.  */
1963       match |= CPU_FLAGS_ARCH_MATCH;
1964     }
1965   else
1966     {
1967       /* This instruction is available only on some archs.  */
1968       i386_cpu_flags cpu = cpu_arch_flags;
1969
1970       /* AVX512VL is no standalone feature - match it and then strip it.  */
1971       if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1972         return match;
1973       x.bitfield.cpuavx512vl = 0;
1974
1975       cpu = cpu_flags_and (x, cpu);
1976       if (!cpu_flags_all_zero (&cpu))
1977         {
1978           if (x.bitfield.cpuavx)
1979             {
1980               /* We need to check a few extra flags with AVX.  */
1981               if (cpu.bitfield.cpuavx
1982                   && (!t->opcode_modifier.sse2avx
1983                       || (sse2avx && !i.prefix[DATA_PREFIX]))
1984                   && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1985                   && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1986                   && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1987                 match |= CPU_FLAGS_ARCH_MATCH;
1988             }
1989           else if (x.bitfield.cpuavx512f)
1990             {
1991               /* We need to check a few extra flags with AVX512F.  */
1992               if (cpu.bitfield.cpuavx512f
1993                   && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1994                   && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1995                   && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1996                 match |= CPU_FLAGS_ARCH_MATCH;
1997             }
1998           else
1999             match |= CPU_FLAGS_ARCH_MATCH;
2000         }
2001     }
2002   return match;
2003 }
2004
2005 static INLINE i386_operand_type
2006 operand_type_and (i386_operand_type x, i386_operand_type y)
2007 {
2008   if (x.bitfield.class != y.bitfield.class)
2009     x.bitfield.class = ClassNone;
2010   if (x.bitfield.instance != y.bitfield.instance)
2011     x.bitfield.instance = InstanceNone;
2012
2013   switch (ARRAY_SIZE (x.array))
2014     {
2015     case 3:
2016       x.array [2] &= y.array [2];
2017       /* Fall through.  */
2018     case 2:
2019       x.array [1] &= y.array [1];
2020       /* Fall through.  */
2021     case 1:
2022       x.array [0] &= y.array [0];
2023       break;
2024     default:
2025       abort ();
2026     }
2027   return x;
2028 }
2029
2030 static INLINE i386_operand_type
2031 operand_type_and_not (i386_operand_type x, i386_operand_type y)
2032 {
2033   gas_assert (y.bitfield.class == ClassNone);
2034   gas_assert (y.bitfield.instance == InstanceNone);
2035
2036   switch (ARRAY_SIZE (x.array))
2037     {
2038     case 3:
2039       x.array [2] &= ~y.array [2];
2040       /* Fall through.  */
2041     case 2:
2042       x.array [1] &= ~y.array [1];
2043       /* Fall through.  */
2044     case 1:
2045       x.array [0] &= ~y.array [0];
2046       break;
2047     default:
2048       abort ();
2049     }
2050   return x;
2051 }
2052
2053 static INLINE i386_operand_type
2054 operand_type_or (i386_operand_type x, i386_operand_type y)
2055 {
2056   gas_assert (x.bitfield.class == ClassNone ||
2057               y.bitfield.class == ClassNone ||
2058               x.bitfield.class == y.bitfield.class);
2059   gas_assert (x.bitfield.instance == InstanceNone ||
2060               y.bitfield.instance == InstanceNone ||
2061               x.bitfield.instance == y.bitfield.instance);
2062
2063   switch (ARRAY_SIZE (x.array))
2064     {
2065     case 3:
2066       x.array [2] |= y.array [2];
2067       /* Fall through.  */
2068     case 2:
2069       x.array [1] |= y.array [1];
2070       /* Fall through.  */
2071     case 1:
2072       x.array [0] |= y.array [0];
2073       break;
2074     default:
2075       abort ();
2076     }
2077   return x;
2078 }
2079
2080 static INLINE i386_operand_type
2081 operand_type_xor (i386_operand_type x, i386_operand_type y)
2082 {
2083   gas_assert (y.bitfield.class == ClassNone);
2084   gas_assert (y.bitfield.instance == InstanceNone);
2085
2086   switch (ARRAY_SIZE (x.array))
2087     {
2088     case 3:
2089       x.array [2] ^= y.array [2];
2090       /* Fall through.  */
2091     case 2:
2092       x.array [1] ^= y.array [1];
2093       /* Fall through.  */
2094     case 1:
2095       x.array [0] ^= y.array [0];
2096       break;
2097     default:
2098       abort ();
2099     }
2100   return x;
2101 }
2102
2103 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
2104 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
2105 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
2106 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
2107 static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
2108 static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
2109 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
2110 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
2111 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
2112 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
2113 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
2114 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
2115 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
2116 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
2117 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
2118 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
2119 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
2120
2121 enum operand_type
2122 {
2123   reg,
2124   imm,
2125   disp,
2126   anymem
2127 };
2128
2129 static INLINE int
2130 operand_type_check (i386_operand_type t, enum operand_type c)
2131 {
2132   switch (c)
2133     {
2134     case reg:
2135       return t.bitfield.class == Reg;
2136
2137     case imm:
2138       return (t.bitfield.imm8
2139               || t.bitfield.imm8s
2140               || t.bitfield.imm16
2141               || t.bitfield.imm32
2142               || t.bitfield.imm32s
2143               || t.bitfield.imm64);
2144
2145     case disp:
2146       return (t.bitfield.disp8
2147               || t.bitfield.disp16
2148               || t.bitfield.disp32
2149               || t.bitfield.disp32s
2150               || t.bitfield.disp64);
2151
2152     case anymem:
2153       return (t.bitfield.disp8
2154               || t.bitfield.disp16
2155               || t.bitfield.disp32
2156               || t.bitfield.disp32s
2157               || t.bitfield.disp64
2158               || t.bitfield.baseindex);
2159
2160     default:
2161       abort ();
2162     }
2163
2164   return 0;
2165 }
2166
2167 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2168    between operand GIVEN and opeand WANTED for instruction template T.  */
2169
2170 static INLINE int
2171 match_operand_size (const insn_template *t, unsigned int wanted,
2172                     unsigned int given)
2173 {
2174   return !((i.types[given].bitfield.byte
2175             && !t->operand_types[wanted].bitfield.byte)
2176            || (i.types[given].bitfield.word
2177                && !t->operand_types[wanted].bitfield.word)
2178            || (i.types[given].bitfield.dword
2179                && !t->operand_types[wanted].bitfield.dword)
2180            || (i.types[given].bitfield.qword
2181                && !t->operand_types[wanted].bitfield.qword)
2182            || (i.types[given].bitfield.tbyte
2183                && !t->operand_types[wanted].bitfield.tbyte));
2184 }
2185
2186 /* Return 1 if there is no conflict in SIMD register between operand
2187    GIVEN and opeand WANTED for instruction template T.  */
2188
2189 static INLINE int
2190 match_simd_size (const insn_template *t, unsigned int wanted,
2191                  unsigned int given)
2192 {
2193   return !((i.types[given].bitfield.xmmword
2194             && !t->operand_types[wanted].bitfield.xmmword)
2195            || (i.types[given].bitfield.ymmword
2196                && !t->operand_types[wanted].bitfield.ymmword)
2197            || (i.types[given].bitfield.zmmword
2198                && !t->operand_types[wanted].bitfield.zmmword)
2199            || (i.types[given].bitfield.tmmword
2200                && !t->operand_types[wanted].bitfield.tmmword));
2201 }
2202
2203 /* Return 1 if there is no conflict in any size between operand GIVEN
2204    and opeand WANTED for instruction template T.  */
2205
2206 static INLINE int
2207 match_mem_size (const insn_template *t, unsigned int wanted,
2208                 unsigned int given)
2209 {
2210   return (match_operand_size (t, wanted, given)
2211           && !((i.types[given].bitfield.unspecified
2212                 && !i.broadcast
2213                 && !t->operand_types[wanted].bitfield.unspecified)
2214                || (i.types[given].bitfield.fword
2215                    && !t->operand_types[wanted].bitfield.fword)
2216                /* For scalar opcode templates to allow register and memory
2217                   operands at the same time, some special casing is needed
2218                   here.  Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2219                   down-conversion vpmov*.  */
2220                || ((t->operand_types[wanted].bitfield.class == RegSIMD
2221                     && t->operand_types[wanted].bitfield.byte
2222                        + t->operand_types[wanted].bitfield.word
2223                        + t->operand_types[wanted].bitfield.dword
2224                        + t->operand_types[wanted].bitfield.qword
2225                        > !!t->opcode_modifier.broadcast)
2226                    ? (i.types[given].bitfield.xmmword
2227                       || i.types[given].bitfield.ymmword
2228                       || i.types[given].bitfield.zmmword)
2229                    : !match_simd_size(t, wanted, given))));
2230 }
2231
2232 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2233    operands for instruction template T, and it has MATCH_REVERSE set if there
2234    is no size conflict on any operands for the template with operands reversed
2235    (and the template allows for reversing in the first place).  */
2236
2237 #define MATCH_STRAIGHT 1
2238 #define MATCH_REVERSE  2
2239
2240 static INLINE unsigned int
2241 operand_size_match (const insn_template *t)
2242 {
2243   unsigned int j, match = MATCH_STRAIGHT;
2244
2245   /* Don't check non-absolute jump instructions.  */
2246   if (t->opcode_modifier.jump
2247       && t->opcode_modifier.jump != JUMP_ABSOLUTE)
2248     return match;
2249
2250   /* Check memory and accumulator operand size.  */
2251   for (j = 0; j < i.operands; j++)
2252     {
2253       if (i.types[j].bitfield.class != Reg
2254           && i.types[j].bitfield.class != RegSIMD
2255           && t->opcode_modifier.anysize)
2256         continue;
2257
2258       if (t->operand_types[j].bitfield.class == Reg
2259           && !match_operand_size (t, j, j))
2260         {
2261           match = 0;
2262           break;
2263         }
2264
2265       if (t->operand_types[j].bitfield.class == RegSIMD
2266           && !match_simd_size (t, j, j))
2267         {
2268           match = 0;
2269           break;
2270         }
2271
2272       if (t->operand_types[j].bitfield.instance == Accum
2273           && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2274         {
2275           match = 0;
2276           break;
2277         }
2278
2279       if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2280         {
2281           match = 0;
2282           break;
2283         }
2284     }
2285
2286   if (!t->opcode_modifier.d)
2287     {
2288     mismatch:
2289       if (!match)
2290         i.error = operand_size_mismatch;
2291       return match;
2292     }
2293
2294   /* Check reverse.  */
2295   gas_assert (i.operands >= 2 && i.operands <= 3);
2296
2297   for (j = 0; j < i.operands; j++)
2298     {
2299       unsigned int given = i.operands - j - 1;
2300
2301       if (t->operand_types[j].bitfield.class == Reg
2302           && !match_operand_size (t, j, given))
2303         goto mismatch;
2304
2305       if (t->operand_types[j].bitfield.class == RegSIMD
2306           && !match_simd_size (t, j, given))
2307         goto mismatch;
2308
2309       if (t->operand_types[j].bitfield.instance == Accum
2310           && (!match_operand_size (t, j, given)
2311               || !match_simd_size (t, j, given)))
2312         goto mismatch;
2313
2314       if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2315         goto mismatch;
2316     }
2317
2318   return match | MATCH_REVERSE;
2319 }
2320
2321 static INLINE int
2322 operand_type_match (i386_operand_type overlap,
2323                     i386_operand_type given)
2324 {
2325   i386_operand_type temp = overlap;
2326
2327   temp.bitfield.unspecified = 0;
2328   temp.bitfield.byte = 0;
2329   temp.bitfield.word = 0;
2330   temp.bitfield.dword = 0;
2331   temp.bitfield.fword = 0;
2332   temp.bitfield.qword = 0;
2333   temp.bitfield.tbyte = 0;
2334   temp.bitfield.xmmword = 0;
2335   temp.bitfield.ymmword = 0;
2336   temp.bitfield.zmmword = 0;
2337   temp.bitfield.tmmword = 0;
2338   if (operand_type_all_zero (&temp))
2339     goto mismatch;
2340
2341   if (given.bitfield.baseindex == overlap.bitfield.baseindex)
2342     return 1;
2343
2344  mismatch:
2345   i.error = operand_type_mismatch;
2346   return 0;
2347 }
2348
2349 /* If given types g0 and g1 are registers they must be of the same type
2350    unless the expected operand type register overlap is null.
2351    Some Intel syntax memory operand size checking also happens here.  */
2352
2353 static INLINE int
2354 operand_type_register_match (i386_operand_type g0,
2355                              i386_operand_type t0,
2356                              i386_operand_type g1,
2357                              i386_operand_type t1)
2358 {
2359   if (g0.bitfield.class != Reg
2360       && g0.bitfield.class != RegSIMD
2361       && (!operand_type_check (g0, anymem)
2362           || g0.bitfield.unspecified
2363           || (t0.bitfield.class != Reg
2364               && t0.bitfield.class != RegSIMD)))
2365     return 1;
2366
2367   if (g1.bitfield.class != Reg
2368       && g1.bitfield.class != RegSIMD
2369       && (!operand_type_check (g1, anymem)
2370           || g1.bitfield.unspecified
2371           || (t1.bitfield.class != Reg
2372               && t1.bitfield.class != RegSIMD)))
2373     return 1;
2374
2375   if (g0.bitfield.byte == g1.bitfield.byte
2376       && g0.bitfield.word == g1.bitfield.word
2377       && g0.bitfield.dword == g1.bitfield.dword
2378       && g0.bitfield.qword == g1.bitfield.qword
2379       && g0.bitfield.xmmword == g1.bitfield.xmmword
2380       && g0.bitfield.ymmword == g1.bitfield.ymmword
2381       && g0.bitfield.zmmword == g1.bitfield.zmmword)
2382     return 1;
2383
2384   if (!(t0.bitfield.byte & t1.bitfield.byte)
2385       && !(t0.bitfield.word & t1.bitfield.word)
2386       && !(t0.bitfield.dword & t1.bitfield.dword)
2387       && !(t0.bitfield.qword & t1.bitfield.qword)
2388       && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2389       && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2390       && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2391     return 1;
2392
2393   i.error = register_type_mismatch;
2394
2395   return 0;
2396 }
2397
2398 static INLINE unsigned int
2399 register_number (const reg_entry *r)
2400 {
2401   unsigned int nr = r->reg_num;
2402
2403   if (r->reg_flags & RegRex)
2404     nr += 8;
2405
2406   if (r->reg_flags & RegVRex)
2407     nr += 16;
2408
2409   return nr;
2410 }
2411
2412 static INLINE unsigned int
2413 mode_from_disp_size (i386_operand_type t)
2414 {
2415   if (t.bitfield.disp8)
2416     return 1;
2417   else if (t.bitfield.disp16
2418            || t.bitfield.disp32
2419            || t.bitfield.disp32s)
2420     return 2;
2421   else
2422     return 0;
2423 }
2424
2425 static INLINE int
2426 fits_in_signed_byte (addressT num)
2427 {
2428   return num + 0x80 <= 0xff;
2429 }
2430
2431 static INLINE int
2432 fits_in_unsigned_byte (addressT num)
2433 {
2434   return num <= 0xff;
2435 }
2436
2437 static INLINE int
2438 fits_in_unsigned_word (addressT num)
2439 {
2440   return num <= 0xffff;
2441 }
2442
2443 static INLINE int
2444 fits_in_signed_word (addressT num)
2445 {
2446   return num + 0x8000 <= 0xffff;
2447 }
2448
2449 static INLINE int
2450 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2451 {
2452 #ifndef BFD64
2453   return 1;
2454 #else
2455   return num + 0x80000000 <= 0xffffffff;
2456 #endif
2457 }                               /* fits_in_signed_long() */
2458
2459 static INLINE int
2460 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2461 {
2462 #ifndef BFD64
2463   return 1;
2464 #else
2465   return num <= 0xffffffff;
2466 #endif
2467 }                               /* fits_in_unsigned_long() */
2468
2469 static INLINE int
2470 fits_in_disp8 (offsetT num)
2471 {
2472   int shift = i.memshift;
2473   unsigned int mask;
2474
2475   if (shift == -1)
2476     abort ();
2477
2478   mask = (1 << shift) - 1;
2479
2480   /* Return 0 if NUM isn't properly aligned.  */
2481   if ((num & mask))
2482     return 0;
2483
2484   /* Check if NUM will fit in 8bit after shift.  */
2485   return fits_in_signed_byte (num >> shift);
2486 }
2487
2488 static INLINE int
2489 fits_in_imm4 (offsetT num)
2490 {
2491   return (num & 0xf) == num;
2492 }
2493
2494 static i386_operand_type
2495 smallest_imm_type (offsetT num)
2496 {
2497   i386_operand_type t;
2498
2499   operand_type_set (&t, 0);
2500   t.bitfield.imm64 = 1;
2501
2502   if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2503     {
2504       /* This code is disabled on the 486 because all the Imm1 forms
2505          in the opcode table are slower on the i486.  They're the
2506          versions with the implicitly specified single-position
2507          displacement, which has another syntax if you really want to
2508          use that form.  */
2509       t.bitfield.imm1 = 1;
2510       t.bitfield.imm8 = 1;
2511       t.bitfield.imm8s = 1;
2512       t.bitfield.imm16 = 1;
2513       t.bitfield.imm32 = 1;
2514       t.bitfield.imm32s = 1;
2515     }
2516   else if (fits_in_signed_byte (num))
2517     {
2518       t.bitfield.imm8 = 1;
2519       t.bitfield.imm8s = 1;
2520       t.bitfield.imm16 = 1;
2521       t.bitfield.imm32 = 1;
2522       t.bitfield.imm32s = 1;
2523     }
2524   else if (fits_in_unsigned_byte (num))
2525     {
2526       t.bitfield.imm8 = 1;
2527       t.bitfield.imm16 = 1;
2528       t.bitfield.imm32 = 1;
2529       t.bitfield.imm32s = 1;
2530     }
2531   else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2532     {
2533       t.bitfield.imm16 = 1;
2534       t.bitfield.imm32 = 1;
2535       t.bitfield.imm32s = 1;
2536     }
2537   else if (fits_in_signed_long (num))
2538     {
2539       t.bitfield.imm32 = 1;
2540       t.bitfield.imm32s = 1;
2541     }
2542   else if (fits_in_unsigned_long (num))
2543     t.bitfield.imm32 = 1;
2544
2545   return t;
2546 }
2547
2548 static offsetT
2549 offset_in_range (offsetT val, int size)
2550 {
2551   addressT mask;
2552
2553   switch (size)
2554     {
2555     case 1: mask = ((addressT) 1 <<  8) - 1; break;
2556     case 2: mask = ((addressT) 1 << 16) - 1; break;
2557     case 4: mask = ((addressT) 2 << 31) - 1; break;
2558 #ifdef BFD64
2559     case 8: mask = ((addressT) 2 << 63) - 1; break;
2560 #endif
2561     default: abort ();
2562     }
2563
2564   if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2565     {
2566       char buf1[40], buf2[40];
2567
2568       sprint_value (buf1, val);
2569       sprint_value (buf2, val & mask);
2570       as_warn (_("%s shortened to %s"), buf1, buf2);
2571     }
2572   return val & mask;
2573 }
2574
2575 enum PREFIX_GROUP
2576 {
2577   PREFIX_EXIST = 0,
2578   PREFIX_LOCK,
2579   PREFIX_REP,
2580   PREFIX_DS,
2581   PREFIX_OTHER
2582 };
2583
2584 /* Returns
2585    a. PREFIX_EXIST if attempting to add a prefix where one from the
2586    same class already exists.
2587    b. PREFIX_LOCK if lock prefix is added.
2588    c. PREFIX_REP if rep/repne prefix is added.
2589    d. PREFIX_DS if ds prefix is added.
2590    e. PREFIX_OTHER if other prefix is added.
2591  */
2592
2593 static enum PREFIX_GROUP
2594 add_prefix (unsigned int prefix)
2595 {
2596   enum PREFIX_GROUP ret = PREFIX_OTHER;
2597   unsigned int q;
2598
2599   if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2600       && flag_code == CODE_64BIT)
2601     {
2602       if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2603           || (i.prefix[REX_PREFIX] & prefix & REX_R)
2604           || (i.prefix[REX_PREFIX] & prefix & REX_X)
2605           || (i.prefix[REX_PREFIX] & prefix & REX_B))
2606         ret = PREFIX_EXIST;
2607       q = REX_PREFIX;
2608     }
2609   else
2610     {
2611       switch (prefix)
2612         {
2613         default:
2614           abort ();
2615
2616         case DS_PREFIX_OPCODE:
2617           ret = PREFIX_DS;
2618           /* Fall through.  */
2619         case CS_PREFIX_OPCODE:
2620         case ES_PREFIX_OPCODE:
2621         case FS_PREFIX_OPCODE:
2622         case GS_PREFIX_OPCODE:
2623         case SS_PREFIX_OPCODE:
2624           q = SEG_PREFIX;
2625           break;
2626
2627         case REPNE_PREFIX_OPCODE:
2628         case REPE_PREFIX_OPCODE:
2629           q = REP_PREFIX;
2630           ret = PREFIX_REP;
2631           break;
2632
2633         case LOCK_PREFIX_OPCODE:
2634           q = LOCK_PREFIX;
2635           ret = PREFIX_LOCK;
2636           break;
2637
2638         case FWAIT_OPCODE:
2639           q = WAIT_PREFIX;
2640           break;
2641
2642         case ADDR_PREFIX_OPCODE:
2643           q = ADDR_PREFIX;
2644           break;
2645
2646         case DATA_PREFIX_OPCODE:
2647           q = DATA_PREFIX;
2648           break;
2649         }
2650       if (i.prefix[q] != 0)
2651         ret = PREFIX_EXIST;
2652     }
2653
2654   if (ret)
2655     {
2656       if (!i.prefix[q])
2657         ++i.prefixes;
2658       i.prefix[q] |= prefix;
2659     }
2660   else
2661     as_bad (_("same type of prefix used twice"));
2662
2663   return ret;
2664 }
2665
2666 static void
2667 update_code_flag (int value, int check)
2668 {
2669   PRINTF_LIKE ((*as_error));
2670
2671   flag_code = (enum flag_code) value;
2672   if (flag_code == CODE_64BIT)
2673     {
2674       cpu_arch_flags.bitfield.cpu64 = 1;
2675       cpu_arch_flags.bitfield.cpuno64 = 0;
2676     }
2677   else
2678     {
2679       cpu_arch_flags.bitfield.cpu64 = 0;
2680       cpu_arch_flags.bitfield.cpuno64 = 1;
2681     }
2682   if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
2683     {
2684       if (check)
2685         as_error = as_fatal;
2686       else
2687         as_error = as_bad;
2688       (*as_error) (_("64bit mode not supported on `%s'."),
2689                    cpu_arch_name ? cpu_arch_name : default_arch);
2690     }
2691   if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2692     {
2693       if (check)
2694         as_error = as_fatal;
2695       else
2696         as_error = as_bad;
2697       (*as_error) (_("32bit mode not supported on `%s'."),
2698                    cpu_arch_name ? cpu_arch_name : default_arch);
2699     }
2700   stackop_size = '\0';
2701 }
2702
2703 static void
2704 set_code_flag (int value)
2705 {
2706   update_code_flag (value, 0);
2707 }
2708
2709 static void
2710 set_16bit_gcc_code_flag (int new_code_flag)
2711 {
2712   flag_code = (enum flag_code) new_code_flag;
2713   if (flag_code != CODE_16BIT)
2714     abort ();
2715   cpu_arch_flags.bitfield.cpu64 = 0;
2716   cpu_arch_flags.bitfield.cpuno64 = 1;
2717   stackop_size = LONG_MNEM_SUFFIX;
2718 }
2719
2720 static void
2721 set_intel_syntax (int syntax_flag)
2722 {
2723   /* Find out if register prefixing is specified.  */
2724   int ask_naked_reg = 0;
2725
2726   SKIP_WHITESPACE ();
2727   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2728     {
2729       char *string;
2730       int e = get_symbol_name (&string);
2731
2732       if (strcmp (string, "prefix") == 0)
2733         ask_naked_reg = 1;
2734       else if (strcmp (string, "noprefix") == 0)
2735         ask_naked_reg = -1;
2736       else
2737         as_bad (_("bad argument to syntax directive."));
2738       (void) restore_line_pointer (e);
2739     }
2740   demand_empty_rest_of_line ();
2741
2742   intel_syntax = syntax_flag;
2743
2744   if (ask_naked_reg == 0)
2745     allow_naked_reg = (intel_syntax
2746                        && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2747   else
2748     allow_naked_reg = (ask_naked_reg < 0);
2749
2750   expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2751
2752   identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2753   identifier_chars['$'] = intel_syntax ? '$' : 0;
2754   register_prefix = allow_naked_reg ? "" : "%";
2755 }
2756
2757 static void
2758 set_intel_mnemonic (int mnemonic_flag)
2759 {
2760   intel_mnemonic = mnemonic_flag;
2761 }
2762
2763 static void
2764 set_allow_index_reg (int flag)
2765 {
2766   allow_index_reg = flag;
2767 }
2768
2769 static void
2770 set_check (int what)
2771 {
2772   enum check_kind *kind;
2773   const char *str;
2774
2775   if (what)
2776     {
2777       kind = &operand_check;
2778       str = "operand";
2779     }
2780   else
2781     {
2782       kind = &sse_check;
2783       str = "sse";
2784     }
2785
2786   SKIP_WHITESPACE ();
2787
2788   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2789     {
2790       char *string;
2791       int e = get_symbol_name (&string);
2792
2793       if (strcmp (string, "none") == 0)
2794         *kind = check_none;
2795       else if (strcmp (string, "warning") == 0)
2796         *kind = check_warning;
2797       else if (strcmp (string, "error") == 0)
2798         *kind = check_error;
2799       else
2800         as_bad (_("bad argument to %s_check directive."), str);
2801       (void) restore_line_pointer (e);
2802     }
2803   else
2804     as_bad (_("missing argument for %s_check directive"), str);
2805
2806   demand_empty_rest_of_line ();
2807 }
2808
2809 static void
2810 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2811                            i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2812 {
2813 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2814   static const char *arch;
2815
2816   /* Intel LIOM is only supported on ELF.  */
2817   if (!IS_ELF)
2818     return;
2819
2820   if (!arch)
2821     {
2822       /* Use cpu_arch_name if it is set in md_parse_option.  Otherwise
2823          use default_arch.  */
2824       arch = cpu_arch_name;
2825       if (!arch)
2826         arch = default_arch;
2827     }
2828
2829   /* If we are targeting Intel MCU, we must enable it.  */
2830   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2831       || new_flag.bitfield.cpuiamcu)
2832     return;
2833
2834   /* If we are targeting Intel L1OM, we must enable it.  */
2835   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2836       || new_flag.bitfield.cpul1om)
2837     return;
2838
2839   /* If we are targeting Intel K1OM, we must enable it.  */
2840   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2841       || new_flag.bitfield.cpuk1om)
2842     return;
2843
2844   as_bad (_("`%s' is not supported on `%s'"), name, arch);
2845 #endif
2846 }
2847
2848 static void
2849 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2850 {
2851   SKIP_WHITESPACE ();
2852
2853   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2854     {
2855       char *string;
2856       int e = get_symbol_name (&string);
2857       unsigned int j;
2858       i386_cpu_flags flags;
2859
2860       for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2861         {
2862           if (strcmp (string, cpu_arch[j].name) == 0)
2863             {
2864               check_cpu_arch_compatible (string, cpu_arch[j].flags);
2865
2866               if (*string != '.')
2867                 {
2868                   cpu_arch_name = cpu_arch[j].name;
2869                   cpu_sub_arch_name = NULL;
2870                   cpu_arch_flags = cpu_arch[j].flags;
2871                   if (flag_code == CODE_64BIT)
2872                     {
2873                       cpu_arch_flags.bitfield.cpu64 = 1;
2874                       cpu_arch_flags.bitfield.cpuno64 = 0;
2875                     }
2876                   else
2877                     {
2878                       cpu_arch_flags.bitfield.cpu64 = 0;
2879                       cpu_arch_flags.bitfield.cpuno64 = 1;
2880                     }
2881                   cpu_arch_isa = cpu_arch[j].type;
2882                   cpu_arch_isa_flags = cpu_arch[j].flags;
2883                   if (!cpu_arch_tune_set)
2884                     {
2885                       cpu_arch_tune = cpu_arch_isa;
2886                       cpu_arch_tune_flags = cpu_arch_isa_flags;
2887                     }
2888                   break;
2889                 }
2890
2891               flags = cpu_flags_or (cpu_arch_flags,
2892                                     cpu_arch[j].flags);
2893
2894               if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2895                 {
2896                   if (cpu_sub_arch_name)
2897                     {
2898                       char *name = cpu_sub_arch_name;
2899                       cpu_sub_arch_name = concat (name,
2900                                                   cpu_arch[j].name,
2901                                                   (const char *) NULL);
2902                       free (name);
2903                     }
2904                   else
2905                     cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2906                   cpu_arch_flags = flags;
2907                   cpu_arch_isa_flags = flags;
2908                 }
2909               else
2910                 cpu_arch_isa_flags
2911                   = cpu_flags_or (cpu_arch_isa_flags,
2912                                   cpu_arch[j].flags);
2913               (void) restore_line_pointer (e);
2914               demand_empty_rest_of_line ();
2915               return;
2916             }
2917         }
2918
2919       if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2920         {
2921           /* Disable an ISA extension.  */
2922           for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2923             if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2924               {
2925                 flags = cpu_flags_and_not (cpu_arch_flags,
2926                                            cpu_noarch[j].flags);
2927                 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2928                   {
2929                     if (cpu_sub_arch_name)
2930                       {
2931                         char *name = cpu_sub_arch_name;
2932                         cpu_sub_arch_name = concat (name, string,
2933                                                     (const char *) NULL);
2934                         free (name);
2935                       }
2936                     else
2937                       cpu_sub_arch_name = xstrdup (string);
2938                     cpu_arch_flags = flags;
2939                     cpu_arch_isa_flags = flags;
2940                   }
2941                 (void) restore_line_pointer (e);
2942                 demand_empty_rest_of_line ();
2943                 return;
2944               }
2945
2946           j = ARRAY_SIZE (cpu_arch);
2947         }
2948
2949       if (j >= ARRAY_SIZE (cpu_arch))
2950         as_bad (_("no such architecture: `%s'"), string);
2951
2952       *input_line_pointer = e;
2953     }
2954   else
2955     as_bad (_("missing cpu architecture"));
2956
2957   no_cond_jump_promotion = 0;
2958   if (*input_line_pointer == ','
2959       && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2960     {
2961       char *string;
2962       char e;
2963
2964       ++input_line_pointer;
2965       e = get_symbol_name (&string);
2966
2967       if (strcmp (string, "nojumps") == 0)
2968         no_cond_jump_promotion = 1;
2969       else if (strcmp (string, "jumps") == 0)
2970         ;
2971       else
2972         as_bad (_("no such architecture modifier: `%s'"), string);
2973
2974       (void) restore_line_pointer (e);
2975     }
2976
2977   demand_empty_rest_of_line ();
2978 }
2979
2980 enum bfd_architecture
2981 i386_arch (void)
2982 {
2983   if (cpu_arch_isa == PROCESSOR_L1OM)
2984     {
2985       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2986           || flag_code != CODE_64BIT)
2987         as_fatal (_("Intel L1OM is 64bit ELF only"));
2988       return bfd_arch_l1om;
2989     }
2990   else if (cpu_arch_isa == PROCESSOR_K1OM)
2991     {
2992       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2993           || flag_code != CODE_64BIT)
2994         as_fatal (_("Intel K1OM is 64bit ELF only"));
2995       return bfd_arch_k1om;
2996     }
2997   else if (cpu_arch_isa == PROCESSOR_IAMCU)
2998     {
2999       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
3000           || flag_code == CODE_64BIT)
3001         as_fatal (_("Intel MCU is 32bit ELF only"));
3002       return bfd_arch_iamcu;
3003     }
3004   else
3005     return bfd_arch_i386;
3006 }
3007
3008 unsigned long
3009 i386_mach (void)
3010 {
3011   if (!strncmp (default_arch, "x86_64", 6))
3012     {
3013       if (cpu_arch_isa == PROCESSOR_L1OM)
3014         {
3015           if (OUTPUT_FLAVOR != bfd_target_elf_flavour
3016               || default_arch[6] != '\0')
3017             as_fatal (_("Intel L1OM is 64bit ELF only"));
3018           return bfd_mach_l1om;
3019         }
3020       else if (cpu_arch_isa == PROCESSOR_K1OM)
3021         {
3022           if (OUTPUT_FLAVOR != bfd_target_elf_flavour
3023               || default_arch[6] != '\0')
3024             as_fatal (_("Intel K1OM is 64bit ELF only"));
3025           return bfd_mach_k1om;
3026         }
3027       else if (default_arch[6] == '\0')
3028         return bfd_mach_x86_64;
3029       else
3030         return bfd_mach_x64_32;
3031     }
3032   else if (!strcmp (default_arch, "i386")
3033            || !strcmp (default_arch, "iamcu"))
3034     {
3035       if (cpu_arch_isa == PROCESSOR_IAMCU)
3036         {
3037           if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
3038             as_fatal (_("Intel MCU is 32bit ELF only"));
3039           return bfd_mach_i386_iamcu;
3040         }
3041       else
3042         return bfd_mach_i386_i386;
3043     }
3044   else
3045     as_fatal (_("unknown architecture"));
3046 }
3047 \f
3048 void
3049 md_begin (void)
3050 {
3051   /* Support pseudo prefixes like {disp32}.  */
3052   lex_type ['{'] = LEX_BEGIN_NAME;
3053
3054   /* Initialize op_hash hash table.  */
3055   op_hash = str_htab_create ();
3056
3057   {
3058     const insn_template *optab;
3059     templates *core_optab;
3060
3061     /* Setup for loop.  */
3062     optab = i386_optab;
3063     core_optab = XNEW (templates);
3064     core_optab->start = optab;
3065
3066     while (1)
3067       {
3068         ++optab;
3069         if (optab->name == NULL
3070             || strcmp (optab->name, (optab - 1)->name) != 0)
3071           {
3072             /* different name --> ship out current template list;
3073                add to hash table; & begin anew.  */
3074             core_optab->end = optab;
3075             if (str_hash_insert (op_hash, (optab - 1)->name, core_optab, 0))
3076               as_fatal (_("duplicate %s"), (optab - 1)->name);
3077
3078             if (optab->name == NULL)
3079               break;
3080             core_optab = XNEW (templates);
3081             core_optab->start = optab;
3082           }
3083       }
3084   }
3085
3086   /* Initialize reg_hash hash table.  */
3087   reg_hash = str_htab_create ();
3088   {
3089     const reg_entry *regtab;
3090     unsigned int regtab_size = i386_regtab_size;
3091
3092     for (regtab = i386_regtab; regtab_size--; regtab++)
3093       if (str_hash_insert (reg_hash, regtab->reg_name, regtab, 0) != NULL)
3094         as_fatal (_("duplicate %s"), regtab->reg_name);
3095   }
3096
3097   /* Fill in lexical tables:  mnemonic_chars, operand_chars.  */
3098   {
3099     int c;
3100     char *p;
3101
3102     for (c = 0; c < 256; c++)
3103       {
3104         if (ISDIGIT (c))
3105           {
3106             digit_chars[c] = c;
3107             mnemonic_chars[c] = c;
3108             register_chars[c] = c;
3109             operand_chars[c] = c;
3110           }
3111         else if (ISLOWER (c))
3112           {
3113             mnemonic_chars[c] = c;
3114             register_chars[c] = c;
3115             operand_chars[c] = c;
3116           }
3117         else if (ISUPPER (c))
3118           {
3119             mnemonic_chars[c] = TOLOWER (c);
3120             register_chars[c] = mnemonic_chars[c];
3121             operand_chars[c] = c;
3122           }
3123         else if (c == '{' || c == '}')
3124           {
3125             mnemonic_chars[c] = c;
3126             operand_chars[c] = c;
3127           }
3128 #ifdef SVR4_COMMENT_CHARS
3129         else if (c == '\\' && strchr (i386_comment_chars, '/'))
3130           operand_chars[c] = c;
3131 #endif
3132
3133         if (ISALPHA (c) || ISDIGIT (c))
3134           identifier_chars[c] = c;
3135         else if (c >= 128)
3136           {
3137             identifier_chars[c] = c;
3138             operand_chars[c] = c;
3139           }
3140       }
3141
3142 #ifdef LEX_AT
3143     identifier_chars['@'] = '@';
3144 #endif
3145 #ifdef LEX_QM
3146     identifier_chars['?'] = '?';
3147     operand_chars['?'] = '?';
3148 #endif
3149     digit_chars['-'] = '-';
3150     mnemonic_chars['_'] = '_';
3151     mnemonic_chars['-'] = '-';
3152     mnemonic_chars['.'] = '.';
3153     identifier_chars['_'] = '_';
3154     identifier_chars['.'] = '.';
3155
3156     for (p = operand_special_chars; *p != '\0'; p++)
3157       operand_chars[(unsigned char) *p] = *p;
3158   }
3159
3160   if (flag_code == CODE_64BIT)
3161     {
3162 #if defined (OBJ_COFF) && defined (TE_PE)
3163       x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3164                                   ? 32 : 16);
3165 #else
3166       x86_dwarf2_return_column = 16;
3167 #endif
3168       x86_cie_data_alignment = -8;
3169     }
3170   else
3171     {
3172       x86_dwarf2_return_column = 8;
3173       x86_cie_data_alignment = -4;
3174     }
3175
3176   /* NB: FUSED_JCC_PADDING frag must have sufficient room so that it
3177      can be turned into BRANCH_PREFIX frag.  */
3178   if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3179     abort ();
3180 }
3181
3182 void
3183 i386_print_statistics (FILE *file)
3184 {
3185   htab_print_statistics (file, "i386 opcode", op_hash);
3186   htab_print_statistics (file, "i386 register", reg_hash);
3187 }
3188 \f
3189 #ifdef DEBUG386
3190
3191 /* Debugging routines for md_assemble.  */
3192 static void pte (insn_template *);
3193 static void pt (i386_operand_type);
3194 static void pe (expressionS *);
3195 static void ps (symbolS *);
3196
3197 static void
3198 pi (const char *line, i386_insn *x)
3199 {
3200   unsigned int j;
3201
3202   fprintf (stdout, "%s: template ", line);
3203   pte (&x->tm);
3204   fprintf (stdout, "  address: base %s  index %s  scale %x\n",
3205            x->base_reg ? x->base_reg->reg_name : "none",
3206            x->index_reg ? x->index_reg->reg_name : "none",
3207            x->log2_scale_factor);
3208   fprintf (stdout, "  modrm:  mode %x  reg %x  reg/mem %x\n",
3209            x->rm.mode, x->rm.reg, x->rm.regmem);
3210   fprintf (stdout, "  sib:  base %x  index %x  scale %x\n",
3211            x->sib.base, x->sib.index, x->sib.scale);
3212   fprintf (stdout, "  rex: 64bit %x  extX %x  extY %x  extZ %x\n",
3213            (x->rex & REX_W) != 0,
3214            (x->rex & REX_R) != 0,
3215            (x->rex & REX_X) != 0,
3216            (x->rex & REX_B) != 0);
3217   for (j = 0; j < x->operands; j++)
3218     {
3219       fprintf (stdout, "    #%d:  ", j + 1);
3220       pt (x->types[j]);
3221       fprintf (stdout, "\n");
3222       if (x->types[j].bitfield.class == Reg
3223           || x->types[j].bitfield.class == RegMMX
3224           || x->types[j].bitfield.class == RegSIMD
3225           || x->types[j].bitfield.class == RegMask
3226           || x->types[j].bitfield.class == SReg
3227           || x->types[j].bitfield.class == RegCR
3228           || x->types[j].bitfield.class == RegDR
3229           || x->types[j].bitfield.class == RegTR
3230           || x->types[j].bitfield.class == RegBND)
3231         fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3232       if (operand_type_check (x->types[j], imm))
3233         pe (x->op[j].imms);
3234       if (operand_type_check (x->types[j], disp))
3235         pe (x->op[j].disps);
3236     }
3237 }
3238
3239 static void
3240 pte (insn_template *t)
3241 {
3242   static const unsigned char opc_pfx[] = { 0, 0x66, 0xf3, 0xf2 };
3243   static const char *const opc_spc[] = {
3244     NULL, "0f", "0f38", "0f3a", NULL, NULL, NULL, NULL,
3245     "XOP08", "XOP09", "XOP0A",
3246   };
3247   unsigned int j;
3248
3249   fprintf (stdout, " %d operands ", t->operands);
3250   if (opc_pfx[t->opcode_modifier.opcodeprefix])
3251     fprintf (stdout, "pfx %x ", opc_pfx[t->opcode_modifier.opcodeprefix]);
3252   if (opc_spc[t->opcode_modifier.opcodespace])
3253     fprintf (stdout, "space %s ", opc_spc[t->opcode_modifier.opcodespace]);
3254   fprintf (stdout, "opcode %x ", t->base_opcode);
3255   if (t->extension_opcode != None)
3256     fprintf (stdout, "ext %x ", t->extension_opcode);
3257   if (t->opcode_modifier.d)
3258     fprintf (stdout, "D");
3259   if (t->opcode_modifier.w)
3260     fprintf (stdout, "W");
3261   fprintf (stdout, "\n");
3262   for (j = 0; j < t->operands; j++)
3263     {
3264       fprintf (stdout, "    #%d type ", j + 1);
3265       pt (t->operand_types[j]);
3266       fprintf (stdout, "\n");
3267     }
3268 }
3269
3270 static void
3271 pe (expressionS *e)
3272 {
3273   fprintf (stdout, "    operation     %d\n", e->X_op);
3274   fprintf (stdout, "    add_number    %ld (%lx)\n",
3275            (long) e->X_add_number, (long) e->X_add_number);
3276   if (e->X_add_symbol)
3277     {
3278       fprintf (stdout, "    add_symbol    ");
3279       ps (e->X_add_symbol);
3280       fprintf (stdout, "\n");
3281     }
3282   if (e->X_op_symbol)
3283     {
3284       fprintf (stdout, "    op_symbol    ");
3285       ps (e->X_op_symbol);
3286       fprintf (stdout, "\n");
3287     }
3288 }
3289
3290 static void
3291 ps (symbolS *s)
3292 {
3293   fprintf (stdout, "%s type %s%s",
3294            S_GET_NAME (s),
3295            S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3296            segment_name (S_GET_SEGMENT (s)));
3297 }
3298
3299 static struct type_name
3300   {
3301     i386_operand_type mask;
3302     const char *name;
3303   }
3304 const type_names[] =
3305 {
3306   { OPERAND_TYPE_REG8, "r8" },
3307   { OPERAND_TYPE_REG16, "r16" },
3308   { OPERAND_TYPE_REG32, "r32" },
3309   { OPERAND_TYPE_REG64, "r64" },
3310   { OPERAND_TYPE_ACC8, "acc8" },
3311   { OPERAND_TYPE_ACC16, "acc16" },
3312   { OPERAND_TYPE_ACC32, "acc32" },
3313   { OPERAND_TYPE_ACC64, "acc64" },
3314   { OPERAND_TYPE_IMM8, "i8" },
3315   { OPERAND_TYPE_IMM8, "i8s" },
3316   { OPERAND_TYPE_IMM16, "i16" },
3317   { OPERAND_TYPE_IMM32, "i32" },
3318   { OPERAND_TYPE_IMM32S, "i32s" },
3319   { OPERAND_TYPE_IMM64, "i64" },
3320   { OPERAND_TYPE_IMM1, "i1" },
3321   { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3322   { OPERAND_TYPE_DISP8, "d8" },
3323   { OPERAND_TYPE_DISP16, "d16" },
3324   { OPERAND_TYPE_DISP32, "d32" },
3325   { OPERAND_TYPE_DISP32S, "d32s" },
3326   { OPERAND_TYPE_DISP64, "d64" },
3327   { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3328   { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3329   { OPERAND_TYPE_CONTROL, "control reg" },
3330   { OPERAND_TYPE_TEST, "test reg" },
3331   { OPERAND_TYPE_DEBUG, "debug reg" },
3332   { OPERAND_TYPE_FLOATREG, "FReg" },
3333   { OPERAND_TYPE_FLOATACC, "FAcc" },
3334   { OPERAND_TYPE_SREG, "SReg" },
3335   { OPERAND_TYPE_REGMMX, "rMMX" },
3336   { OPERAND_TYPE_REGXMM, "rXMM" },
3337   { OPERAND_TYPE_REGYMM, "rYMM" },
3338   { OPERAND_TYPE_REGZMM, "rZMM" },
3339   { OPERAND_TYPE_REGTMM, "rTMM" },
3340   { OPERAND_TYPE_REGMASK, "Mask reg" },
3341 };
3342
3343 static void
3344 pt (i386_operand_type t)
3345 {
3346   unsigned int j;
3347   i386_operand_type a;
3348
3349   for (j = 0; j < ARRAY_SIZE (type_names); j++)
3350     {
3351       a = operand_type_and (t, type_names[j].mask);
3352       if (operand_type_equal (&a, &type_names[j].mask))
3353         fprintf (stdout, "%s, ",  type_names[j].name);
3354     }
3355   fflush (stdout);
3356 }
3357
3358 #endif /* DEBUG386 */
3359 \f
3360 static bfd_reloc_code_real_type
3361 reloc (unsigned int size,
3362        int pcrel,
3363        int sign,
3364        bfd_reloc_code_real_type other)
3365 {
3366   if (other != NO_RELOC)
3367     {
3368       reloc_howto_type *rel;
3369
3370       if (size == 8)
3371         switch (other)
3372           {
3373           case BFD_RELOC_X86_64_GOT32:
3374             return BFD_RELOC_X86_64_GOT64;
3375             break;
3376           case BFD_RELOC_X86_64_GOTPLT64:
3377             return BFD_RELOC_X86_64_GOTPLT64;
3378             break;
3379           case BFD_RELOC_X86_64_PLTOFF64:
3380             return BFD_RELOC_X86_64_PLTOFF64;
3381             break;
3382           case BFD_RELOC_X86_64_GOTPC32:
3383             other = BFD_RELOC_X86_64_GOTPC64;
3384             break;
3385           case BFD_RELOC_X86_64_GOTPCREL:
3386             other = BFD_RELOC_X86_64_GOTPCREL64;
3387             break;
3388           case BFD_RELOC_X86_64_TPOFF32:
3389             other = BFD_RELOC_X86_64_TPOFF64;
3390             break;
3391           case BFD_RELOC_X86_64_DTPOFF32:
3392             other = BFD_RELOC_X86_64_DTPOFF64;
3393             break;
3394           default:
3395             break;
3396           }
3397
3398 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3399       if (other == BFD_RELOC_SIZE32)
3400         {
3401           if (size == 8)
3402             other = BFD_RELOC_SIZE64;
3403           if (pcrel)
3404             {
3405               as_bad (_("there are no pc-relative size relocations"));
3406               return NO_RELOC;
3407             }
3408         }
3409 #endif
3410
3411       /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless.  */
3412       if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3413         sign = -1;
3414
3415       rel = bfd_reloc_type_lookup (stdoutput, other);
3416       if (!rel)
3417         as_bad (_("unknown relocation (%u)"), other);
3418       else if (size != bfd_get_reloc_size (rel))
3419         as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3420                 bfd_get_reloc_size (rel),
3421                 size);
3422       else if (pcrel && !rel->pc_relative)
3423         as_bad (_("non-pc-relative relocation for pc-relative field"));
3424       else if ((rel->complain_on_overflow == complain_overflow_signed
3425                 && !sign)
3426                || (rel->complain_on_overflow == complain_overflow_unsigned
3427                    && sign > 0))
3428         as_bad (_("relocated field and relocation type differ in signedness"));
3429       else
3430         return other;
3431       return NO_RELOC;
3432     }
3433
3434   if (pcrel)
3435     {
3436       if (!sign)
3437         as_bad (_("there are no unsigned pc-relative relocations"));
3438       switch (size)
3439         {
3440         case 1: return BFD_RELOC_8_PCREL;
3441         case 2: return BFD_RELOC_16_PCREL;
3442         case 4: return BFD_RELOC_32_PCREL;
3443         case 8: return BFD_RELOC_64_PCREL;
3444         }
3445       as_bad (_("cannot do %u byte pc-relative relocation"), size);
3446     }
3447   else
3448     {
3449       if (sign > 0)
3450         switch (size)
3451           {
3452           case 4: return BFD_RELOC_X86_64_32S;
3453           }
3454       else
3455         switch (size)
3456           {
3457           case 1: return BFD_RELOC_8;
3458           case 2: return BFD_RELOC_16;
3459           case 4: return BFD_RELOC_32;
3460           case 8: return BFD_RELOC_64;
3461           }
3462       as_bad (_("cannot do %s %u byte relocation"),
3463               sign > 0 ? "signed" : "unsigned", size);
3464     }
3465
3466   return NO_RELOC;
3467 }
3468
3469 /* Here we decide which fixups can be adjusted to make them relative to
3470    the beginning of the section instead of the symbol.  Basically we need
3471    to make sure that the dynamic relocations are done correctly, so in
3472    some cases we force the original symbol to be used.  */
3473
3474 int
3475 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3476 {
3477 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3478   if (!IS_ELF)
3479     return 1;
3480
3481   /* Don't adjust pc-relative references to merge sections in 64-bit
3482      mode.  */
3483   if (use_rela_relocations
3484       && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3485       && fixP->fx_pcrel)
3486     return 0;
3487
3488   /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3489      and changed later by validate_fix.  */
3490   if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3491       && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3492     return 0;
3493
3494   /* Adjust_reloc_syms doesn't know about the GOT.  Need to keep symbol
3495      for size relocations.  */
3496   if (fixP->fx_r_type == BFD_RELOC_SIZE32
3497       || fixP->fx_r_type == BFD_RELOC_SIZE64
3498       || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3499       || fixP->fx_r_type == BFD_RELOC_386_GOT32
3500       || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3501       || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3502       || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3503       || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3504       || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3505       || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3506       || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3507       || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3508       || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3509       || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3510       || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3511       || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3512       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3513       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3514       || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3515       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3516       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3517       || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3518       || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3519       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3520       || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3521       || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3522       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3523       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3524       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3525       || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3526       || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3527     return 0;
3528 #endif
3529   return 1;
3530 }
3531
3532 static int
3533 intel_float_operand (const char *mnemonic)
3534 {
3535   /* Note that the value returned is meaningful only for opcodes with (memory)
3536      operands, hence the code here is free to improperly handle opcodes that
3537      have no operands (for better performance and smaller code). */
3538
3539   if (mnemonic[0] != 'f')
3540     return 0; /* non-math */
3541
3542   switch (mnemonic[1])
3543     {
3544     /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3545        the fs segment override prefix not currently handled because no
3546        call path can make opcodes without operands get here */
3547     case 'i':
3548       return 2 /* integer op */;
3549     case 'l':
3550       if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3551         return 3; /* fldcw/fldenv */
3552       break;
3553     case 'n':
3554       if (mnemonic[2] != 'o' /* fnop */)
3555         return 3; /* non-waiting control op */
3556       break;
3557     case 'r':
3558       if (mnemonic[2] == 's')
3559         return 3; /* frstor/frstpm */
3560       break;
3561     case 's':
3562       if (mnemonic[2] == 'a')
3563         return 3; /* fsave */
3564       if (mnemonic[2] == 't')
3565         {
3566           switch (mnemonic[3])
3567             {
3568             case 'c': /* fstcw */
3569             case 'd': /* fstdw */
3570             case 'e': /* fstenv */
3571             case 's': /* fsts[gw] */
3572               return 3;
3573             }
3574         }
3575       break;
3576     case 'x':
3577       if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3578         return 0; /* fxsave/fxrstor are not really math ops */
3579       break;
3580     }
3581
3582   return 1;
3583 }
3584
3585 /* Build the VEX prefix.  */
3586
3587 static void
3588 build_vex_prefix (const insn_template *t)
3589 {
3590   unsigned int register_specifier;
3591   unsigned int implied_prefix;
3592   unsigned int vector_length;
3593   unsigned int w;
3594
3595   /* Check register specifier.  */
3596   if (i.vex.register_specifier)
3597     {
3598       register_specifier =
3599         ~register_number (i.vex.register_specifier) & 0xf;
3600       gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3601     }
3602   else
3603     register_specifier = 0xf;
3604
3605   /* Use 2-byte VEX prefix by swapping destination and source operand
3606      if there are more than 1 register operand.  */
3607   if (i.reg_operands > 1
3608       && i.vec_encoding != vex_encoding_vex3
3609       && i.dir_encoding == dir_encoding_default
3610       && i.operands == i.reg_operands
3611       && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3612       && i.tm.opcode_modifier.opcodespace == SPACE_0F
3613       && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3614       && i.rex == REX_B)
3615     {
3616       unsigned int xchg = i.operands - 1;
3617       union i386_op temp_op;
3618       i386_operand_type temp_type;
3619
3620       temp_type = i.types[xchg];
3621       i.types[xchg] = i.types[0];
3622       i.types[0] = temp_type;
3623       temp_op = i.op[xchg];
3624       i.op[xchg] = i.op[0];
3625       i.op[0] = temp_op;
3626
3627       gas_assert (i.rm.mode == 3);
3628
3629       i.rex = REX_R;
3630       xchg = i.rm.regmem;
3631       i.rm.regmem = i.rm.reg;
3632       i.rm.reg = xchg;
3633
3634       if (i.tm.opcode_modifier.d)
3635         i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3636                             ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3637       else /* Use the next insn.  */
3638         i.tm = t[1];
3639     }
3640
3641   /* Use 2-byte VEX prefix by swapping commutative source operands if there
3642      are no memory operands and at least 3 register ones.  */
3643   if (i.reg_operands >= 3
3644       && i.vec_encoding != vex_encoding_vex3
3645       && i.reg_operands == i.operands - i.imm_operands
3646       && i.tm.opcode_modifier.vex
3647       && i.tm.opcode_modifier.commutative
3648       && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3649       && i.rex == REX_B
3650       && i.vex.register_specifier
3651       && !(i.vex.register_specifier->reg_flags & RegRex))
3652     {
3653       unsigned int xchg = i.operands - i.reg_operands;
3654       union i386_op temp_op;
3655       i386_operand_type temp_type;
3656
3657       gas_assert (i.tm.opcode_modifier.opcodespace == SPACE_0F);
3658       gas_assert (!i.tm.opcode_modifier.sae);
3659       gas_assert (operand_type_equal (&i.types[i.operands - 2],
3660                                       &i.types[i.operands - 3]));
3661       gas_assert (i.rm.mode == 3);
3662
3663       temp_type = i.types[xchg];
3664       i.types[xchg] = i.types[xchg + 1];
3665       i.types[xchg + 1] = temp_type;
3666       temp_op = i.op[xchg];
3667       i.op[xchg] = i.op[xchg + 1];
3668       i.op[xchg + 1] = temp_op;
3669
3670       i.rex = 0;
3671       xchg = i.rm.regmem | 8;
3672       i.rm.regmem = ~register_specifier & 0xf;
3673       gas_assert (!(i.rm.regmem & 8));
3674       i.vex.register_specifier += xchg - i.rm.regmem;
3675       register_specifier = ~xchg & 0xf;
3676     }
3677
3678   if (i.tm.opcode_modifier.vex == VEXScalar)
3679     vector_length = avxscalar;
3680   else if (i.tm.opcode_modifier.vex == VEX256)
3681     vector_length = 1;
3682   else
3683     {
3684       unsigned int op;
3685
3686       /* Determine vector length from the last multi-length vector
3687          operand.  */
3688       vector_length = 0;
3689       for (op = t->operands; op--;)
3690         if (t->operand_types[op].bitfield.xmmword
3691             && t->operand_types[op].bitfield.ymmword
3692             && i.types[op].bitfield.ymmword)
3693           {
3694             vector_length = 1;
3695             break;
3696           }
3697     }
3698
3699   switch ((i.tm.base_opcode >> (i.tm.opcode_length << 3)) & 0xff)
3700     {
3701     case 0:
3702       implied_prefix = 0;
3703       break;
3704     case DATA_PREFIX_OPCODE:
3705       implied_prefix = 1;
3706       break;
3707     case REPE_PREFIX_OPCODE:
3708       implied_prefix = 2;
3709       break;
3710     case REPNE_PREFIX_OPCODE:
3711       implied_prefix = 3;
3712       break;
3713     default:
3714       abort ();
3715     }
3716
3717   /* Check the REX.W bit and VEXW.  */
3718   if (i.tm.opcode_modifier.vexw == VEXWIG)
3719     w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3720   else if (i.tm.opcode_modifier.vexw)
3721     w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3722   else
3723     w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3724
3725   /* Use 2-byte VEX prefix if possible.  */
3726   if (w == 0
3727       && i.vec_encoding != vex_encoding_vex3
3728       && i.tm.opcode_modifier.opcodespace == SPACE_0F
3729       && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3730     {
3731       /* 2-byte VEX prefix.  */
3732       unsigned int r;
3733
3734       i.vex.length = 2;
3735       i.vex.bytes[0] = 0xc5;
3736
3737       /* Check the REX.R bit.  */
3738       r = (i.rex & REX_R) ? 0 : 1;
3739       i.vex.bytes[1] = (r << 7
3740                         | register_specifier << 3
3741                         | vector_length << 2
3742                         | implied_prefix);
3743     }
3744   else
3745     {
3746       /* 3-byte VEX prefix.  */
3747       i.vex.length = 3;
3748
3749       switch (i.tm.opcode_modifier.opcodespace)
3750         {
3751         case SPACE_0F:
3752         case SPACE_0F38:
3753         case SPACE_0F3A:
3754           i.vex.bytes[0] = 0xc4;
3755           break;
3756         case SPACE_XOP08:
3757         case SPACE_XOP09:
3758         case SPACE_XOP0A:
3759           i.vex.bytes[0] = 0x8f;
3760           break;
3761         default:
3762           abort ();
3763         }
3764
3765       /* The high 3 bits of the second VEX byte are 1's compliment
3766          of RXB bits from REX.  */
3767       i.vex.bytes[1] = (~i.rex & 0x7) << 5 | i.tm.opcode_modifier.opcodespace;
3768
3769       i.vex.bytes[2] = (w << 7
3770                         | register_specifier << 3
3771                         | vector_length << 2
3772                         | implied_prefix);
3773     }
3774 }
3775
3776 static INLINE bfd_boolean
3777 is_evex_encoding (const insn_template *t)
3778 {
3779   return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3780          || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3781          || t->opcode_modifier.sae;
3782 }
3783
3784 static INLINE bfd_boolean
3785 is_any_vex_encoding (const insn_template *t)
3786 {
3787   return t->opcode_modifier.vex || is_evex_encoding (t);
3788 }
3789
3790 /* Build the EVEX prefix.  */
3791
3792 static void
3793 build_evex_prefix (void)
3794 {
3795   unsigned int register_specifier;
3796   unsigned int implied_prefix, w;
3797   rex_byte vrex_used = 0;
3798
3799   /* Check register specifier.  */
3800   if (i.vex.register_specifier)
3801     {
3802       gas_assert ((i.vrex & REX_X) == 0);
3803
3804       register_specifier = i.vex.register_specifier->reg_num;
3805       if ((i.vex.register_specifier->reg_flags & RegRex))
3806         register_specifier += 8;
3807       /* The upper 16 registers are encoded in the fourth byte of the
3808          EVEX prefix.  */
3809       if (!(i.vex.register_specifier->reg_flags & RegVRex))
3810         i.vex.bytes[3] = 0x8;
3811       register_specifier = ~register_specifier & 0xf;
3812     }
3813   else
3814     {
3815       register_specifier = 0xf;
3816
3817       /* Encode upper 16 vector index register in the fourth byte of
3818          the EVEX prefix.  */
3819       if (!(i.vrex & REX_X))
3820         i.vex.bytes[3] = 0x8;
3821       else
3822         vrex_used |= REX_X;
3823     }
3824
3825   switch ((i.tm.base_opcode >> 8) & 0xff)
3826     {
3827     case 0:
3828       implied_prefix = 0;
3829       break;
3830     case DATA_PREFIX_OPCODE:
3831       implied_prefix = 1;
3832       break;
3833     case REPE_PREFIX_OPCODE:
3834       implied_prefix = 2;
3835       break;
3836     case REPNE_PREFIX_OPCODE:
3837       implied_prefix = 3;
3838       break;
3839     default:
3840       abort ();
3841     }
3842
3843   /* 4 byte EVEX prefix.  */
3844   i.vex.length = 4;
3845   i.vex.bytes[0] = 0x62;
3846
3847   /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3848      bits from REX.  */
3849   gas_assert (i.tm.opcode_modifier.opcodespace >= SPACE_0F);
3850   gas_assert (i.tm.opcode_modifier.opcodespace <= SPACE_0F3A);
3851   i.vex.bytes[1] = (~i.rex & 0x7) << 5 | i.tm.opcode_modifier.opcodespace;
3852
3853   /* The fifth bit of the second EVEX byte is 1's compliment of the
3854      REX_R bit in VREX.  */
3855   if (!(i.vrex & REX_R))
3856     i.vex.bytes[1] |= 0x10;
3857   else
3858     vrex_used |= REX_R;
3859
3860   if ((i.reg_operands + i.imm_operands) == i.operands)
3861     {
3862       /* When all operands are registers, the REX_X bit in REX is not
3863          used.  We reuse it to encode the upper 16 registers, which is
3864          indicated by the REX_B bit in VREX.  The REX_X bit is encoded
3865          as 1's compliment.  */
3866       if ((i.vrex & REX_B))
3867         {
3868           vrex_used |= REX_B;
3869           i.vex.bytes[1] &= ~0x40;
3870         }
3871     }
3872
3873   /* EVEX instructions shouldn't need the REX prefix.  */
3874   i.vrex &= ~vrex_used;
3875   gas_assert (i.vrex == 0);
3876
3877   /* Check the REX.W bit and VEXW.  */
3878   if (i.tm.opcode_modifier.vexw == VEXWIG)
3879     w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3880   else if (i.tm.opcode_modifier.vexw)
3881     w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3882   else
3883     w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3884
3885   /* Encode the U bit.  */
3886   implied_prefix |= 0x4;
3887
3888   /* The third byte of the EVEX prefix.  */
3889   i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3890
3891   /* The fourth byte of the EVEX prefix.  */
3892   /* The zeroing-masking bit.  */
3893   if (i.mask && i.mask->zeroing)
3894     i.vex.bytes[3] |= 0x80;
3895
3896   /* Don't always set the broadcast bit if there is no RC.  */
3897   if (!i.rounding)
3898     {
3899       /* Encode the vector length.  */
3900       unsigned int vec_length;
3901
3902       if (!i.tm.opcode_modifier.evex
3903           || i.tm.opcode_modifier.evex == EVEXDYN)
3904         {
3905           unsigned int op;
3906
3907           /* Determine vector length from the last multi-length vector
3908              operand.  */
3909           for (op = i.operands; op--;)
3910             if (i.tm.operand_types[op].bitfield.xmmword
3911                 + i.tm.operand_types[op].bitfield.ymmword
3912                 + i.tm.operand_types[op].bitfield.zmmword > 1)
3913               {
3914                 if (i.types[op].bitfield.zmmword)
3915                   {
3916                     i.tm.opcode_modifier.evex = EVEX512;
3917                     break;
3918                   }
3919                 else if (i.types[op].bitfield.ymmword)
3920                   {
3921                     i.tm.opcode_modifier.evex = EVEX256;
3922                     break;
3923                   }
3924                 else if (i.types[op].bitfield.xmmword)
3925                   {
3926                     i.tm.opcode_modifier.evex = EVEX128;
3927                     break;
3928                   }
3929                 else if (i.broadcast && (int) op == i.broadcast->operand)
3930                   {
3931                     switch (i.broadcast->bytes)
3932                       {
3933                         case 64:
3934                           i.tm.opcode_modifier.evex = EVEX512;
3935                           break;
3936                         case 32:
3937                           i.tm.opcode_modifier.evex = EVEX256;
3938                           break;
3939                         case 16:
3940                           i.tm.opcode_modifier.evex = EVEX128;
3941                           break;
3942                         default:
3943                           abort ();
3944                       }
3945                     break;
3946                   }
3947               }
3948
3949           if (op >= MAX_OPERANDS)
3950             abort ();
3951         }
3952
3953       switch (i.tm.opcode_modifier.evex)
3954         {
3955         case EVEXLIG: /* LL' is ignored */
3956           vec_length = evexlig << 5;
3957           break;
3958         case EVEX128:
3959           vec_length = 0 << 5;
3960           break;
3961         case EVEX256:
3962           vec_length = 1 << 5;
3963           break;
3964         case EVEX512:
3965           vec_length = 2 << 5;
3966           break;
3967         default:
3968           abort ();
3969           break;
3970         }
3971       i.vex.bytes[3] |= vec_length;
3972       /* Encode the broadcast bit.  */
3973       if (i.broadcast)
3974         i.vex.bytes[3] |= 0x10;
3975     }
3976   else
3977     {
3978       if (i.rounding->type != saeonly)
3979         i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3980       else
3981         i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3982     }
3983
3984   if (i.mask && i.mask->mask)
3985     i.vex.bytes[3] |= i.mask->mask->reg_num;
3986 }
3987
3988 static void
3989 process_immext (void)
3990 {
3991   expressionS *exp;
3992
3993   /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3994      which is coded in the same place as an 8-bit immediate field
3995      would be.  Here we fake an 8-bit immediate operand from the
3996      opcode suffix stored in tm.extension_opcode.
3997
3998      AVX instructions also use this encoding, for some of
3999      3 argument instructions.  */
4000
4001   gas_assert (i.imm_operands <= 1
4002               && (i.operands <= 2
4003                   || (is_any_vex_encoding (&i.tm)
4004                       && i.operands <= 4)));
4005
4006   exp = &im_expressions[i.imm_operands++];
4007   i.op[i.operands].imms = exp;
4008   i.types[i.operands] = imm8;
4009   i.operands++;
4010   exp->X_op = O_constant;
4011   exp->X_add_number = i.tm.extension_opcode;
4012   i.tm.extension_opcode = None;
4013 }
4014
4015
4016 static int
4017 check_hle (void)
4018 {
4019   switch (i.tm.opcode_modifier.prefixok)
4020     {
4021     default:
4022       abort ();
4023     case PrefixLock:
4024     case PrefixNone:
4025     case PrefixNoTrack:
4026     case PrefixRep:
4027       as_bad (_("invalid instruction `%s' after `%s'"),
4028               i.tm.name, i.hle_prefix);
4029       return 0;
4030     case PrefixHLELock:
4031       if (i.prefix[LOCK_PREFIX])
4032         return 1;
4033       as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
4034       return 0;
4035     case PrefixHLEAny:
4036       return 1;
4037     case PrefixHLERelease:
4038       if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
4039         {
4040           as_bad (_("instruction `%s' after `xacquire' not allowed"),
4041                   i.tm.name);
4042           return 0;
4043         }
4044       if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
4045         {
4046           as_bad (_("memory destination needed for instruction `%s'"
4047                     " after `xrelease'"), i.tm.name);
4048           return 0;
4049         }
4050       return 1;
4051     }
4052 }
4053
4054 /* Try the shortest encoding by shortening operand size.  */
4055
4056 static void
4057 optimize_encoding (void)
4058 {
4059   unsigned int j;
4060
4061   if (optimize_for_space
4062       && !is_any_vex_encoding (&i.tm)
4063       && i.reg_operands == 1
4064       && i.imm_operands == 1
4065       && !i.types[1].bitfield.byte
4066       && i.op[0].imms->X_op == O_constant
4067       && fits_in_imm7 (i.op[0].imms->X_add_number)
4068       && (i.tm.base_opcode == 0xa8
4069           || (i.tm.base_opcode == 0xf6
4070               && i.tm.extension_opcode == 0x0)))
4071     {
4072       /* Optimize: -Os:
4073            test $imm7, %r64/%r32/%r16  -> test $imm7, %r8
4074        */
4075       unsigned int base_regnum = i.op[1].regs->reg_num;
4076       if (flag_code == CODE_64BIT || base_regnum < 4)
4077         {
4078           i.types[1].bitfield.byte = 1;
4079           /* Ignore the suffix.  */
4080           i.suffix = 0;
4081           /* Convert to byte registers.  */
4082           if (i.types[1].bitfield.word)
4083             j = 16;
4084           else if (i.types[1].bitfield.dword)
4085             j = 32;
4086           else
4087             j = 48;
4088           if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4089             j += 8;
4090           i.op[1].regs -= j;
4091         }
4092     }
4093   else if (flag_code == CODE_64BIT
4094            && !is_any_vex_encoding (&i.tm)
4095            && ((i.types[1].bitfield.qword
4096                 && i.reg_operands == 1
4097                 && i.imm_operands == 1
4098                 && i.op[0].imms->X_op == O_constant
4099                 && ((i.tm.base_opcode == 0xb8
4100                      && i.tm.extension_opcode == None
4101                      && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4102                     || (fits_in_imm31 (i.op[0].imms->X_add_number)
4103                         && ((i.tm.base_opcode == 0x24
4104                              || i.tm.base_opcode == 0xa8)
4105                             || (i.tm.base_opcode == 0x80
4106                                 && i.tm.extension_opcode == 0x4)
4107                             || ((i.tm.base_opcode == 0xf6
4108                                  || (i.tm.base_opcode | 1) == 0xc7)
4109                                 && i.tm.extension_opcode == 0x0)))
4110                     || (fits_in_imm7 (i.op[0].imms->X_add_number)
4111                         && i.tm.base_opcode == 0x83
4112                         && i.tm.extension_opcode == 0x4)))
4113                || (i.types[0].bitfield.qword
4114                    && ((i.reg_operands == 2
4115                         && i.op[0].regs == i.op[1].regs
4116                         && (i.tm.base_opcode == 0x30
4117                             || i.tm.base_opcode == 0x28))
4118                        || (i.reg_operands == 1
4119                            && i.operands == 1
4120                            && i.tm.base_opcode == 0x30)))))
4121     {
4122       /* Optimize: -O:
4123            andq $imm31, %r64   -> andl $imm31, %r32
4124            andq $imm7, %r64    -> andl $imm7, %r32
4125            testq $imm31, %r64  -> testl $imm31, %r32
4126            xorq %r64, %r64     -> xorl %r32, %r32
4127            subq %r64, %r64     -> subl %r32, %r32
4128            movq $imm31, %r64   -> movl $imm31, %r32
4129            movq $imm32, %r64   -> movl $imm32, %r32
4130         */
4131       i.tm.opcode_modifier.norex64 = 1;
4132       if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
4133         {
4134           /* Handle
4135                movq $imm31, %r64   -> movl $imm31, %r32
4136                movq $imm32, %r64   -> movl $imm32, %r32
4137            */
4138           i.tm.operand_types[0].bitfield.imm32 = 1;
4139           i.tm.operand_types[0].bitfield.imm32s = 0;
4140           i.tm.operand_types[0].bitfield.imm64 = 0;
4141           i.types[0].bitfield.imm32 = 1;
4142           i.types[0].bitfield.imm32s = 0;
4143           i.types[0].bitfield.imm64 = 0;
4144           i.types[1].bitfield.dword = 1;
4145           i.types[1].bitfield.qword = 0;
4146           if ((i.tm.base_opcode | 1) == 0xc7)
4147             {
4148               /* Handle
4149                    movq $imm31, %r64   -> movl $imm31, %r32
4150                */
4151               i.tm.base_opcode = 0xb8;
4152               i.tm.extension_opcode = None;
4153               i.tm.opcode_modifier.w = 0;
4154               i.tm.opcode_modifier.modrm = 0;
4155             }
4156         }
4157     }
4158   else if (optimize > 1
4159            && !optimize_for_space
4160            && !is_any_vex_encoding (&i.tm)
4161            && i.reg_operands == 2
4162            && i.op[0].regs == i.op[1].regs
4163            && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4164                || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4165            && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4166     {
4167       /* Optimize: -O2:
4168            andb %rN, %rN  -> testb %rN, %rN
4169            andw %rN, %rN  -> testw %rN, %rN
4170            andq %rN, %rN  -> testq %rN, %rN
4171            orb %rN, %rN   -> testb %rN, %rN
4172            orw %rN, %rN   -> testw %rN, %rN
4173            orq %rN, %rN   -> testq %rN, %rN
4174
4175            and outside of 64-bit mode
4176
4177            andl %rN, %rN  -> testl %rN, %rN
4178            orl %rN, %rN   -> testl %rN, %rN
4179        */
4180       i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4181     }
4182   else if (i.reg_operands == 3
4183            && i.op[0].regs == i.op[1].regs
4184            && !i.types[2].bitfield.xmmword
4185            && (i.tm.opcode_modifier.vex
4186                || ((!i.mask || i.mask->zeroing)
4187                    && !i.rounding
4188                    && is_evex_encoding (&i.tm)
4189                    && (i.vec_encoding != vex_encoding_evex
4190                        || cpu_arch_isa_flags.bitfield.cpuavx512vl
4191                        || i.tm.cpu_flags.bitfield.cpuavx512vl
4192                        || (i.tm.operand_types[2].bitfield.zmmword
4193                            && i.types[2].bitfield.ymmword))))
4194            && ((i.tm.base_opcode == 0x55
4195                 || i.tm.base_opcode == 0x6655
4196                 || i.tm.base_opcode == 0x66df
4197                 || i.tm.base_opcode == 0x57
4198                 || i.tm.base_opcode == 0x6657
4199                 || i.tm.base_opcode == 0x66ef
4200                 || i.tm.base_opcode == 0x66f8
4201                 || i.tm.base_opcode == 0x66f9
4202                 || i.tm.base_opcode == 0x66fa
4203                 || i.tm.base_opcode == 0x66fb
4204                 || i.tm.base_opcode == 0x42
4205                 || i.tm.base_opcode == 0x6642
4206                 || i.tm.base_opcode == 0x47
4207                 || i.tm.base_opcode == 0x6647)
4208                && i.tm.extension_opcode == None))
4209     {
4210       /* Optimize: -O1:
4211            VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4212            vpsubq and vpsubw:
4213              EVEX VOP %zmmM, %zmmM, %zmmN
4214                -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4215                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4216              EVEX VOP %ymmM, %ymmM, %ymmN
4217                -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4218                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4219              VEX VOP %ymmM, %ymmM, %ymmN
4220                -> VEX VOP %xmmM, %xmmM, %xmmN
4221            VOP, one of vpandn and vpxor:
4222              VEX VOP %ymmM, %ymmM, %ymmN
4223                -> VEX VOP %xmmM, %xmmM, %xmmN
4224            VOP, one of vpandnd and vpandnq:
4225              EVEX VOP %zmmM, %zmmM, %zmmN
4226                -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4227                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4228              EVEX VOP %ymmM, %ymmM, %ymmN
4229                -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4230                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4231            VOP, one of vpxord and vpxorq:
4232              EVEX VOP %zmmM, %zmmM, %zmmN
4233                -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4234                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4235              EVEX VOP %ymmM, %ymmM, %ymmN
4236                -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4237                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4238            VOP, one of kxord and kxorq:
4239              VEX VOP %kM, %kM, %kN
4240                -> VEX kxorw %kM, %kM, %kN
4241            VOP, one of kandnd and kandnq:
4242              VEX VOP %kM, %kM, %kN
4243                -> VEX kandnw %kM, %kM, %kN
4244        */
4245       if (is_evex_encoding (&i.tm))
4246         {
4247           if (i.vec_encoding != vex_encoding_evex)
4248             {
4249               i.tm.opcode_modifier.vex = VEX128;
4250               i.tm.opcode_modifier.vexw = VEXW0;
4251               i.tm.opcode_modifier.evex = 0;
4252             }
4253           else if (optimize > 1)
4254             i.tm.opcode_modifier.evex = EVEX128;
4255           else
4256             return;
4257         }
4258       else if (i.tm.operand_types[0].bitfield.class == RegMask)
4259         {
4260           i.tm.base_opcode &= 0xff;
4261           i.tm.opcode_modifier.vexw = VEXW0;
4262         }
4263       else
4264         i.tm.opcode_modifier.vex = VEX128;
4265
4266       if (i.tm.opcode_modifier.vex)
4267         for (j = 0; j < 3; j++)
4268           {
4269             i.types[j].bitfield.xmmword = 1;
4270             i.types[j].bitfield.ymmword = 0;
4271           }
4272     }
4273   else if (i.vec_encoding != vex_encoding_evex
4274            && !i.types[0].bitfield.zmmword
4275            && !i.types[1].bitfield.zmmword
4276            && !i.mask
4277            && !i.broadcast
4278            && is_evex_encoding (&i.tm)
4279            && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4280                || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
4281                || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f
4282                || (i.tm.base_opcode & ~4) == 0x66db
4283                || (i.tm.base_opcode & ~4) == 0x66eb)
4284            && i.tm.extension_opcode == None)
4285     {
4286       /* Optimize: -O1:
4287            VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4288            vmovdqu32 and vmovdqu64:
4289              EVEX VOP %xmmM, %xmmN
4290                -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4291              EVEX VOP %ymmM, %ymmN
4292                -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4293              EVEX VOP %xmmM, mem
4294                -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4295              EVEX VOP %ymmM, mem
4296                -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4297              EVEX VOP mem, %xmmN
4298                -> VEX mvmovdqa|vmovdquem, %xmmN (N < 16)
4299              EVEX VOP mem, %ymmN
4300                -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4301            VOP, one of vpand, vpandn, vpor, vpxor:
4302              EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4303                -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4304              EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4305                -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4306              EVEX VOP{d,q} mem, %xmmM, %xmmN
4307                -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4308              EVEX VOP{d,q} mem, %ymmM, %ymmN
4309                -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4310        */
4311       for (j = 0; j < i.operands; j++)
4312         if (operand_type_check (i.types[j], disp)
4313             && i.op[j].disps->X_op == O_constant)
4314           {
4315             /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4316                has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4317                bytes, we choose EVEX Disp8 over VEX Disp32.  */
4318             int evex_disp8, vex_disp8;
4319             unsigned int memshift = i.memshift;
4320             offsetT n = i.op[j].disps->X_add_number;
4321
4322             evex_disp8 = fits_in_disp8 (n);
4323             i.memshift = 0;
4324             vex_disp8 = fits_in_disp8 (n);
4325             if (evex_disp8 != vex_disp8)
4326               {
4327                 i.memshift = memshift;
4328                 return;
4329               }
4330
4331             i.types[j].bitfield.disp8 = vex_disp8;
4332             break;
4333           }
4334       if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4335         i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
4336       i.tm.opcode_modifier.vex
4337         = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4338       i.tm.opcode_modifier.vexw = VEXW0;
4339       /* VPAND, VPOR, and VPXOR are commutative.  */
4340       if (i.reg_operands == 3 && i.tm.base_opcode != 0x66df)
4341         i.tm.opcode_modifier.commutative = 1;
4342       i.tm.opcode_modifier.evex = 0;
4343       i.tm.opcode_modifier.masking = 0;
4344       i.tm.opcode_modifier.broadcast = 0;
4345       i.tm.opcode_modifier.disp8memshift = 0;
4346       i.memshift = 0;
4347       if (j < i.operands)
4348         i.types[j].bitfield.disp8
4349           = fits_in_disp8 (i.op[j].disps->X_add_number);
4350     }
4351 }
4352
4353 /* Return non-zero for load instruction.  */
4354
4355 static int
4356 load_insn_p (void)
4357 {
4358   unsigned int dest;
4359   int any_vex_p = is_any_vex_encoding (&i.tm);
4360   unsigned int base_opcode = i.tm.base_opcode | 1;
4361
4362   if (!any_vex_p)
4363     {
4364       /* Anysize insns: lea, invlpg, clflush, prefetchnta, prefetcht0,
4365          prefetcht1, prefetcht2, prefetchtw, bndmk, bndcl, bndcu, bndcn,
4366          bndstx, bndldx, prefetchwt1, clflushopt, clwb, cldemote.  */
4367       if (i.tm.opcode_modifier.anysize)
4368         return 0;
4369
4370       /* pop, popf, popa.   */
4371       if (strcmp (i.tm.name, "pop") == 0
4372           || i.tm.base_opcode == 0x9d
4373           || i.tm.base_opcode == 0x61)
4374         return 1;
4375
4376       /* movs, cmps, lods, scas.  */
4377       if ((i.tm.base_opcode | 0xb) == 0xaf)
4378         return 1;
4379
4380       /* outs, xlatb.  */
4381       if (base_opcode == 0x6f
4382           || i.tm.base_opcode == 0xd7)
4383         return 1;
4384       /* NB: For AMD-specific insns with implicit memory operands,
4385          they're intentionally not covered.  */
4386     }
4387
4388   /* No memory operand.  */
4389   if (!i.mem_operands)
4390     return 0;
4391
4392   if (any_vex_p)
4393     {
4394       /* vldmxcsr.  */
4395       if (i.tm.base_opcode == 0xae
4396           && i.tm.opcode_modifier.vex
4397           && i.tm.opcode_modifier.opcodespace == SPACE_0F
4398           && i.tm.extension_opcode == 2)
4399         return 1;
4400     }
4401   else
4402     {
4403       /* test, not, neg, mul, imul, div, idiv.  */
4404       if ((i.tm.base_opcode == 0xf6 || i.tm.base_opcode == 0xf7)
4405           && i.tm.extension_opcode != 1)
4406         return 1;
4407
4408       /* inc, dec.  */
4409       if (base_opcode == 0xff && i.tm.extension_opcode <= 1)
4410         return 1;
4411
4412       /* add, or, adc, sbb, and, sub, xor, cmp.  */
4413       if (i.tm.base_opcode >= 0x80 && i.tm.base_opcode <= 0x83)
4414         return 1;
4415
4416       /* bt, bts, btr, btc.  */
4417       if (i.tm.base_opcode == 0xfba
4418           && (i.tm.extension_opcode >= 4 && i.tm.extension_opcode <= 7))
4419         return 1;
4420
4421       /* rol, ror, rcl, rcr, shl/sal, shr, sar. */
4422       if ((base_opcode == 0xc1
4423            || (i.tm.base_opcode >= 0xd0 && i.tm.base_opcode <= 0xd3))
4424           && i.tm.extension_opcode != 6)
4425         return 1;
4426
4427       /* cmpxchg8b, cmpxchg16b, xrstors, vmptrld.  */
4428       if (i.tm.base_opcode == 0xfc7
4429           && i.tm.opcode_modifier.opcodeprefix == PREFIX_NONE
4430           && (i.tm.extension_opcode == 1 || i.tm.extension_opcode == 3
4431               || i.tm.extension_opcode == 6))
4432         return 1;
4433
4434       /* fxrstor, ldmxcsr, xrstor.  */
4435       if (i.tm.base_opcode == 0xfae
4436           && (i.tm.extension_opcode == 1
4437               || i.tm.extension_opcode == 2
4438               || i.tm.extension_opcode == 5))
4439         return 1;
4440
4441       /* lgdt, lidt, lmsw.  */
4442       if (i.tm.base_opcode == 0xf01
4443           && (i.tm.extension_opcode == 2
4444               || i.tm.extension_opcode == 3
4445               || i.tm.extension_opcode == 6))
4446         return 1;
4447
4448       /* Check for x87 instructions.  */
4449       if (i.tm.base_opcode >= 0xd8 && i.tm.base_opcode <= 0xdf)
4450         {
4451           /* Skip fst, fstp, fstenv, fstcw.  */
4452           if (i.tm.base_opcode == 0xd9
4453               && (i.tm.extension_opcode == 2
4454                   || i.tm.extension_opcode == 3
4455                   || i.tm.extension_opcode == 6
4456                   || i.tm.extension_opcode == 7))
4457             return 0;
4458
4459           /* Skip fisttp, fist, fistp, fstp.  */
4460           if (i.tm.base_opcode == 0xdb
4461               && (i.tm.extension_opcode == 1
4462                   || i.tm.extension_opcode == 2
4463                   || i.tm.extension_opcode == 3
4464                   || i.tm.extension_opcode == 7))
4465             return 0;
4466
4467           /* Skip fisttp, fst, fstp, fsave, fstsw.  */
4468           if (i.tm.base_opcode == 0xdd
4469               && (i.tm.extension_opcode == 1
4470                   || i.tm.extension_opcode == 2
4471                   || i.tm.extension_opcode == 3
4472                   || i.tm.extension_opcode == 6
4473                   || i.tm.extension_opcode == 7))
4474             return 0;
4475
4476           /* Skip fisttp, fist, fistp, fbstp, fistp.  */
4477           if (i.tm.base_opcode == 0xdf
4478               && (i.tm.extension_opcode == 1
4479                   || i.tm.extension_opcode == 2
4480                   || i.tm.extension_opcode == 3
4481                   || i.tm.extension_opcode == 6
4482                   || i.tm.extension_opcode == 7))
4483             return 0;
4484
4485           return 1;
4486         }
4487     }
4488
4489   dest = i.operands - 1;
4490
4491   /* Check fake imm8 operand and 3 source operands.  */
4492   if ((i.tm.opcode_modifier.immext
4493        || i.tm.opcode_modifier.vexsources == VEX3SOURCES)
4494       && i.types[dest].bitfield.imm8)
4495     dest--;
4496
4497   /* add, or, adc, sbb, and, sub, xor, cmp, test, xchg, xadd  */
4498   if (!any_vex_p
4499       && (base_opcode == 0x1
4500           || base_opcode == 0x9
4501           || base_opcode == 0x11
4502           || base_opcode == 0x19
4503           || base_opcode == 0x21
4504           || base_opcode == 0x29
4505           || base_opcode == 0x31
4506           || base_opcode == 0x39
4507           || (i.tm.base_opcode >= 0x84 && i.tm.base_opcode <= 0x87)
4508           || base_opcode == 0xfc1))
4509     return 1;
4510
4511   /* Check for load instruction.  */
4512   return (i.types[dest].bitfield.class != ClassNone
4513           || i.types[dest].bitfield.instance == Accum);
4514 }
4515
4516 /* Output lfence, 0xfaee8, after instruction.  */
4517
4518 static void
4519 insert_lfence_after (void)
4520 {
4521   if (lfence_after_load && load_insn_p ())
4522     {
4523       /* There are also two REP string instructions that require
4524          special treatment. Specifically, the compare string (CMPS)
4525          and scan string (SCAS) instructions set EFLAGS in a manner
4526          that depends on the data being compared/scanned. When used
4527          with a REP prefix, the number of iterations may therefore
4528          vary depending on this data. If the data is a program secret
4529          chosen by the adversary using an LVI method,
4530          then this data-dependent behavior may leak some aspect
4531          of the secret.  */
4532       if (((i.tm.base_opcode | 0x1) == 0xa7
4533            || (i.tm.base_opcode | 0x1) == 0xaf)
4534           && i.prefix[REP_PREFIX])
4535         {
4536             as_warn (_("`%s` changes flags which would affect control flow behavior"),
4537                      i.tm.name);
4538         }
4539       char *p = frag_more (3);
4540       *p++ = 0xf;
4541       *p++ = 0xae;
4542       *p = 0xe8;
4543     }
4544 }
4545
4546 /* Output lfence, 0xfaee8, before instruction.  */
4547
4548 static void
4549 insert_lfence_before (void)
4550 {
4551   char *p;
4552
4553   if (is_any_vex_encoding (&i.tm))
4554     return;
4555
4556   if (i.tm.base_opcode == 0xff
4557       && (i.tm.extension_opcode == 2 || i.tm.extension_opcode == 4))
4558     {
4559       /* Insert lfence before indirect branch if needed.  */
4560
4561       if (lfence_before_indirect_branch == lfence_branch_none)
4562         return;
4563
4564       if (i.operands != 1)
4565         abort ();
4566
4567       if (i.reg_operands == 1)
4568         {
4569           /* Indirect branch via register.  Don't insert lfence with
4570              -mlfence-after-load=yes.  */
4571           if (lfence_after_load
4572               || lfence_before_indirect_branch == lfence_branch_memory)
4573             return;
4574         }
4575       else if (i.mem_operands == 1
4576                && lfence_before_indirect_branch != lfence_branch_register)
4577         {
4578           as_warn (_("indirect `%s` with memory operand should be avoided"),
4579                    i.tm.name);
4580           return;
4581         }
4582       else
4583         return;
4584
4585       if (last_insn.kind != last_insn_other
4586           && last_insn.seg == now_seg)
4587         {
4588           as_warn_where (last_insn.file, last_insn.line,
4589                          _("`%s` skips -mlfence-before-indirect-branch on `%s`"),
4590                          last_insn.name, i.tm.name);
4591           return;
4592         }
4593
4594       p = frag_more (3);
4595       *p++ = 0xf;
4596       *p++ = 0xae;
4597       *p = 0xe8;
4598       return;
4599     }
4600
4601   /* Output or/not/shl and lfence before near ret.  */
4602   if (lfence_before_ret != lfence_before_ret_none
4603       && (i.tm.base_opcode == 0xc2
4604           || i.tm.base_opcode == 0xc3))
4605     {
4606       if (last_insn.kind != last_insn_other
4607           && last_insn.seg == now_seg)
4608         {
4609           as_warn_where (last_insn.file, last_insn.line,
4610                          _("`%s` skips -mlfence-before-ret on `%s`"),
4611                          last_insn.name, i.tm.name);
4612           return;
4613         }
4614
4615       /* Near ret ingore operand size override under CPU64.  */
4616       char prefix = flag_code == CODE_64BIT
4617                     ? 0x48
4618                     : i.prefix[DATA_PREFIX] ? 0x66 : 0x0;
4619
4620       if (lfence_before_ret == lfence_before_ret_not)
4621         {
4622           /* not: 0xf71424, may add prefix
4623              for operand size override or 64-bit code.  */
4624           p = frag_more ((prefix ? 2 : 0) + 6 + 3);
4625           if (prefix)
4626             *p++ = prefix;
4627           *p++ = 0xf7;
4628           *p++ = 0x14;
4629           *p++ = 0x24;
4630           if (prefix)
4631             *p++ = prefix;
4632           *p++ = 0xf7;
4633           *p++ = 0x14;
4634           *p++ = 0x24;
4635         }
4636       else
4637         {
4638           p = frag_more ((prefix ? 1 : 0) + 4 + 3);
4639           if (prefix)
4640             *p++ = prefix;
4641           if (lfence_before_ret == lfence_before_ret_or)
4642             {
4643               /* or: 0x830c2400, may add prefix
4644                  for operand size override or 64-bit code.  */
4645               *p++ = 0x83;
4646               *p++ = 0x0c;
4647             }
4648           else
4649             {
4650               /* shl: 0xc1242400, may add prefix
4651                  for operand size override or 64-bit code.  */
4652               *p++ = 0xc1;
4653               *p++ = 0x24;
4654             }
4655
4656           *p++ = 0x24;
4657           *p++ = 0x0;
4658         }
4659
4660       *p++ = 0xf;
4661       *p++ = 0xae;
4662       *p = 0xe8;
4663     }
4664 }
4665
4666 /* This is the guts of the machine-dependent assembler.  LINE points to a
4667    machine dependent instruction.  This function is supposed to emit
4668    the frags/bytes it assembles to.  */
4669
4670 void
4671 md_assemble (char *line)
4672 {
4673   unsigned int j;
4674   char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4675   const insn_template *t;
4676
4677   /* Initialize globals.  */
4678   memset (&i, '\0', sizeof (i));
4679   for (j = 0; j < MAX_OPERANDS; j++)
4680     i.reloc[j] = NO_RELOC;
4681   memset (disp_expressions, '\0', sizeof (disp_expressions));
4682   memset (im_expressions, '\0', sizeof (im_expressions));
4683   save_stack_p = save_stack;
4684
4685   /* First parse an instruction mnemonic & call i386_operand for the operands.
4686      We assume that the scrubber has arranged it so that line[0] is the valid
4687      start of a (possibly prefixed) mnemonic.  */
4688
4689   line = parse_insn (line, mnemonic);
4690   if (line == NULL)
4691     return;
4692   mnem_suffix = i.suffix;
4693
4694   line = parse_operands (line, mnemonic);
4695   this_operand = -1;
4696   xfree (i.memop1_string);
4697   i.memop1_string = NULL;
4698   if (line == NULL)
4699     return;
4700
4701   /* Now we've parsed the mnemonic into a set of templates, and have the
4702      operands at hand.  */
4703
4704   /* All Intel opcodes have reversed operands except for "bound", "enter",
4705      "monitor*", "mwait*", "tpause", and "umwait".  We also don't reverse
4706      intersegment "jmp" and "call" instructions with 2 immediate operands so
4707      that the immediate segment precedes the offset, as it does when in AT&T
4708      mode.  */
4709   if (intel_syntax
4710       && i.operands > 1
4711       && (strcmp (mnemonic, "bound") != 0)
4712       && (strcmp (mnemonic, "invlpga") != 0)
4713       && (strncmp (mnemonic, "monitor", 7) != 0)
4714       && (strncmp (mnemonic, "mwait", 5) != 0)
4715       && (strcmp (mnemonic, "tpause") != 0)
4716       && (strcmp (mnemonic, "umwait") != 0)
4717       && !(operand_type_check (i.types[0], imm)
4718            && operand_type_check (i.types[1], imm)))
4719     swap_operands ();
4720
4721   /* The order of the immediates should be reversed
4722      for 2 immediates extrq and insertq instructions */
4723   if (i.imm_operands == 2
4724       && (strcmp (mnemonic, "extrq") == 0
4725           || strcmp (mnemonic, "insertq") == 0))
4726       swap_2_operands (0, 1);
4727
4728   if (i.imm_operands)
4729     optimize_imm ();
4730
4731   /* Don't optimize displacement for movabs since it only takes 64bit
4732      displacement.  */
4733   if (i.disp_operands
4734       && i.disp_encoding != disp_encoding_32bit
4735       && (flag_code != CODE_64BIT
4736           || strcmp (mnemonic, "movabs") != 0))
4737     optimize_disp ();
4738
4739   /* Next, we find a template that matches the given insn,
4740      making sure the overlap of the given operands types is consistent
4741      with the template operand types.  */
4742
4743   if (!(t = match_template (mnem_suffix)))
4744     return;
4745
4746   if (sse_check != check_none
4747       && !i.tm.opcode_modifier.noavx
4748       && !i.tm.cpu_flags.bitfield.cpuavx
4749       && !i.tm.cpu_flags.bitfield.cpuavx512f
4750       && (i.tm.cpu_flags.bitfield.cpusse
4751           || i.tm.cpu_flags.bitfield.cpusse2
4752           || i.tm.cpu_flags.bitfield.cpusse3
4753           || i.tm.cpu_flags.bitfield.cpussse3
4754           || i.tm.cpu_flags.bitfield.cpusse4_1
4755           || i.tm.cpu_flags.bitfield.cpusse4_2
4756           || i.tm.cpu_flags.bitfield.cpupclmul
4757           || i.tm.cpu_flags.bitfield.cpuaes
4758           || i.tm.cpu_flags.bitfield.cpusha
4759           || i.tm.cpu_flags.bitfield.cpugfni))
4760     {
4761       (sse_check == check_warning
4762        ? as_warn
4763        : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4764     }
4765
4766   if (i.tm.opcode_modifier.fwait)
4767     if (!add_prefix (FWAIT_OPCODE))
4768       return;
4769
4770   /* Check if REP prefix is OK.  */
4771   if (i.rep_prefix && i.tm.opcode_modifier.prefixok != PrefixRep)
4772     {
4773       as_bad (_("invalid instruction `%s' after `%s'"),
4774                 i.tm.name, i.rep_prefix);
4775       return;
4776     }
4777
4778   /* Check for lock without a lockable instruction.  Destination operand
4779      must be memory unless it is xchg (0x86).  */
4780   if (i.prefix[LOCK_PREFIX]
4781       && (i.tm.opcode_modifier.prefixok < PrefixLock
4782           || i.mem_operands == 0
4783           || (i.tm.base_opcode != 0x86
4784               && !(i.flags[i.operands - 1] & Operand_Mem))))
4785     {
4786       as_bad (_("expecting lockable instruction after `lock'"));
4787       return;
4788     }
4789
4790   /* Check for data size prefix on VEX/XOP/EVEX encoded and SIMD insns.  */
4791   if (i.prefix[DATA_PREFIX]
4792       && (is_any_vex_encoding (&i.tm)
4793           || i.tm.operand_types[i.imm_operands].bitfield.class >= RegMMX
4794           || i.tm.operand_types[i.imm_operands + 1].bitfield.class >= RegMMX))
4795     {
4796       as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4797       return;
4798     }
4799
4800   /* Check if HLE prefix is OK.  */
4801   if (i.hle_prefix && !check_hle ())
4802     return;
4803
4804   /* Check BND prefix.  */
4805   if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4806     as_bad (_("expecting valid branch instruction after `bnd'"));
4807
4808   /* Check NOTRACK prefix.  */
4809   if (i.notrack_prefix && i.tm.opcode_modifier.prefixok != PrefixNoTrack)
4810     as_bad (_("expecting indirect branch instruction after `notrack'"));
4811
4812   if (i.tm.cpu_flags.bitfield.cpumpx)
4813     {
4814       if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4815         as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4816       else if (flag_code != CODE_16BIT
4817                ? i.prefix[ADDR_PREFIX]
4818                : i.mem_operands && !i.prefix[ADDR_PREFIX])
4819         as_bad (_("16-bit address isn't allowed in MPX instructions"));
4820     }
4821
4822   /* Insert BND prefix.  */
4823   if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4824     {
4825       if (!i.prefix[BND_PREFIX])
4826         add_prefix (BND_PREFIX_OPCODE);
4827       else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4828         {
4829           as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4830           i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4831         }
4832     }
4833
4834   /* Check string instruction segment overrides.  */
4835   if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
4836     {
4837       gas_assert (i.mem_operands);
4838       if (!check_string ())
4839         return;
4840       i.disp_operands = 0;
4841     }
4842
4843   if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4844     optimize_encoding ();
4845
4846   if (!process_suffix ())
4847     return;
4848
4849   /* Update operand types and check extended states.  */
4850   for (j = 0; j < i.operands; j++)
4851     {
4852       i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4853       switch (i.tm.operand_types[j].bitfield.class)
4854         {
4855         default:
4856           break;
4857         case RegMMX:
4858           i.xstate |= xstate_mmx;
4859           break;
4860         case RegMask:
4861           i.xstate |= xstate_mask;
4862           break;
4863         case RegSIMD:
4864           if (i.tm.operand_types[j].bitfield.tmmword)
4865             i.xstate |= xstate_tmm;
4866           else if (i.tm.operand_types[j].bitfield.zmmword)
4867             i.xstate |= xstate_zmm;
4868           else if (i.tm.operand_types[j].bitfield.ymmword)
4869             i.xstate |= xstate_ymm;
4870           else if (i.tm.operand_types[j].bitfield.xmmword)
4871             i.xstate |= xstate_xmm;
4872           break;
4873         }
4874     }
4875
4876   /* Make still unresolved immediate matches conform to size of immediate
4877      given in i.suffix.  */
4878   if (!finalize_imm ())
4879     return;
4880
4881   if (i.types[0].bitfield.imm1)
4882     i.imm_operands = 0; /* kludge for shift insns.  */
4883
4884   /* We only need to check those implicit registers for instructions
4885      with 3 operands or less.  */
4886   if (i.operands <= 3)
4887     for (j = 0; j < i.operands; j++)
4888       if (i.types[j].bitfield.instance != InstanceNone
4889           && !i.types[j].bitfield.xmmword)
4890         i.reg_operands--;
4891
4892   /* For insns with operands there are more diddles to do to the opcode.  */
4893   if (i.operands)
4894     {
4895       if (!process_operands ())
4896         return;
4897     }
4898   else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4899     {
4900       /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc.  */
4901       as_warn (_("translating to `%sp'"), i.tm.name);
4902     }
4903
4904   if (is_any_vex_encoding (&i.tm))
4905     {
4906       if (!cpu_arch_flags.bitfield.cpui286)
4907         {
4908           as_bad (_("instruction `%s' isn't supported outside of protected mode."),
4909                   i.tm.name);
4910           return;
4911         }
4912
4913       /* Check for explicit REX prefix.  */
4914       if (i.prefix[REX_PREFIX] || i.rex_encoding)
4915         {
4916           as_bad (_("REX prefix invalid with `%s'"), i.tm.name);
4917           return;
4918         }
4919
4920       if (i.tm.opcode_modifier.vex)
4921         build_vex_prefix (t);
4922       else
4923         build_evex_prefix ();
4924
4925       /* The individual REX.RXBW bits got consumed.  */
4926       i.rex &= REX_OPCODE;
4927     }
4928
4929   /* Handle conversion of 'int $3' --> special int3 insn.  XOP or FMA4
4930      instructions may define INT_OPCODE as well, so avoid this corner
4931      case for those instructions that use MODRM.  */
4932   if (i.tm.base_opcode == INT_OPCODE
4933       && !i.tm.opcode_modifier.modrm
4934       && i.op[0].imms->X_add_number == 3)
4935     {
4936       i.tm.base_opcode = INT3_OPCODE;
4937       i.imm_operands = 0;
4938     }
4939
4940   if ((i.tm.opcode_modifier.jump == JUMP
4941        || i.tm.opcode_modifier.jump == JUMP_BYTE
4942        || i.tm.opcode_modifier.jump == JUMP_DWORD)
4943       && i.op[0].disps->X_op == O_constant)
4944     {
4945       /* Convert "jmp constant" (and "call constant") to a jump (call) to
4946          the absolute address given by the constant.  Since ix86 jumps and
4947          calls are pc relative, we need to generate a reloc.  */
4948       i.op[0].disps->X_add_symbol = &abs_symbol;
4949       i.op[0].disps->X_op = O_symbol;
4950     }
4951
4952   /* For 8 bit registers we need an empty rex prefix.  Also if the
4953      instruction already has a prefix, we need to convert old
4954      registers to new ones.  */
4955
4956   if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
4957        && (i.op[0].regs->reg_flags & RegRex64) != 0)
4958       || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
4959           && (i.op[1].regs->reg_flags & RegRex64) != 0)
4960       || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
4961            || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
4962           && i.rex != 0))
4963     {
4964       int x;
4965
4966       i.rex |= REX_OPCODE;
4967       for (x = 0; x < 2; x++)
4968         {
4969           /* Look for 8 bit operand that uses old registers.  */
4970           if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
4971               && (i.op[x].regs->reg_flags & RegRex64) == 0)
4972             {
4973               gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4974               /* In case it is "hi" register, give up.  */
4975               if (i.op[x].regs->reg_num > 3)
4976                 as_bad (_("can't encode register '%s%s' in an "
4977                           "instruction requiring REX prefix."),
4978                         register_prefix, i.op[x].regs->reg_name);
4979
4980               /* Otherwise it is equivalent to the extended register.
4981                  Since the encoding doesn't change this is merely
4982                  cosmetic cleanup for debug output.  */
4983
4984               i.op[x].regs = i.op[x].regs + 8;
4985             }
4986         }
4987     }
4988
4989   if (i.rex == 0 && i.rex_encoding)
4990     {
4991       /* Check if we can add a REX_OPCODE byte.  Look for 8 bit operand
4992          that uses legacy register.  If it is "hi" register, don't add
4993          the REX_OPCODE byte.  */
4994       int x;
4995       for (x = 0; x < 2; x++)
4996         if (i.types[x].bitfield.class == Reg
4997             && i.types[x].bitfield.byte
4998             && (i.op[x].regs->reg_flags & RegRex64) == 0
4999             && i.op[x].regs->reg_num > 3)
5000           {
5001             gas_assert (!(i.op[x].regs->reg_flags & RegRex));
5002             i.rex_encoding = FALSE;
5003             break;
5004           }
5005
5006       if (i.rex_encoding)
5007         i.rex = REX_OPCODE;
5008     }
5009
5010   if (i.rex != 0)
5011     add_prefix (REX_OPCODE | i.rex);
5012
5013   insert_lfence_before ();
5014
5015   /* We are ready to output the insn.  */
5016   output_insn ();
5017
5018   insert_lfence_after ();
5019
5020   last_insn.seg = now_seg;
5021
5022   if (i.tm.opcode_modifier.isprefix)
5023     {
5024       last_insn.kind = last_insn_prefix;
5025       last_insn.name = i.tm.name;
5026       last_insn.file = as_where (&last_insn.line);
5027     }
5028   else
5029     last_insn.kind = last_insn_other;
5030 }
5031
5032 static char *
5033 parse_insn (char *line, char *mnemonic)
5034 {
5035   char *l = line;
5036   char *token_start = l;
5037   char *mnem_p;
5038   int supported;
5039   const insn_template *t;
5040   char *dot_p = NULL;
5041
5042   while (1)
5043     {
5044       mnem_p = mnemonic;
5045       while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
5046         {
5047           if (*mnem_p == '.')
5048             dot_p = mnem_p;
5049           mnem_p++;
5050           if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
5051             {
5052               as_bad (_("no such instruction: `%s'"), token_start);
5053               return NULL;
5054             }
5055           l++;
5056         }
5057       if (!is_space_char (*l)
5058           && *l != END_OF_INSN
5059           && (intel_syntax
5060               || (*l != PREFIX_SEPARATOR
5061                   && *l != ',')))
5062         {
5063           as_bad (_("invalid character %s in mnemonic"),
5064                   output_invalid (*l));
5065           return NULL;
5066         }
5067       if (token_start == l)
5068         {
5069           if (!intel_syntax && *l == PREFIX_SEPARATOR)
5070             as_bad (_("expecting prefix; got nothing"));
5071           else
5072             as_bad (_("expecting mnemonic; got nothing"));
5073           return NULL;
5074         }
5075
5076       /* Look up instruction (or prefix) via hash table.  */
5077       current_templates = (const templates *) str_hash_find (op_hash, mnemonic);
5078
5079       if (*l != END_OF_INSN
5080           && (!is_space_char (*l) || l[1] != END_OF_INSN)
5081           && current_templates
5082           && current_templates->start->opcode_modifier.isprefix)
5083         {
5084           if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
5085             {
5086               as_bad ((flag_code != CODE_64BIT
5087                        ? _("`%s' is only supported in 64-bit mode")
5088                        : _("`%s' is not supported in 64-bit mode")),
5089                       current_templates->start->name);
5090               return NULL;
5091             }
5092           /* If we are in 16-bit mode, do not allow addr16 or data16.
5093              Similarly, in 32-bit mode, do not allow addr32 or data32.  */
5094           if ((current_templates->start->opcode_modifier.size == SIZE16
5095                || current_templates->start->opcode_modifier.size == SIZE32)
5096               && flag_code != CODE_64BIT
5097               && ((current_templates->start->opcode_modifier.size == SIZE32)
5098                   ^ (flag_code == CODE_16BIT)))
5099             {
5100               as_bad (_("redundant %s prefix"),
5101                       current_templates->start->name);
5102               return NULL;
5103             }
5104           if (current_templates->start->opcode_length == 0)
5105             {
5106               /* Handle pseudo prefixes.  */
5107               switch (current_templates->start->base_opcode)
5108                 {
5109                 case Prefix_Disp8:
5110                   /* {disp8} */
5111                   i.disp_encoding = disp_encoding_8bit;
5112                   break;
5113                 case Prefix_Disp16:
5114                   /* {disp16} */
5115                   i.disp_encoding = disp_encoding_16bit;
5116                   break;
5117                 case Prefix_Disp32:
5118                   /* {disp32} */
5119                   i.disp_encoding = disp_encoding_32bit;
5120                   break;
5121                 case Prefix_Load:
5122                   /* {load} */
5123                   i.dir_encoding = dir_encoding_load;
5124                   break;
5125                 case Prefix_Store:
5126                   /* {store} */
5127                   i.dir_encoding = dir_encoding_store;
5128                   break;
5129                 case Prefix_VEX:
5130                   /* {vex} */
5131                   i.vec_encoding = vex_encoding_vex;
5132                   break;
5133                 case Prefix_VEX3:
5134                   /* {vex3} */
5135                   i.vec_encoding = vex_encoding_vex3;
5136                   break;
5137                 case Prefix_EVEX:
5138                   /* {evex} */
5139                   i.vec_encoding = vex_encoding_evex;
5140                   break;
5141                 case Prefix_REX:
5142                   /* {rex} */
5143                   i.rex_encoding = TRUE;
5144                   break;
5145                 case Prefix_NoOptimize:
5146                   /* {nooptimize} */
5147                   i.no_optimize = TRUE;
5148                   break;
5149                 default:
5150                   abort ();
5151                 }
5152             }
5153           else
5154             {
5155               /* Add prefix, checking for repeated prefixes.  */
5156               switch (add_prefix (current_templates->start->base_opcode))
5157                 {
5158                 case PREFIX_EXIST:
5159                   return NULL;
5160                 case PREFIX_DS:
5161                   if (current_templates->start->cpu_flags.bitfield.cpuibt)
5162                     i.notrack_prefix = current_templates->start->name;
5163                   break;
5164                 case PREFIX_REP:
5165                   if (current_templates->start->cpu_flags.bitfield.cpuhle)
5166                     i.hle_prefix = current_templates->start->name;
5167                   else if (current_templates->start->cpu_flags.bitfield.cpumpx)
5168                     i.bnd_prefix = current_templates->start->name;
5169                   else
5170                     i.rep_prefix = current_templates->start->name;
5171                   break;
5172                 default:
5173                   break;
5174                 }
5175             }
5176           /* Skip past PREFIX_SEPARATOR and reset token_start.  */
5177           token_start = ++l;
5178         }
5179       else
5180         break;
5181     }
5182
5183   if (!current_templates)
5184     {
5185       /* Deprecated functionality (new code should use pseudo-prefixes instead):
5186          Check if we should swap operand or force 32bit displacement in
5187          encoding.  */
5188       if (mnem_p - 2 == dot_p && dot_p[1] == 's')
5189         i.dir_encoding = dir_encoding_swap;
5190       else if (mnem_p - 3 == dot_p
5191                && dot_p[1] == 'd'
5192                && dot_p[2] == '8')
5193         i.disp_encoding = disp_encoding_8bit;
5194       else if (mnem_p - 4 == dot_p
5195                && dot_p[1] == 'd'
5196                && dot_p[2] == '3'
5197                && dot_p[3] == '2')
5198         i.disp_encoding = disp_encoding_32bit;
5199       else
5200         goto check_suffix;
5201       mnem_p = dot_p;
5202       *dot_p = '\0';
5203       current_templates = (const templates *) str_hash_find (op_hash, mnemonic);
5204     }
5205
5206   if (!current_templates)
5207     {
5208     check_suffix:
5209       if (mnem_p > mnemonic)
5210         {
5211           /* See if we can get a match by trimming off a suffix.  */
5212           switch (mnem_p[-1])
5213             {
5214             case WORD_MNEM_SUFFIX:
5215               if (intel_syntax && (intel_float_operand (mnemonic) & 2))
5216                 i.suffix = SHORT_MNEM_SUFFIX;
5217               else
5218                 /* Fall through.  */
5219               case BYTE_MNEM_SUFFIX:
5220               case QWORD_MNEM_SUFFIX:
5221                 i.suffix = mnem_p[-1];
5222               mnem_p[-1] = '\0';
5223               current_templates
5224                 = (const templates *) str_hash_find (op_hash, mnemonic);
5225               break;
5226             case SHORT_MNEM_SUFFIX:
5227             case LONG_MNEM_SUFFIX:
5228               if (!intel_syntax)
5229                 {
5230                   i.suffix = mnem_p[-1];
5231                   mnem_p[-1] = '\0';
5232                   current_templates
5233                     = (const templates *) str_hash_find (op_hash, mnemonic);
5234                 }
5235               break;
5236
5237               /* Intel Syntax.  */
5238             case 'd':
5239               if (intel_syntax)
5240                 {
5241                   if (intel_float_operand (mnemonic) == 1)
5242                     i.suffix = SHORT_MNEM_SUFFIX;
5243                   else
5244                     i.suffix = LONG_MNEM_SUFFIX;
5245                   mnem_p[-1] = '\0';
5246                   current_templates
5247                     = (const templates *) str_hash_find (op_hash, mnemonic);
5248                 }
5249               break;
5250             }
5251         }
5252
5253       if (!current_templates)
5254         {
5255           as_bad (_("no such instruction: `%s'"), token_start);
5256           return NULL;
5257         }
5258     }
5259
5260   if (current_templates->start->opcode_modifier.jump == JUMP
5261       || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
5262     {
5263       /* Check for a branch hint.  We allow ",pt" and ",pn" for
5264          predict taken and predict not taken respectively.
5265          I'm not sure that branch hints actually do anything on loop
5266          and jcxz insns (JumpByte) for current Pentium4 chips.  They
5267          may work in the future and it doesn't hurt to accept them
5268          now.  */
5269       if (l[0] == ',' && l[1] == 'p')
5270         {
5271           if (l[2] == 't')
5272             {
5273               if (!add_prefix (DS_PREFIX_OPCODE))
5274                 return NULL;
5275               l += 3;
5276             }
5277           else if (l[2] == 'n')
5278             {
5279               if (!add_prefix (CS_PREFIX_OPCODE))
5280                 return NULL;
5281               l += 3;
5282             }
5283         }
5284     }
5285   /* Any other comma loses.  */
5286   if (*l == ',')
5287     {
5288       as_bad (_("invalid character %s in mnemonic"),
5289               output_invalid (*l));
5290       return NULL;
5291     }
5292
5293   /* Check if instruction is supported on specified architecture.  */
5294   supported = 0;
5295   for (t = current_templates->start; t < current_templates->end; ++t)
5296     {
5297       supported |= cpu_flags_match (t);
5298       if (supported == CPU_FLAGS_PERFECT_MATCH)
5299         {
5300           if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
5301             as_warn (_("use .code16 to ensure correct addressing mode"));
5302
5303           return l;
5304         }
5305     }
5306
5307   if (!(supported & CPU_FLAGS_64BIT_MATCH))
5308     as_bad (flag_code == CODE_64BIT
5309             ? _("`%s' is not supported in 64-bit mode")
5310             : _("`%s' is only supported in 64-bit mode"),
5311             current_templates->start->name);
5312   else
5313     as_bad (_("`%s' is not supported on `%s%s'"),
5314             current_templates->start->name,
5315             cpu_arch_name ? cpu_arch_name : default_arch,
5316             cpu_sub_arch_name ? cpu_sub_arch_name : "");
5317
5318   return NULL;
5319 }
5320
5321 static char *
5322 parse_operands (char *l, const char *mnemonic)
5323 {
5324   char *token_start;
5325
5326   /* 1 if operand is pending after ','.  */
5327   unsigned int expecting_operand = 0;
5328
5329   /* Non-zero if operand parens not balanced.  */
5330   unsigned int paren_not_balanced;
5331
5332   while (*l != END_OF_INSN)
5333     {
5334       /* Skip optional white space before operand.  */
5335       if (is_space_char (*l))
5336         ++l;
5337       if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
5338         {
5339           as_bad (_("invalid character %s before operand %d"),
5340                   output_invalid (*l),
5341                   i.operands + 1);
5342           return NULL;
5343         }
5344       token_start = l;  /* After white space.  */
5345       paren_not_balanced = 0;
5346       while (paren_not_balanced || *l != ',')
5347         {
5348           if (*l == END_OF_INSN)
5349             {
5350               if (paren_not_balanced)
5351                 {
5352                   if (!intel_syntax)
5353                     as_bad (_("unbalanced parenthesis in operand %d."),
5354                             i.operands + 1);
5355                   else
5356                     as_bad (_("unbalanced brackets in operand %d."),
5357                             i.operands + 1);
5358                   return NULL;
5359                 }
5360               else
5361                 break;  /* we are done */
5362             }
5363           else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
5364             {
5365               as_bad (_("invalid character %s in operand %d"),
5366                       output_invalid (*l),
5367                       i.operands + 1);
5368               return NULL;
5369             }
5370           if (!intel_syntax)
5371             {
5372               if (*l == '(')
5373                 ++paren_not_balanced;
5374               if (*l == ')')
5375                 --paren_not_balanced;
5376             }
5377           else
5378             {
5379               if (*l == '[')
5380                 ++paren_not_balanced;
5381               if (*l == ']')
5382                 --paren_not_balanced;
5383             }
5384           l++;
5385         }
5386       if (l != token_start)
5387         {                       /* Yes, we've read in another operand.  */
5388           unsigned int operand_ok;
5389           this_operand = i.operands++;
5390           if (i.operands > MAX_OPERANDS)
5391             {
5392               as_bad (_("spurious operands; (%d operands/instruction max)"),
5393                       MAX_OPERANDS);
5394               return NULL;
5395             }
5396           i.types[this_operand].bitfield.unspecified = 1;
5397           /* Now parse operand adding info to 'i' as we go along.  */
5398           END_STRING_AND_SAVE (l);
5399
5400           if (i.mem_operands > 1)
5401             {
5402               as_bad (_("too many memory references for `%s'"),
5403                       mnemonic);
5404               return 0;
5405             }
5406
5407           if (intel_syntax)
5408             operand_ok =
5409               i386_intel_operand (token_start,
5410                                   intel_float_operand (mnemonic));
5411           else
5412             operand_ok = i386_att_operand (token_start);
5413
5414           RESTORE_END_STRING (l);
5415           if (!operand_ok)
5416             return NULL;
5417         }
5418       else
5419         {
5420           if (expecting_operand)
5421             {
5422             expecting_operand_after_comma:
5423               as_bad (_("expecting operand after ','; got nothing"));
5424               return NULL;
5425             }
5426           if (*l == ',')
5427             {
5428               as_bad (_("expecting operand before ','; got nothing"));
5429               return NULL;
5430             }
5431         }
5432
5433       /* Now *l must be either ',' or END_OF_INSN.  */
5434       if (*l == ',')
5435         {
5436           if (*++l == END_OF_INSN)
5437             {
5438               /* Just skip it, if it's \n complain.  */
5439               goto expecting_operand_after_comma;
5440             }
5441           expecting_operand = 1;
5442         }
5443     }
5444   return l;
5445 }
5446
5447 static void
5448 swap_2_operands (int xchg1, int xchg2)
5449 {
5450   union i386_op temp_op;
5451   i386_operand_type temp_type;
5452   unsigned int temp_flags;
5453   enum bfd_reloc_code_real temp_reloc;
5454
5455   temp_type = i.types[xchg2];
5456   i.types[xchg2] = i.types[xchg1];
5457   i.types[xchg1] = temp_type;
5458
5459   temp_flags = i.flags[xchg2];
5460   i.flags[xchg2] = i.flags[xchg1];
5461   i.flags[xchg1] = temp_flags;
5462
5463   temp_op = i.op[xchg2];
5464   i.op[xchg2] = i.op[xchg1];
5465   i.op[xchg1] = temp_op;
5466
5467   temp_reloc = i.reloc[xchg2];
5468   i.reloc[xchg2] = i.reloc[xchg1];
5469   i.reloc[xchg1] = temp_reloc;
5470
5471   if (i.mask)
5472     {
5473       if (i.mask->operand == xchg1)
5474         i.mask->operand = xchg2;
5475       else if (i.mask->operand == xchg2)
5476         i.mask->operand = xchg1;
5477     }
5478   if (i.broadcast)
5479     {
5480       if (i.broadcast->operand == xchg1)
5481         i.broadcast->operand = xchg2;
5482       else if (i.broadcast->operand == xchg2)
5483         i.broadcast->operand = xchg1;
5484     }
5485   if (i.rounding)
5486     {
5487       if (i.rounding->operand == xchg1)
5488         i.rounding->operand = xchg2;
5489       else if (i.rounding->operand == xchg2)
5490         i.rounding->operand = xchg1;
5491     }
5492 }
5493
5494 static void
5495 swap_operands (void)
5496 {
5497   switch (i.operands)
5498     {
5499     case 5:
5500     case 4:
5501       swap_2_operands (1, i.operands - 2);
5502       /* Fall through.  */
5503     case 3:
5504     case 2:
5505       swap_2_operands (0, i.operands - 1);
5506       break;
5507     default:
5508       abort ();
5509     }
5510
5511   if (i.mem_operands == 2)
5512     {
5513       const seg_entry *temp_seg;
5514       temp_seg = i.seg[0];
5515       i.seg[0] = i.seg[1];
5516       i.seg[1] = temp_seg;
5517     }
5518 }
5519
5520 /* Try to ensure constant immediates are represented in the smallest
5521    opcode possible.  */
5522 static void
5523 optimize_imm (void)
5524 {
5525   char guess_suffix = 0;
5526   int op;
5527
5528   if (i.suffix)
5529     guess_suffix = i.suffix;
5530   else if (i.reg_operands)
5531     {
5532       /* Figure out a suffix from the last register operand specified.
5533          We can't do this properly yet, i.e. excluding special register
5534          instances, but the following works for instructions with
5535          immediates.  In any case, we can't set i.suffix yet.  */
5536       for (op = i.operands; --op >= 0;)
5537         if (i.types[op].bitfield.class != Reg)
5538           continue;
5539         else if (i.types[op].bitfield.byte)
5540           {
5541             guess_suffix = BYTE_MNEM_SUFFIX;
5542             break;
5543           }
5544         else if (i.types[op].bitfield.word)
5545           {
5546             guess_suffix = WORD_MNEM_SUFFIX;
5547             break;
5548           }
5549         else if (i.types[op].bitfield.dword)
5550           {
5551             guess_suffix = LONG_MNEM_SUFFIX;
5552             break;
5553           }
5554         else if (i.types[op].bitfield.qword)
5555           {
5556             guess_suffix = QWORD_MNEM_SUFFIX;
5557             break;
5558           }
5559     }
5560   else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5561     guess_suffix = WORD_MNEM_SUFFIX;
5562
5563   for (op = i.operands; --op >= 0;)
5564     if (operand_type_check (i.types[op], imm))
5565       {
5566         switch (i.op[op].imms->X_op)
5567           {
5568           case O_constant:
5569             /* If a suffix is given, this operand may be shortened.  */
5570             switch (guess_suffix)
5571               {
5572               case LONG_MNEM_SUFFIX:
5573                 i.types[op].bitfield.imm32 = 1;
5574                 i.types[op].bitfield.imm64 = 1;
5575                 break;
5576               case WORD_MNEM_SUFFIX:
5577                 i.types[op].bitfield.imm16 = 1;
5578                 i.types[op].bitfield.imm32 = 1;
5579                 i.types[op].bitfield.imm32s = 1;
5580                 i.types[op].bitfield.imm64 = 1;
5581                 break;
5582               case BYTE_MNEM_SUFFIX:
5583                 i.types[op].bitfield.imm8 = 1;
5584                 i.types[op].bitfield.imm8s = 1;
5585                 i.types[op].bitfield.imm16 = 1;
5586                 i.types[op].bitfield.imm32 = 1;
5587                 i.types[op].bitfield.imm32s = 1;
5588                 i.types[op].bitfield.imm64 = 1;
5589                 break;
5590               }
5591
5592             /* If this operand is at most 16 bits, convert it
5593                to a signed 16 bit number before trying to see
5594                whether it will fit in an even smaller size.
5595                This allows a 16-bit operand such as $0xffe0 to
5596                be recognised as within Imm8S range.  */
5597             if ((i.types[op].bitfield.imm16)
5598                 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
5599               {
5600                 i.op[op].imms->X_add_number =
5601                   (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5602               }
5603 #ifdef BFD64
5604             /* Store 32-bit immediate in 64-bit for 64-bit BFD.  */
5605             if ((i.types[op].bitfield.imm32)
5606                 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5607                     == 0))
5608               {
5609                 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5610                                                 ^ ((offsetT) 1 << 31))
5611                                                - ((offsetT) 1 << 31));
5612               }
5613 #endif
5614             i.types[op]
5615               = operand_type_or (i.types[op],
5616                                  smallest_imm_type (i.op[op].imms->X_add_number));
5617
5618             /* We must avoid matching of Imm32 templates when 64bit
5619                only immediate is available.  */
5620             if (guess_suffix == QWORD_MNEM_SUFFIX)
5621               i.types[op].bitfield.imm32 = 0;
5622             break;
5623
5624           case O_absent:
5625           case O_register:
5626             abort ();
5627
5628             /* Symbols and expressions.  */
5629           default:
5630             /* Convert symbolic operand to proper sizes for matching, but don't
5631                prevent matching a set of insns that only supports sizes other
5632                than those matching the insn suffix.  */
5633             {
5634               i386_operand_type mask, allowed;
5635               const insn_template *t;
5636
5637               operand_type_set (&mask, 0);
5638               operand_type_set (&allowed, 0);
5639
5640               for (t = current_templates->start;
5641                    t < current_templates->end;
5642                    ++t)
5643                 {
5644                   allowed = operand_type_or (allowed, t->operand_types[op]);
5645                   allowed = operand_type_and (allowed, anyimm);
5646                 }
5647               switch (guess_suffix)
5648                 {
5649                 case QWORD_MNEM_SUFFIX:
5650                   mask.bitfield.imm64 = 1;
5651                   mask.bitfield.imm32s = 1;
5652                   break;
5653                 case LONG_MNEM_SUFFIX:
5654                   mask.bitfield.imm32 = 1;
5655                   break;
5656                 case WORD_MNEM_SUFFIX:
5657                   mask.bitfield.imm16 = 1;
5658                   break;
5659                 case BYTE_MNEM_SUFFIX:
5660                   mask.bitfield.imm8 = 1;
5661                   break;
5662                 default:
5663                   break;
5664                 }
5665               allowed = operand_type_and (mask, allowed);
5666               if (!operand_type_all_zero (&allowed))
5667                 i.types[op] = operand_type_and (i.types[op], mask);
5668             }
5669             break;
5670           }
5671       }
5672 }
5673
5674 /* Try to use the smallest displacement type too.  */
5675 static void
5676 optimize_disp (void)
5677 {
5678   int op;
5679
5680   for (op = i.operands; --op >= 0;)
5681     if (operand_type_check (i.types[op], disp))
5682       {
5683         if (i.op[op].disps->X_op == O_constant)
5684           {
5685             offsetT op_disp = i.op[op].disps->X_add_number;
5686
5687             if (i.types[op].bitfield.disp16
5688                 && (op_disp & ~(offsetT) 0xffff) == 0)
5689               {
5690                 /* If this operand is at most 16 bits, convert
5691                    to a signed 16 bit number and don't use 64bit
5692                    displacement.  */
5693                 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5694                 i.types[op].bitfield.disp64 = 0;
5695               }
5696 #ifdef BFD64
5697             /* Optimize 64-bit displacement to 32-bit for 64-bit BFD.  */
5698             if (i.types[op].bitfield.disp32
5699                 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5700               {
5701                 /* If this operand is at most 32 bits, convert
5702                    to a signed 32 bit number and don't use 64bit
5703                    displacement.  */
5704                 op_disp &= (((offsetT) 2 << 31) - 1);
5705                 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5706                 i.types[op].bitfield.disp64 = 0;
5707               }
5708 #endif
5709             if (!op_disp && i.types[op].bitfield.baseindex)
5710               {
5711                 i.types[op].bitfield.disp8 = 0;
5712                 i.types[op].bitfield.disp16 = 0;
5713                 i.types[op].bitfield.disp32 = 0;
5714                 i.types[op].bitfield.disp32s = 0;
5715                 i.types[op].bitfield.disp64 = 0;
5716                 i.op[op].disps = 0;
5717                 i.disp_operands--;
5718               }
5719             else if (flag_code == CODE_64BIT)
5720               {
5721                 if (fits_in_signed_long (op_disp))
5722                   {
5723                     i.types[op].bitfield.disp64 = 0;
5724                     i.types[op].bitfield.disp32s = 1;
5725                   }
5726                 if (i.prefix[ADDR_PREFIX]
5727                     && fits_in_unsigned_long (op_disp))
5728                   i.types[op].bitfield.disp32 = 1;
5729               }
5730             if ((i.types[op].bitfield.disp32
5731                  || i.types[op].bitfield.disp32s
5732                  || i.types[op].bitfield.disp16)
5733                 && fits_in_disp8 (op_disp))
5734               i.types[op].bitfield.disp8 = 1;
5735           }
5736         else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5737                  || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5738           {
5739             fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5740                          i.op[op].disps, 0, i.reloc[op]);
5741             i.types[op].bitfield.disp8 = 0;
5742             i.types[op].bitfield.disp16 = 0;
5743             i.types[op].bitfield.disp32 = 0;
5744             i.types[op].bitfield.disp32s = 0;
5745             i.types[op].bitfield.disp64 = 0;
5746           }
5747         else
5748           /* We only support 64bit displacement on constants.  */
5749           i.types[op].bitfield.disp64 = 0;
5750       }
5751 }
5752
5753 /* Return 1 if there is a match in broadcast bytes between operand
5754    GIVEN and instruction template T.   */
5755
5756 static INLINE int
5757 match_broadcast_size (const insn_template *t, unsigned int given)
5758 {
5759   return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5760            && i.types[given].bitfield.byte)
5761           || (t->opcode_modifier.broadcast == WORD_BROADCAST
5762               && i.types[given].bitfield.word)
5763           || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5764               && i.types[given].bitfield.dword)
5765           || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5766               && i.types[given].bitfield.qword));
5767 }
5768
5769 /* Check if operands are valid for the instruction.  */
5770
5771 static int
5772 check_VecOperands (const insn_template *t)
5773 {
5774   unsigned int op;
5775   i386_cpu_flags cpu;
5776
5777   /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5778      any one operand are implicity requiring AVX512VL support if the actual
5779      operand size is YMMword or XMMword.  Since this function runs after
5780      template matching, there's no need to check for YMMword/XMMword in
5781      the template.  */
5782   cpu = cpu_flags_and (t->cpu_flags, avx512);
5783   if (!cpu_flags_all_zero (&cpu)
5784       && !t->cpu_flags.bitfield.cpuavx512vl
5785       && !cpu_arch_flags.bitfield.cpuavx512vl)
5786     {
5787       for (op = 0; op < t->operands; ++op)
5788         {
5789           if (t->operand_types[op].bitfield.zmmword
5790               && (i.types[op].bitfield.ymmword
5791                   || i.types[op].bitfield.xmmword))
5792             {
5793               i.error = unsupported;
5794               return 1;
5795             }
5796         }
5797     }
5798
5799   /* Without VSIB byte, we can't have a vector register for index.  */
5800   if (!t->opcode_modifier.sib
5801       && i.index_reg
5802       && (i.index_reg->reg_type.bitfield.xmmword
5803           || i.index_reg->reg_type.bitfield.ymmword
5804           || i.index_reg->reg_type.bitfield.zmmword))
5805     {
5806       i.error = unsupported_vector_index_register;
5807       return 1;
5808     }
5809
5810   /* Check if default mask is allowed.  */
5811   if (t->opcode_modifier.nodefmask
5812       && (!i.mask || i.mask->mask->reg_num == 0))
5813     {
5814       i.error = no_default_mask;
5815       return 1;
5816     }
5817
5818   /* For VSIB byte, we need a vector register for index, and all vector
5819      registers must be distinct.  */
5820   if (t->opcode_modifier.sib && t->opcode_modifier.sib != SIBMEM)
5821     {
5822       if (!i.index_reg
5823           || !((t->opcode_modifier.sib == VECSIB128
5824                 && i.index_reg->reg_type.bitfield.xmmword)
5825                || (t->opcode_modifier.sib == VECSIB256
5826                    && i.index_reg->reg_type.bitfield.ymmword)
5827                || (t->opcode_modifier.sib == VECSIB512
5828                    && i.index_reg->reg_type.bitfield.zmmword)))
5829       {
5830         i.error = invalid_vsib_address;
5831         return 1;
5832       }
5833
5834       gas_assert (i.reg_operands == 2 || i.mask);
5835       if (i.reg_operands == 2 && !i.mask)
5836         {
5837           gas_assert (i.types[0].bitfield.class == RegSIMD);
5838           gas_assert (i.types[0].bitfield.xmmword
5839                       || i.types[0].bitfield.ymmword);
5840           gas_assert (i.types[2].bitfield.class == RegSIMD);
5841           gas_assert (i.types[2].bitfield.xmmword
5842                       || i.types[2].bitfield.ymmword);
5843           if (operand_check == check_none)
5844             return 0;
5845           if (register_number (i.op[0].regs)
5846               != register_number (i.index_reg)
5847               && register_number (i.op[2].regs)
5848                  != register_number (i.index_reg)
5849               && register_number (i.op[0].regs)
5850                  != register_number (i.op[2].regs))
5851             return 0;
5852           if (operand_check == check_error)
5853             {
5854               i.error = invalid_vector_register_set;
5855               return 1;
5856             }
5857           as_warn (_("mask, index, and destination registers should be distinct"));
5858         }
5859       else if (i.reg_operands == 1 && i.mask)
5860         {
5861           if (i.types[1].bitfield.class == RegSIMD
5862               && (i.types[1].bitfield.xmmword
5863                   || i.types[1].bitfield.ymmword
5864                   || i.types[1].bitfield.zmmword)
5865               && (register_number (i.op[1].regs)
5866                   == register_number (i.index_reg)))
5867             {
5868               if (operand_check == check_error)
5869                 {
5870                   i.error = invalid_vector_register_set;
5871                   return 1;
5872                 }
5873               if (operand_check != check_none)
5874                 as_warn (_("index and destination registers should be distinct"));
5875             }
5876         }
5877     }
5878
5879   /* For AMX instructions with three tmmword operands, all tmmword operand must be
5880      distinct */
5881   if (t->operand_types[0].bitfield.tmmword
5882       && i.reg_operands == 3)
5883     {
5884       if (register_number (i.op[0].regs)
5885           == register_number (i.op[1].regs)
5886           || register_number (i.op[0].regs)
5887              == register_number (i.op[2].regs)
5888           || register_number (i.op[1].regs)
5889              == register_number (i.op[2].regs))
5890         {
5891           i.error = invalid_tmm_register_set;
5892           return 1;
5893         }
5894     }
5895
5896   /* Check if broadcast is supported by the instruction and is applied
5897      to the memory operand.  */
5898   if (i.broadcast)
5899     {
5900       i386_operand_type type, overlap;
5901
5902       /* Check if specified broadcast is supported in this instruction,
5903          and its broadcast bytes match the memory operand.  */
5904       op = i.broadcast->operand;
5905       if (!t->opcode_modifier.broadcast
5906           || !(i.flags[op] & Operand_Mem)
5907           || (!i.types[op].bitfield.unspecified
5908               && !match_broadcast_size (t, op)))
5909         {
5910         bad_broadcast:
5911           i.error = unsupported_broadcast;
5912           return 1;
5913         }
5914
5915       i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5916                             * i.broadcast->type);
5917       operand_type_set (&type, 0);
5918       switch (i.broadcast->bytes)
5919         {
5920         case 2:
5921           type.bitfield.word = 1;
5922           break;
5923         case 4:
5924           type.bitfield.dword = 1;
5925           break;
5926         case 8:
5927           type.bitfield.qword = 1;
5928           break;
5929         case 16:
5930           type.bitfield.xmmword = 1;
5931           break;
5932         case 32:
5933           type.bitfield.ymmword = 1;
5934           break;
5935         case 64:
5936           type.bitfield.zmmword = 1;
5937           break;
5938         default:
5939           goto bad_broadcast;
5940         }
5941
5942       overlap = operand_type_and (type, t->operand_types[op]);
5943       if (t->operand_types[op].bitfield.class == RegSIMD
5944           && t->operand_types[op].bitfield.byte
5945              + t->operand_types[op].bitfield.word
5946              + t->operand_types[op].bitfield.dword
5947              + t->operand_types[op].bitfield.qword > 1)
5948         {
5949           overlap.bitfield.xmmword = 0;
5950           overlap.bitfield.ymmword = 0;
5951           overlap.bitfield.zmmword = 0;
5952         }
5953       if (operand_type_all_zero (&overlap))
5954           goto bad_broadcast;
5955
5956       if (t->opcode_modifier.checkregsize)
5957         {
5958           unsigned int j;
5959
5960           type.bitfield.baseindex = 1;
5961           for (j = 0; j < i.operands; ++j)
5962             {
5963               if (j != op
5964                   && !operand_type_register_match(i.types[j],
5965                                                   t->operand_types[j],
5966                                                   type,
5967                                                   t->operand_types[op]))
5968                 goto bad_broadcast;
5969             }
5970         }
5971     }
5972   /* If broadcast is supported in this instruction, we need to check if
5973      operand of one-element size isn't specified without broadcast.  */
5974   else if (t->opcode_modifier.broadcast && i.mem_operands)
5975     {
5976       /* Find memory operand.  */
5977       for (op = 0; op < i.operands; op++)
5978         if (i.flags[op] & Operand_Mem)
5979           break;
5980       gas_assert (op < i.operands);
5981       /* Check size of the memory operand.  */
5982       if (match_broadcast_size (t, op))
5983         {
5984           i.error = broadcast_needed;
5985           return 1;
5986         }
5987     }
5988   else
5989     op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning.  */
5990
5991   /* Check if requested masking is supported.  */
5992   if (i.mask)
5993     {
5994       switch (t->opcode_modifier.masking)
5995         {
5996         case BOTH_MASKING:
5997           break;
5998         case MERGING_MASKING:
5999           if (i.mask->zeroing)
6000             {
6001         case 0:
6002               i.error = unsupported_masking;
6003               return 1;
6004             }
6005           break;
6006         case DYNAMIC_MASKING:
6007           /* Memory destinations allow only merging masking.  */
6008           if (i.mask->zeroing && i.mem_operands)
6009             {
6010               /* Find memory operand.  */
6011               for (op = 0; op < i.operands; op++)
6012                 if (i.flags[op] & Operand_Mem)
6013                   break;
6014               gas_assert (op < i.operands);
6015               if (op == i.operands - 1)
6016                 {
6017                   i.error = unsupported_masking;
6018                   return 1;
6019                 }
6020             }
6021           break;
6022         default:
6023           abort ();
6024         }
6025     }
6026
6027   /* Check if masking is applied to dest operand.  */
6028   if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
6029     {
6030       i.error = mask_not_on_destination;
6031       return 1;
6032     }
6033
6034   /* Check RC/SAE.  */
6035   if (i.rounding)
6036     {
6037       if (!t->opcode_modifier.sae
6038           || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
6039         {
6040           i.error = unsupported_rc_sae;
6041           return 1;
6042         }
6043       /* If the instruction has several immediate operands and one of
6044          them is rounding, the rounding operand should be the last
6045          immediate operand.  */
6046       if (i.imm_operands > 1
6047           && i.rounding->operand != (int) (i.imm_operands - 1))
6048         {
6049           i.error = rc_sae_operand_not_last_imm;
6050           return 1;
6051         }
6052     }
6053
6054   /* Check the special Imm4 cases; must be the first operand.  */
6055   if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
6056     {
6057       if (i.op[0].imms->X_op != O_constant
6058           || !fits_in_imm4 (i.op[0].imms->X_add_number))
6059         {
6060           i.error = bad_imm4;
6061           return 1;
6062         }
6063
6064       /* Turn off Imm<N> so that update_imm won't complain.  */
6065       operand_type_set (&i.types[0], 0);
6066     }
6067
6068   /* Check vector Disp8 operand.  */
6069   if (t->opcode_modifier.disp8memshift
6070       && i.disp_encoding != disp_encoding_32bit)
6071     {
6072       if (i.broadcast)
6073         i.memshift = t->opcode_modifier.broadcast - 1;
6074       else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
6075         i.memshift = t->opcode_modifier.disp8memshift;
6076       else
6077         {
6078           const i386_operand_type *type = NULL;
6079
6080           i.memshift = 0;
6081           for (op = 0; op < i.operands; op++)
6082             if (i.flags[op] & Operand_Mem)
6083               {
6084                 if (t->opcode_modifier.evex == EVEXLIG)
6085                   i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
6086                 else if (t->operand_types[op].bitfield.xmmword
6087                          + t->operand_types[op].bitfield.ymmword
6088                          + t->operand_types[op].bitfield.zmmword <= 1)
6089                   type = &t->operand_types[op];
6090                 else if (!i.types[op].bitfield.unspecified)
6091                   type = &i.types[op];
6092               }
6093             else if (i.types[op].bitfield.class == RegSIMD
6094                      && t->opcode_modifier.evex != EVEXLIG)
6095               {
6096                 if (i.types[op].bitfield.zmmword)
6097                   i.memshift = 6;
6098                 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
6099                   i.memshift = 5;
6100                 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
6101                   i.memshift = 4;
6102               }
6103
6104           if (type)
6105             {
6106               if (type->bitfield.zmmword)
6107                 i.memshift = 6;
6108               else if (type->bitfield.ymmword)
6109                 i.memshift = 5;
6110               else if (type->bitfield.xmmword)
6111                 i.memshift = 4;
6112             }
6113
6114           /* For the check in fits_in_disp8().  */
6115           if (i.memshift == 0)
6116             i.memshift = -1;
6117         }
6118
6119       for (op = 0; op < i.operands; op++)
6120         if (operand_type_check (i.types[op], disp)
6121             && i.op[op].disps->X_op == O_constant)
6122           {
6123             if (fits_in_disp8 (i.op[op].disps->X_add_number))
6124               {
6125                 i.types[op].bitfield.disp8 = 1;
6126                 return 0;
6127               }
6128             i.types[op].bitfield.disp8 = 0;
6129           }
6130     }
6131
6132   i.memshift = 0;
6133
6134   return 0;
6135 }
6136
6137 /* Check if encoding requirements are met by the instruction.  */
6138
6139 static int
6140 VEX_check_encoding (const insn_template *t)
6141 {
6142   if (i.vec_encoding == vex_encoding_error)
6143     {
6144       i.error = unsupported;
6145       return 1;
6146     }
6147
6148   if (i.vec_encoding == vex_encoding_evex)
6149     {
6150       /* This instruction must be encoded with EVEX prefix.  */
6151       if (!is_evex_encoding (t))
6152         {
6153           i.error = unsupported;
6154           return 1;
6155         }
6156       return 0;
6157     }
6158
6159   if (!t->opcode_modifier.vex)
6160     {
6161       /* This instruction template doesn't have VEX prefix.  */
6162       if (i.vec_encoding != vex_encoding_default)
6163         {
6164           i.error = unsupported;
6165           return 1;
6166         }
6167       return 0;
6168     }
6169
6170   return 0;
6171 }
6172
6173 static const insn_template *
6174 match_template (char mnem_suffix)
6175 {
6176   /* Points to template once we've found it.  */
6177   const insn_template *t;
6178   i386_operand_type overlap0, overlap1, overlap2, overlap3;
6179   i386_operand_type overlap4;
6180   unsigned int found_reverse_match;
6181   i386_opcode_modifier suffix_check;
6182   i386_operand_type operand_types [MAX_OPERANDS];
6183   int addr_prefix_disp;
6184   unsigned int j, size_match, check_register;
6185   enum i386_error specific_error = 0;
6186
6187 #if MAX_OPERANDS != 5
6188 # error "MAX_OPERANDS must be 5."
6189 #endif
6190
6191   found_reverse_match = 0;
6192   addr_prefix_disp = -1;
6193
6194   /* Prepare for mnemonic suffix check.  */
6195   memset (&suffix_check, 0, sizeof (suffix_check));
6196   switch (mnem_suffix)
6197     {
6198     case BYTE_MNEM_SUFFIX:
6199       suffix_check.no_bsuf = 1;
6200       break;
6201     case WORD_MNEM_SUFFIX:
6202       suffix_check.no_wsuf = 1;
6203       break;
6204     case SHORT_MNEM_SUFFIX:
6205       suffix_check.no_ssuf = 1;
6206       break;
6207     case LONG_MNEM_SUFFIX:
6208       suffix_check.no_lsuf = 1;
6209       break;
6210     case QWORD_MNEM_SUFFIX:
6211       suffix_check.no_qsuf = 1;
6212       break;
6213     default:
6214       /* NB: In Intel syntax, normally we can check for memory operand
6215          size when there is no mnemonic suffix.  But jmp and call have
6216          2 different encodings with Dword memory operand size, one with
6217          No_ldSuf and the other without.  i.suffix is set to
6218          LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf.  */
6219       if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
6220         suffix_check.no_ldsuf = 1;
6221     }
6222
6223   /* Must have right number of operands.  */
6224   i.error = number_of_operands_mismatch;
6225
6226   for (t = current_templates->start; t < current_templates->end; t++)
6227     {
6228       addr_prefix_disp = -1;
6229       found_reverse_match = 0;
6230
6231       if (i.operands != t->operands)
6232         continue;
6233
6234       /* Check processor support.  */
6235       i.error = unsupported;
6236       if (cpu_flags_match (t) != CPU_FLAGS_PERFECT_MATCH)
6237         continue;
6238
6239       /* Check Pseudo Prefix.  */
6240       i.error = unsupported;
6241       if (t->opcode_modifier.pseudovexprefix
6242           && !(i.vec_encoding == vex_encoding_vex
6243               || i.vec_encoding == vex_encoding_vex3))
6244         continue;
6245
6246       /* Check AT&T mnemonic.   */
6247       i.error = unsupported_with_intel_mnemonic;
6248       if (intel_mnemonic && t->opcode_modifier.attmnemonic)
6249         continue;
6250
6251       /* Check AT&T/Intel syntax.  */
6252       i.error = unsupported_syntax;
6253       if ((intel_syntax && t->opcode_modifier.attsyntax)
6254           || (!intel_syntax && t->opcode_modifier.intelsyntax))
6255         continue;
6256
6257       /* Check Intel64/AMD64 ISA.   */
6258       switch (isa64)
6259         {
6260         default:
6261           /* Default: Don't accept Intel64.  */
6262           if (t->opcode_modifier.isa64 == INTEL64)
6263             continue;
6264           break;
6265         case amd64:
6266           /* -mamd64: Don't accept Intel64 and Intel64 only.  */
6267           if (t->opcode_modifier.isa64 >= INTEL64)
6268             continue;
6269           break;
6270         case intel64:
6271           /* -mintel64: Don't accept AMD64.  */
6272           if (t->opcode_modifier.isa64 == AMD64 && flag_code == CODE_64BIT)
6273             continue;
6274           break;
6275         }
6276
6277       /* Check the suffix.  */
6278       i.error = invalid_instruction_suffix;
6279       if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
6280           || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
6281           || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
6282           || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
6283           || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
6284           || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
6285         continue;
6286
6287       size_match = operand_size_match (t);
6288       if (!size_match)
6289         continue;
6290
6291       /* This is intentionally not
6292
6293          if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
6294
6295          as the case of a missing * on the operand is accepted (perhaps with
6296          a warning, issued further down).  */
6297       if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
6298         {
6299           i.error = operand_type_mismatch;
6300           continue;
6301         }
6302
6303       for (j = 0; j < MAX_OPERANDS; j++)
6304         operand_types[j] = t->operand_types[j];
6305
6306       /* In general, don't allow
6307          - 64-bit operands outside of 64-bit mode,
6308          - 32-bit operands on pre-386.  */
6309       j = i.imm_operands + (t->operands > i.imm_operands + 1);
6310       if (((i.suffix == QWORD_MNEM_SUFFIX
6311             && flag_code != CODE_64BIT
6312             && !(t->base_opcode == 0xfc7
6313                  && i.tm.opcode_modifier.opcodeprefix == PREFIX_NONE
6314                  && t->extension_opcode == 1) /* cmpxchg8b */)
6315            || (i.suffix == LONG_MNEM_SUFFIX
6316                && !cpu_arch_flags.bitfield.cpui386))
6317           && (intel_syntax
6318               ? (t->opcode_modifier.mnemonicsize != IGNORESIZE
6319                  && !intel_float_operand (t->name))
6320               : intel_float_operand (t->name) != 2)
6321           && (t->operands == i.imm_operands
6322               || (operand_types[i.imm_operands].bitfield.class != RegMMX
6323                && operand_types[i.imm_operands].bitfield.class != RegSIMD
6324                && operand_types[i.imm_operands].bitfield.class != RegMask)
6325               || (operand_types[j].bitfield.class != RegMMX
6326                   && operand_types[j].bitfield.class != RegSIMD
6327                   && operand_types[j].bitfield.class != RegMask))
6328           && !t->opcode_modifier.sib)
6329         continue;
6330
6331       /* Do not verify operands when there are none.  */
6332       if (!t->operands)
6333         {
6334           if (VEX_check_encoding (t))
6335             {
6336               specific_error = i.error;
6337               continue;
6338             }
6339
6340           /* We've found a match; break out of loop.  */
6341           break;
6342         }
6343
6344       if (!t->opcode_modifier.jump
6345           || t->opcode_modifier.jump == JUMP_ABSOLUTE)
6346         {
6347           /* There should be only one Disp operand.  */
6348           for (j = 0; j < MAX_OPERANDS; j++)
6349             if (operand_type_check (operand_types[j], disp))
6350               break;
6351           if (j < MAX_OPERANDS)
6352             {
6353               bfd_boolean override = (i.prefix[ADDR_PREFIX] != 0);
6354
6355               addr_prefix_disp = j;
6356
6357               /* Address size prefix will turn Disp64/Disp32S/Disp32/Disp16
6358                  operand into Disp32/Disp32/Disp16/Disp32 operand.  */
6359               switch (flag_code)
6360                 {
6361                 case CODE_16BIT:
6362                   override = !override;
6363                   /* Fall through.  */
6364                 case CODE_32BIT:
6365                   if (operand_types[j].bitfield.disp32
6366                       && operand_types[j].bitfield.disp16)
6367                     {
6368                       operand_types[j].bitfield.disp16 = override;
6369                       operand_types[j].bitfield.disp32 = !override;
6370                     }
6371                   operand_types[j].bitfield.disp32s = 0;
6372                   operand_types[j].bitfield.disp64 = 0;
6373                   break;
6374
6375                 case CODE_64BIT:
6376                   if (operand_types[j].bitfield.disp32s
6377                       || operand_types[j].bitfield.disp64)
6378                     {
6379                       operand_types[j].bitfield.disp64 &= !override;
6380                       operand_types[j].bitfield.disp32s &= !override;
6381                       operand_types[j].bitfield.disp32 = override;
6382                     }
6383                   operand_types[j].bitfield.disp16 = 0;
6384                   break;
6385                 }
6386             }
6387         }
6388
6389       /* Force 0x8b encoding for "mov foo@GOT, %eax".  */
6390       if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
6391         continue;
6392
6393       /* We check register size if needed.  */
6394       if (t->opcode_modifier.checkregsize)
6395         {
6396           check_register = (1 << t->operands) - 1;
6397           if (i.broadcast)
6398             check_register &= ~(1 << i.broadcast->operand);
6399         }
6400       else
6401         check_register = 0;
6402
6403       overlap0 = operand_type_and (i.types[0], operand_types[0]);
6404       switch (t->operands)
6405         {
6406         case 1:
6407           if (!operand_type_match (overlap0, i.types[0]))
6408             continue;
6409           break;
6410         case 2:
6411           /* xchg %eax, %eax is a special case. It is an alias for nop
6412              only in 32bit mode and we can use opcode 0x90.  In 64bit
6413              mode, we can't use 0x90 for xchg %eax, %eax since it should
6414              zero-extend %eax to %rax.  */
6415           if (flag_code == CODE_64BIT
6416               && t->base_opcode == 0x90
6417               && i.types[0].bitfield.instance == Accum
6418               && i.types[0].bitfield.dword
6419               && i.types[1].bitfield.instance == Accum
6420               && i.types[1].bitfield.dword)
6421             continue;
6422           /* xrelease mov %eax, <disp> is another special case. It must not
6423              match the accumulator-only encoding of mov.  */
6424           if (flag_code != CODE_64BIT
6425               && i.hle_prefix
6426               && t->base_opcode == 0xa0
6427               && i.types[0].bitfield.instance == Accum
6428               && (i.flags[1] & Operand_Mem))
6429             continue;
6430           /* Fall through.  */
6431
6432         case 3:
6433           if (!(size_match & MATCH_STRAIGHT))
6434             goto check_reverse;
6435           /* Reverse direction of operands if swapping is possible in the first
6436              place (operands need to be symmetric) and
6437              - the load form is requested, and the template is a store form,
6438              - the store form is requested, and the template is a load form,
6439              - the non-default (swapped) form is requested.  */
6440           overlap1 = operand_type_and (operand_types[0], operand_types[1]);
6441           if (t->opcode_modifier.d && i.reg_operands == i.operands
6442               && !operand_type_all_zero (&overlap1))
6443             switch (i.dir_encoding)
6444               {
6445               case dir_encoding_load:
6446                 if (operand_type_check (operand_types[i.operands - 1], anymem)
6447                     || t->opcode_modifier.regmem)
6448                   goto check_reverse;
6449                 break;
6450
6451               case dir_encoding_store:
6452                 if (!operand_type_check (operand_types[i.operands - 1], anymem)
6453                     && !t->opcode_modifier.regmem)
6454                   goto check_reverse;
6455                 break;
6456
6457               case dir_encoding_swap:
6458                 goto check_reverse;
6459
6460               case dir_encoding_default:
6461                 break;
6462               }
6463           /* If we want store form, we skip the current load.  */
6464           if ((i.dir_encoding == dir_encoding_store
6465                || i.dir_encoding == dir_encoding_swap)
6466               && i.mem_operands == 0
6467               && t->opcode_modifier.load)
6468             continue;
6469           /* Fall through.  */
6470         case 4:
6471         case 5:
6472           overlap1 = operand_type_and (i.types[1], operand_types[1]);
6473           if (!operand_type_match (overlap0, i.types[0])
6474               || !operand_type_match (overlap1, i.types[1])
6475               || ((check_register & 3) == 3
6476                   && !operand_type_register_match (i.types[0],
6477                                                    operand_types[0],
6478                                                    i.types[1],
6479                                                    operand_types[1])))
6480             {
6481               /* Check if other direction is valid ...  */
6482               if (!t->opcode_modifier.d)
6483                 continue;
6484
6485             check_reverse:
6486               if (!(size_match & MATCH_REVERSE))
6487                 continue;
6488               /* Try reversing direction of operands.  */
6489               overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
6490               overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
6491               if (!operand_type_match (overlap0, i.types[0])
6492                   || !operand_type_match (overlap1, i.types[i.operands - 1])
6493                   || (check_register
6494                       && !operand_type_register_match (i.types[0],
6495                                                        operand_types[i.operands - 1],
6496                                                        i.types[i.operands - 1],
6497                                                        operand_types[0])))
6498                 {
6499                   /* Does not match either direction.  */
6500                   continue;
6501                 }
6502               /* found_reverse_match holds which of D or FloatR
6503                  we've found.  */
6504               if (!t->opcode_modifier.d)
6505                 found_reverse_match = 0;
6506               else if (operand_types[0].bitfield.tbyte)
6507                 found_reverse_match = Opcode_FloatD;
6508               else if (operand_types[0].bitfield.xmmword
6509                        || operand_types[i.operands - 1].bitfield.xmmword
6510                        || operand_types[0].bitfield.class == RegMMX
6511                        || operand_types[i.operands - 1].bitfield.class == RegMMX
6512                        || is_any_vex_encoding(t))
6513                 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
6514                                       ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
6515               else
6516                 found_reverse_match = Opcode_D;
6517               if (t->opcode_modifier.floatr)
6518                 found_reverse_match |= Opcode_FloatR;
6519             }
6520           else
6521             {
6522               /* Found a forward 2 operand match here.  */
6523               switch (t->operands)
6524                 {
6525                 case 5:
6526                   overlap4 = operand_type_and (i.types[4],
6527                                                operand_types[4]);
6528                   /* Fall through.  */
6529                 case 4:
6530                   overlap3 = operand_type_and (i.types[3],
6531                                                operand_types[3]);
6532                   /* Fall through.  */
6533                 case 3:
6534                   overlap2 = operand_type_and (i.types[2],
6535                                                operand_types[2]);
6536                   break;
6537                 }
6538
6539               switch (t->operands)
6540                 {
6541                 case 5:
6542                   if (!operand_type_match (overlap4, i.types[4])
6543                       || !operand_type_register_match (i.types[3],
6544                                                        operand_types[3],
6545                                                        i.types[4],
6546                                                        operand_types[4]))
6547                     continue;
6548                   /* Fall through.  */
6549                 case 4:
6550                   if (!operand_type_match (overlap3, i.types[3])
6551                       || ((check_register & 0xa) == 0xa
6552                           && !operand_type_register_match (i.types[1],
6553                                                             operand_types[1],
6554                                                             i.types[3],
6555                                                             operand_types[3]))
6556                       || ((check_register & 0xc) == 0xc
6557                           && !operand_type_register_match (i.types[2],
6558                                                             operand_types[2],
6559                                                             i.types[3],
6560                                                             operand_types[3])))
6561                     continue;
6562                   /* Fall through.  */
6563                 case 3:
6564                   /* Here we make use of the fact that there are no
6565                      reverse match 3 operand instructions.  */
6566                   if (!operand_type_match (overlap2, i.types[2])
6567                       || ((check_register & 5) == 5
6568                           && !operand_type_register_match (i.types[0],
6569                                                             operand_types[0],
6570                                                             i.types[2],
6571                                                             operand_types[2]))
6572                       || ((check_register & 6) == 6
6573                           && !operand_type_register_match (i.types[1],
6574                                                             operand_types[1],
6575                                                             i.types[2],
6576                                                             operand_types[2])))
6577                     continue;
6578                   break;
6579                 }
6580             }
6581           /* Found either forward/reverse 2, 3 or 4 operand match here:
6582              slip through to break.  */
6583         }
6584
6585       /* Check if vector operands are valid.  */
6586       if (check_VecOperands (t))
6587         {
6588           specific_error = i.error;
6589           continue;
6590         }
6591
6592       /* Check if VEX/EVEX encoding requirements can be satisfied.  */
6593       if (VEX_check_encoding (t))
6594         {
6595           specific_error = i.error;
6596           continue;
6597         }
6598
6599       /* We've found a match; break out of loop.  */
6600       break;
6601     }
6602
6603   if (t == current_templates->end)
6604     {
6605       /* We found no match.  */
6606       const char *err_msg;
6607       switch (specific_error ? specific_error : i.error)
6608         {
6609         default:
6610           abort ();
6611         case operand_size_mismatch:
6612           err_msg = _("operand size mismatch");
6613           break;
6614         case operand_type_mismatch:
6615           err_msg = _("operand type mismatch");
6616           break;
6617         case register_type_mismatch:
6618           err_msg = _("register type mismatch");
6619           break;
6620         case number_of_operands_mismatch:
6621           err_msg = _("number of operands mismatch");
6622           break;
6623         case invalid_instruction_suffix:
6624           err_msg = _("invalid instruction suffix");
6625           break;
6626         case bad_imm4:
6627           err_msg = _("constant doesn't fit in 4 bits");
6628           break;
6629         case unsupported_with_intel_mnemonic:
6630           err_msg = _("unsupported with Intel mnemonic");
6631           break;
6632         case unsupported_syntax:
6633           err_msg = _("unsupported syntax");
6634           break;
6635         case unsupported:
6636           as_bad (_("unsupported instruction `%s'"),
6637                   current_templates->start->name);
6638           return NULL;
6639         case invalid_sib_address:
6640           err_msg = _("invalid SIB address");
6641           break;
6642         case invalid_vsib_address:
6643           err_msg = _("invalid VSIB address");
6644           break;
6645         case invalid_vector_register_set:
6646           err_msg = _("mask, index, and destination registers must be distinct");
6647           break;
6648         case invalid_tmm_register_set:
6649           err_msg = _("all tmm registers must be distinct");
6650           break;
6651         case unsupported_vector_index_register:
6652           err_msg = _("unsupported vector index register");
6653           break;
6654         case unsupported_broadcast:
6655           err_msg = _("unsupported broadcast");
6656           break;
6657         case broadcast_needed:
6658           err_msg = _("broadcast is needed for operand of such type");
6659           break;
6660         case unsupported_masking:
6661           err_msg = _("unsupported masking");
6662           break;
6663         case mask_not_on_destination:
6664           err_msg = _("mask not on destination operand");
6665           break;
6666         case no_default_mask:
6667           err_msg = _("default mask isn't allowed");
6668           break;
6669         case unsupported_rc_sae:
6670           err_msg = _("unsupported static rounding/sae");
6671           break;
6672         case rc_sae_operand_not_last_imm:
6673           if (intel_syntax)
6674             err_msg = _("RC/SAE operand must precede immediate operands");
6675           else
6676             err_msg = _("RC/SAE operand must follow immediate operands");
6677           break;
6678         case invalid_register_operand:
6679           err_msg = _("invalid register operand");
6680           break;
6681         }
6682       as_bad (_("%s for `%s'"), err_msg,
6683               current_templates->start->name);
6684       return NULL;
6685     }
6686
6687   if (!quiet_warnings)
6688     {
6689       if (!intel_syntax
6690           && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
6691         as_warn (_("indirect %s without `*'"), t->name);
6692
6693       if (t->opcode_modifier.isprefix
6694           && t->opcode_modifier.mnemonicsize == IGNORESIZE)
6695         {
6696           /* Warn them that a data or address size prefix doesn't
6697              affect assembly of the next line of code.  */
6698           as_warn (_("stand-alone `%s' prefix"), t->name);
6699         }
6700     }
6701
6702   /* Copy the template we found.  */
6703   i.tm = *t;
6704
6705   if (addr_prefix_disp != -1)
6706     i.tm.operand_types[addr_prefix_disp]
6707       = operand_types[addr_prefix_disp];
6708
6709   if (found_reverse_match)
6710     {
6711       /* If we found a reverse match we must alter the opcode direction
6712          bit and clear/flip the regmem modifier one.  found_reverse_match
6713          holds bits to change (different for int & float insns).  */
6714
6715       i.tm.base_opcode ^= found_reverse_match;
6716
6717       i.tm.operand_types[0] = operand_types[i.operands - 1];
6718       i.tm.operand_types[i.operands - 1] = operand_types[0];
6719
6720       /* Certain SIMD insns have their load forms specified in the opcode
6721          table, and hence we need to _set_ RegMem instead of clearing it.
6722          We need to avoid setting the bit though on insns like KMOVW.  */
6723       i.tm.opcode_modifier.regmem
6724         = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6725           && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6726           && !i.tm.opcode_modifier.regmem;
6727     }
6728
6729   return t;
6730 }
6731
6732 static int
6733 check_string (void)
6734 {
6735   unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
6736   unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
6737
6738   if (i.seg[op] != NULL && i.seg[op] != &es)
6739     {
6740       as_bad (_("`%s' operand %u must use `%ses' segment"),
6741               i.tm.name,
6742               intel_syntax ? i.tm.operands - es_op : es_op + 1,
6743               register_prefix);
6744       return 0;
6745     }
6746
6747   /* There's only ever one segment override allowed per instruction.
6748      This instruction possibly has a legal segment override on the
6749      second operand, so copy the segment to where non-string
6750      instructions store it, allowing common code.  */
6751   i.seg[op] = i.seg[1];
6752
6753   return 1;
6754 }
6755
6756 static int
6757 process_suffix (void)
6758 {
6759   bfd_boolean is_crc32 = FALSE;
6760
6761   /* If matched instruction specifies an explicit instruction mnemonic
6762      suffix, use it.  */
6763   if (i.tm.opcode_modifier.size == SIZE16)
6764     i.suffix = WORD_MNEM_SUFFIX;
6765   else if (i.tm.opcode_modifier.size == SIZE32)
6766     i.suffix = LONG_MNEM_SUFFIX;
6767   else if (i.tm.opcode_modifier.size == SIZE64)
6768     i.suffix = QWORD_MNEM_SUFFIX;
6769   else if (i.reg_operands
6770            && (i.operands > 1 || i.types[0].bitfield.class == Reg)
6771            && !i.tm.opcode_modifier.addrprefixopreg)
6772     {
6773       unsigned int numop = i.operands;
6774       /* CRC32 */
6775       is_crc32 = (i.tm.base_opcode == 0xf38f0
6776                   && i.tm.opcode_modifier.opcodeprefix == PREFIX_0XF2);
6777
6778       /* movsx/movzx want only their source operand considered here, for the
6779          ambiguity checking below.  The suffix will be replaced afterwards
6780          to represent the destination (register).  */
6781       if (((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w)
6782           || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
6783         --i.operands;
6784
6785       /* crc32 needs REX.W set regardless of suffix / source operand size.  */
6786       if (is_crc32 && i.tm.operand_types[1].bitfield.qword)
6787         i.rex |= REX_W;
6788
6789       /* If there's no instruction mnemonic suffix we try to invent one
6790          based on GPR operands.  */
6791       if (!i.suffix)
6792         {
6793           /* We take i.suffix from the last register operand specified,
6794              Destination register type is more significant than source
6795              register type.  crc32 in SSE4.2 prefers source register
6796              type. */
6797           unsigned int op = is_crc32 ? 1 : i.operands;
6798
6799           while (op--)
6800             if (i.tm.operand_types[op].bitfield.instance == InstanceNone
6801                 || i.tm.operand_types[op].bitfield.instance == Accum)
6802               {
6803                 if (i.types[op].bitfield.class != Reg)
6804                   continue;
6805                 if (i.types[op].bitfield.byte)
6806                   i.suffix = BYTE_MNEM_SUFFIX;
6807                 else if (i.types[op].bitfield.word)
6808                   i.suffix = WORD_MNEM_SUFFIX;
6809                 else if (i.types[op].bitfield.dword)
6810                   i.suffix = LONG_MNEM_SUFFIX;
6811                 else if (i.types[op].bitfield.qword)
6812                   i.suffix = QWORD_MNEM_SUFFIX;
6813                 else
6814                   continue;
6815                 break;
6816               }
6817
6818           /* As an exception, movsx/movzx silently default to a byte source
6819              in AT&T mode.  */
6820           if ((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w
6821               && !i.suffix && !intel_syntax)
6822             i.suffix = BYTE_MNEM_SUFFIX;
6823         }
6824       else if (i.suffix == BYTE_MNEM_SUFFIX)
6825         {
6826           if (intel_syntax
6827               && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6828               && i.tm.opcode_modifier.no_bsuf)
6829             i.suffix = 0;
6830           else if (!check_byte_reg ())
6831             return 0;
6832         }
6833       else if (i.suffix == LONG_MNEM_SUFFIX)
6834         {
6835           if (intel_syntax
6836               && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6837               && i.tm.opcode_modifier.no_lsuf
6838               && !i.tm.opcode_modifier.todword
6839               && !i.tm.opcode_modifier.toqword)
6840             i.suffix = 0;
6841           else if (!check_long_reg ())
6842             return 0;
6843         }
6844       else if (i.suffix == QWORD_MNEM_SUFFIX)
6845         {
6846           if (intel_syntax
6847               && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6848               && i.tm.opcode_modifier.no_qsuf
6849               && !i.tm.opcode_modifier.todword
6850               && !i.tm.opcode_modifier.toqword)
6851             i.suffix = 0;
6852           else if (!check_qword_reg ())
6853             return 0;
6854         }
6855       else if (i.suffix == WORD_MNEM_SUFFIX)
6856         {
6857           if (intel_syntax
6858               && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6859               && i.tm.opcode_modifier.no_wsuf)
6860             i.suffix = 0;
6861           else if (!check_word_reg ())
6862             return 0;
6863         }
6864       else if (intel_syntax
6865                && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE)
6866         /* Do nothing if the instruction is going to ignore the prefix.  */
6867         ;
6868       else
6869         abort ();
6870
6871       /* Undo the movsx/movzx change done above.  */
6872       i.operands = numop;
6873     }
6874   else if (i.tm.opcode_modifier.mnemonicsize == DEFAULTSIZE
6875            && !i.suffix)
6876     {
6877       i.suffix = stackop_size;
6878       if (stackop_size == LONG_MNEM_SUFFIX)
6879         {
6880           /* stackop_size is set to LONG_MNEM_SUFFIX for the
6881              .code16gcc directive to support 16-bit mode with
6882              32-bit address.  For IRET without a suffix, generate
6883              16-bit IRET (opcode 0xcf) to return from an interrupt
6884              handler.  */
6885           if (i.tm.base_opcode == 0xcf)
6886             {
6887               i.suffix = WORD_MNEM_SUFFIX;
6888               as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6889             }
6890           /* Warn about changed behavior for segment register push/pop.  */
6891           else if ((i.tm.base_opcode | 1) == 0x07)
6892             as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
6893                      i.tm.name);
6894         }
6895     }
6896   else if (!i.suffix
6897            && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
6898                || i.tm.opcode_modifier.jump == JUMP_BYTE
6899                || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
6900                || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6901                    && i.tm.extension_opcode <= 3)))
6902     {
6903       switch (flag_code)
6904         {
6905         case CODE_64BIT:
6906           if (!i.tm.opcode_modifier.no_qsuf)
6907             {
6908               if (i.tm.opcode_modifier.jump == JUMP_BYTE
6909                   || i.tm.opcode_modifier.no_lsuf)
6910                 i.suffix = QWORD_MNEM_SUFFIX;
6911               break;
6912             }
6913           /* Fall through.  */
6914         case CODE_32BIT:
6915           if (!i.tm.opcode_modifier.no_lsuf)
6916             i.suffix = LONG_MNEM_SUFFIX;
6917           break;
6918         case CODE_16BIT:
6919           if (!i.tm.opcode_modifier.no_wsuf)
6920             i.suffix = WORD_MNEM_SUFFIX;
6921           break;
6922         }
6923     }
6924
6925   if (!i.suffix
6926       && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
6927           /* Also cover lret/retf/iret in 64-bit mode.  */
6928           || (flag_code == CODE_64BIT
6929               && !i.tm.opcode_modifier.no_lsuf
6930               && !i.tm.opcode_modifier.no_qsuf))
6931       && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
6932       /* Explicit sizing prefixes are assumed to disambiguate insns.  */
6933       && !i.prefix[DATA_PREFIX] && !(i.prefix[REX_PREFIX] & REX_W)
6934       /* Accept FLDENV et al without suffix.  */
6935       && (i.tm.opcode_modifier.no_ssuf || i.tm.opcode_modifier.floatmf))
6936     {
6937       unsigned int suffixes, evex = 0;
6938
6939       suffixes = !i.tm.opcode_modifier.no_bsuf;
6940       if (!i.tm.opcode_modifier.no_wsuf)
6941         suffixes |= 1 << 1;
6942       if (!i.tm.opcode_modifier.no_lsuf)
6943         suffixes |= 1 << 2;
6944       if (!i.tm.opcode_modifier.no_ldsuf)
6945         suffixes |= 1 << 3;
6946       if (!i.tm.opcode_modifier.no_ssuf)
6947         suffixes |= 1 << 4;
6948       if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6949         suffixes |= 1 << 5;
6950
6951       /* For [XYZ]MMWORD operands inspect operand sizes.  While generally
6952          also suitable for AT&T syntax mode, it was requested that this be
6953          restricted to just Intel syntax.  */
6954       if (intel_syntax && is_any_vex_encoding (&i.tm) && !i.broadcast)
6955         {
6956           unsigned int op;
6957
6958           for (op = 0; op < i.tm.operands; ++op)
6959             {
6960               if (is_evex_encoding (&i.tm)
6961                   && !cpu_arch_flags.bitfield.cpuavx512vl)
6962                 {
6963                   if (i.tm.operand_types[op].bitfield.ymmword)
6964                     i.tm.operand_types[op].bitfield.xmmword = 0;
6965                   if (i.tm.operand_types[op].bitfield.zmmword)
6966                     i.tm.operand_types[op].bitfield.ymmword = 0;
6967                   if (!i.tm.opcode_modifier.evex
6968                       || i.tm.opcode_modifier.evex == EVEXDYN)
6969                     i.tm.opcode_modifier.evex = EVEX512;
6970                 }
6971
6972               if (i.tm.operand_types[op].bitfield.xmmword
6973                   + i.tm.operand_types[op].bitfield.ymmword
6974                   + i.tm.operand_types[op].bitfield.zmmword < 2)
6975                 continue;
6976
6977               /* Any properly sized operand disambiguates the insn.  */
6978               if (i.types[op].bitfield.xmmword
6979                   || i.types[op].bitfield.ymmword
6980                   || i.types[op].bitfield.zmmword)
6981                 {
6982                   suffixes &= ~(7 << 6);
6983                   evex = 0;
6984                   break;
6985                 }
6986
6987               if ((i.flags[op] & Operand_Mem)
6988                   && i.tm.operand_types[op].bitfield.unspecified)
6989                 {
6990                   if (i.tm.operand_types[op].bitfield.xmmword)
6991                     suffixes |= 1 << 6;
6992                   if (i.tm.operand_types[op].bitfield.ymmword)
6993                     suffixes |= 1 << 7;
6994                   if (i.tm.operand_types[op].bitfield.zmmword)
6995                     suffixes |= 1 << 8;
6996                   if (is_evex_encoding (&i.tm))
6997                     evex = EVEX512;
6998                 }
6999             }
7000         }
7001
7002       /* Are multiple suffixes / operand sizes allowed?  */
7003       if (suffixes & (suffixes - 1))
7004         {
7005           if (intel_syntax
7006               && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
7007                   || operand_check == check_error))
7008             {
7009               as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
7010               return 0;
7011             }
7012           if (operand_check == check_error)
7013             {
7014               as_bad (_("no instruction mnemonic suffix given and "
7015                         "no register operands; can't size `%s'"), i.tm.name);
7016               return 0;
7017             }
7018           if (operand_check == check_warning)
7019             as_warn (_("%s; using default for `%s'"),
7020                        intel_syntax
7021                        ? _("ambiguous operand size")
7022                        : _("no instruction mnemonic suffix given and "
7023                            "no register operands"),
7024                        i.tm.name);
7025
7026           if (i.tm.opcode_modifier.floatmf)
7027             i.suffix = SHORT_MNEM_SUFFIX;
7028           else if ((i.tm.base_opcode | 8) == 0xfbe
7029                    || (i.tm.base_opcode == 0x63
7030                        && i.tm.cpu_flags.bitfield.cpu64))
7031             /* handled below */;
7032           else if (evex)
7033             i.tm.opcode_modifier.evex = evex;
7034           else if (flag_code == CODE_16BIT)
7035             i.suffix = WORD_MNEM_SUFFIX;
7036           else if (!i.tm.opcode_modifier.no_lsuf)
7037             i.suffix = LONG_MNEM_SUFFIX;
7038           else
7039             i.suffix = QWORD_MNEM_SUFFIX;
7040         }
7041     }
7042
7043   if ((i.tm.base_opcode | 8) == 0xfbe
7044       || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
7045     {
7046       /* In Intel syntax, movsx/movzx must have a "suffix" (checked above).
7047          In AT&T syntax, if there is no suffix (warned about above), the default
7048          will be byte extension.  */
7049       if (i.tm.opcode_modifier.w && i.suffix && i.suffix != BYTE_MNEM_SUFFIX)
7050         i.tm.base_opcode |= 1;
7051
7052       /* For further processing, the suffix should represent the destination
7053          (register).  This is already the case when one was used with
7054          mov[sz][bw]*, but we need to replace it for mov[sz]x, or if there was
7055          no suffix to begin with.  */
7056       if (i.tm.opcode_modifier.w || i.tm.base_opcode == 0x63 || !i.suffix)
7057         {
7058           if (i.types[1].bitfield.word)
7059             i.suffix = WORD_MNEM_SUFFIX;
7060           else if (i.types[1].bitfield.qword)
7061             i.suffix = QWORD_MNEM_SUFFIX;
7062           else
7063             i.suffix = LONG_MNEM_SUFFIX;
7064
7065           i.tm.opcode_modifier.w = 0;
7066         }
7067     }
7068
7069   if (!i.tm.opcode_modifier.modrm && i.reg_operands && i.tm.operands < 3)
7070     i.short_form = (i.tm.operand_types[0].bitfield.class == Reg)
7071                    != (i.tm.operand_types[1].bitfield.class == Reg);
7072
7073   /* Change the opcode based on the operand size given by i.suffix.  */
7074   switch (i.suffix)
7075     {
7076     /* Size floating point instruction.  */
7077     case LONG_MNEM_SUFFIX:
7078       if (i.tm.opcode_modifier.floatmf)
7079         {
7080           i.tm.base_opcode ^= 4;
7081           break;
7082         }
7083     /* fall through */
7084     case WORD_MNEM_SUFFIX:
7085     case QWORD_MNEM_SUFFIX:
7086       /* It's not a byte, select word/dword operation.  */
7087       if (i.tm.opcode_modifier.w)
7088         {
7089           if (i.short_form)
7090             i.tm.base_opcode |= 8;
7091           else
7092             i.tm.base_opcode |= 1;
7093         }
7094     /* fall through */
7095     case SHORT_MNEM_SUFFIX:
7096       /* Now select between word & dword operations via the operand
7097          size prefix, except for instructions that will ignore this
7098          prefix anyway.  */
7099       if (i.suffix != QWORD_MNEM_SUFFIX
7100           && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
7101           && !i.tm.opcode_modifier.floatmf
7102           && !is_any_vex_encoding (&i.tm)
7103           && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
7104               || (flag_code == CODE_64BIT
7105                   && i.tm.opcode_modifier.jump == JUMP_BYTE)))
7106         {
7107           unsigned int prefix = DATA_PREFIX_OPCODE;
7108
7109           if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
7110             prefix = ADDR_PREFIX_OPCODE;
7111
7112           if (!add_prefix (prefix))
7113             return 0;
7114         }
7115
7116       /* Set mode64 for an operand.  */
7117       if (i.suffix == QWORD_MNEM_SUFFIX
7118           && flag_code == CODE_64BIT
7119           && !i.tm.opcode_modifier.norex64
7120           && !i.tm.opcode_modifier.vexw
7121           /* Special case for xchg %rax,%rax.  It is NOP and doesn't
7122              need rex64. */
7123           && ! (i.operands == 2
7124                 && i.tm.base_opcode == 0x90
7125                 && i.tm.extension_opcode == None
7126                 && i.types[0].bitfield.instance == Accum
7127                 && i.types[0].bitfield.qword
7128                 && i.types[1].bitfield.instance == Accum
7129                 && i.types[1].bitfield.qword))
7130         i.rex |= REX_W;
7131
7132       break;
7133
7134     case 0:
7135       /* Select word/dword/qword operation with explicit data sizing prefix
7136          when there are no suitable register operands.  */
7137       if (i.tm.opcode_modifier.w
7138           && (i.prefix[DATA_PREFIX] || (i.prefix[REX_PREFIX] & REX_W))
7139           && (!i.reg_operands
7140               || (i.reg_operands == 1
7141                       /* ShiftCount */
7142                   && (i.tm.operand_types[0].bitfield.instance == RegC
7143                       /* InOutPortReg */
7144                       || i.tm.operand_types[0].bitfield.instance == RegD
7145                       || i.tm.operand_types[1].bitfield.instance == RegD
7146                       /* CRC32 */
7147                       || is_crc32))))
7148         i.tm.base_opcode |= 1;
7149       break;
7150     }
7151
7152   if (i.tm.opcode_modifier.addrprefixopreg)
7153     {
7154       gas_assert (!i.suffix);
7155       gas_assert (i.reg_operands);
7156
7157       if (i.tm.operand_types[0].bitfield.instance == Accum
7158           || i.operands == 1)
7159         {
7160           /* The address size override prefix changes the size of the
7161              first operand.  */
7162           if (flag_code == CODE_64BIT
7163               && i.op[0].regs->reg_type.bitfield.word)
7164             {
7165               as_bad (_("16-bit addressing unavailable for `%s'"),
7166                       i.tm.name);
7167               return 0;
7168             }
7169
7170           if ((flag_code == CODE_32BIT
7171                ? i.op[0].regs->reg_type.bitfield.word
7172                : i.op[0].regs->reg_type.bitfield.dword)
7173               && !add_prefix (ADDR_PREFIX_OPCODE))
7174             return 0;
7175         }
7176       else
7177         {
7178           /* Check invalid register operand when the address size override
7179              prefix changes the size of register operands.  */
7180           unsigned int op;
7181           enum { need_word, need_dword, need_qword } need;
7182
7183           /* Check the register operand for the address size prefix if
7184              the memory operand has no real registers, like symbol, DISP
7185              or symbol(%rip).  */
7186           if (i.mem_operands == 1
7187               && i.reg_operands == 1
7188               && i.operands == 2
7189               && i.types[1].bitfield.class == Reg
7190               && (flag_code == CODE_32BIT
7191                   ? i.op[1].regs->reg_type.bitfield.word
7192                   : i.op[1].regs->reg_type.bitfield.dword)
7193               && ((i.base_reg == NULL && i.index_reg == NULL)
7194                   || (i.base_reg
7195                       && i.base_reg->reg_num == RegIP
7196                       && i.base_reg->reg_type.bitfield.qword))
7197               && !add_prefix (ADDR_PREFIX_OPCODE))
7198             return 0;
7199
7200           if (flag_code == CODE_32BIT)
7201             need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
7202           else if (i.prefix[ADDR_PREFIX])
7203             need = need_dword;
7204           else
7205             need = flag_code == CODE_64BIT ? need_qword : need_word;
7206
7207           for (op = 0; op < i.operands; op++)
7208             {
7209               if (i.types[op].bitfield.class != Reg)
7210                 continue;
7211
7212               switch (need)
7213                 {
7214                 case need_word:
7215                   if (i.op[op].regs->reg_type.bitfield.word)
7216                     continue;
7217                   break;
7218                 case need_dword:
7219                   if (i.op[op].regs->reg_type.bitfield.dword)
7220                     continue;
7221                   break;
7222                 case need_qword:
7223                   if (i.op[op].regs->reg_type.bitfield.qword)
7224                     continue;
7225                   break;
7226                 }
7227
7228               as_bad (_("invalid register operand size for `%s'"),
7229                       i.tm.name);
7230               return 0;
7231             }
7232         }
7233     }
7234
7235   return 1;
7236 }
7237
7238 static int
7239 check_byte_reg (void)
7240 {
7241   int op;
7242
7243   for (op = i.operands; --op >= 0;)
7244     {
7245       /* Skip non-register operands. */
7246       if (i.types[op].bitfield.class != Reg)
7247         continue;
7248
7249       /* If this is an eight bit register, it's OK.  If it's the 16 or
7250          32 bit version of an eight bit register, we will just use the
7251          low portion, and that's OK too.  */
7252       if (i.types[op].bitfield.byte)
7253         continue;
7254
7255       /* I/O port address operands are OK too.  */
7256       if (i.tm.operand_types[op].bitfield.instance == RegD
7257           && i.tm.operand_types[op].bitfield.word)
7258         continue;
7259
7260       /* crc32 only wants its source operand checked here.  */
7261       if (i.tm.base_opcode == 0xf38f0
7262           && i.tm.opcode_modifier.opcodeprefix == PREFIX_0XF2
7263           && op != 0)
7264         continue;
7265
7266       /* Any other register is bad.  */
7267       as_bad (_("`%s%s' not allowed with `%s%c'"),
7268               register_prefix, i.op[op].regs->reg_name,
7269               i.tm.name, i.suffix);
7270       return 0;
7271     }
7272   return 1;
7273 }
7274
7275 static int
7276 check_long_reg (void)
7277 {
7278   int op;
7279
7280   for (op = i.operands; --op >= 0;)
7281     /* Skip non-register operands. */
7282     if (i.types[op].bitfield.class != Reg)
7283       continue;
7284     /* Reject eight bit registers, except where the template requires
7285        them. (eg. movzb)  */
7286     else if (i.types[op].bitfield.byte
7287              && (i.tm.operand_types[op].bitfield.class == Reg
7288                  || i.tm.operand_types[op].bitfield.instance == Accum)
7289              && (i.tm.operand_types[op].bitfield.word
7290                  || i.tm.operand_types[op].bitfield.dword))
7291       {
7292         as_bad (_("`%s%s' not allowed with `%s%c'"),
7293                 register_prefix,
7294                 i.op[op].regs->reg_name,
7295                 i.tm.name,
7296                 i.suffix);
7297         return 0;
7298       }
7299     /* Error if the e prefix on a general reg is missing.  */
7300     else if (i.types[op].bitfield.word
7301              && (i.tm.operand_types[op].bitfield.class == Reg
7302                  || i.tm.operand_types[op].bitfield.instance == Accum)
7303              && i.tm.operand_types[op].bitfield.dword)
7304       {
7305         as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7306                 register_prefix, i.op[op].regs->reg_name,
7307                 i.suffix);
7308         return 0;
7309       }
7310     /* Warn if the r prefix on a general reg is present.  */
7311     else if (i.types[op].bitfield.qword
7312              && (i.tm.operand_types[op].bitfield.class == Reg
7313                  || i.tm.operand_types[op].bitfield.instance == Accum)
7314              && i.tm.operand_types[op].bitfield.dword)
7315       {
7316         if (intel_syntax
7317             && i.tm.opcode_modifier.toqword
7318             && i.types[0].bitfield.class != RegSIMD)
7319           {
7320             /* Convert to QWORD.  We want REX byte. */
7321             i.suffix = QWORD_MNEM_SUFFIX;
7322           }
7323         else
7324           {
7325             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7326                     register_prefix, i.op[op].regs->reg_name,
7327                     i.suffix);
7328             return 0;
7329           }
7330       }
7331   return 1;
7332 }
7333
7334 static int
7335 check_qword_reg (void)
7336 {
7337   int op;
7338
7339   for (op = i.operands; --op >= 0; )
7340     /* Skip non-register operands. */
7341     if (i.types[op].bitfield.class != Reg)
7342       continue;
7343     /* Reject eight bit registers, except where the template requires
7344        them. (eg. movzb)  */
7345     else if (i.types[op].bitfield.byte
7346              && (i.tm.operand_types[op].bitfield.class == Reg
7347                  || i.tm.operand_types[op].bitfield.instance == Accum)
7348              && (i.tm.operand_types[op].bitfield.word
7349                  || i.tm.operand_types[op].bitfield.dword))
7350       {
7351         as_bad (_("`%s%s' not allowed with `%s%c'"),
7352                 register_prefix,
7353                 i.op[op].regs->reg_name,
7354                 i.tm.name,
7355                 i.suffix);
7356         return 0;
7357       }
7358     /* Warn if the r prefix on a general reg is missing.  */
7359     else if ((i.types[op].bitfield.word
7360               || i.types[op].bitfield.dword)
7361              && (i.tm.operand_types[op].bitfield.class == Reg
7362                  || i.tm.operand_types[op].bitfield.instance == Accum)
7363              && i.tm.operand_types[op].bitfield.qword)
7364       {
7365         /* Prohibit these changes in the 64bit mode, since the
7366            lowering is more complicated.  */
7367         if (intel_syntax
7368             && i.tm.opcode_modifier.todword
7369             && i.types[0].bitfield.class != RegSIMD)
7370           {
7371             /* Convert to DWORD.  We don't want REX byte. */
7372             i.suffix = LONG_MNEM_SUFFIX;
7373           }
7374         else
7375           {
7376             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7377                     register_prefix, i.op[op].regs->reg_name,
7378                     i.suffix);
7379             return 0;
7380           }
7381       }
7382   return 1;
7383 }
7384
7385 static int
7386 check_word_reg (void)
7387 {
7388   int op;
7389   for (op = i.operands; --op >= 0;)
7390     /* Skip non-register operands. */
7391     if (i.types[op].bitfield.class != Reg)
7392       continue;
7393     /* Reject eight bit registers, except where the template requires
7394        them. (eg. movzb)  */
7395     else if (i.types[op].bitfield.byte
7396              && (i.tm.operand_types[op].bitfield.class == Reg
7397                  || i.tm.operand_types[op].bitfield.instance == Accum)
7398              && (i.tm.operand_types[op].bitfield.word
7399                  || i.tm.operand_types[op].bitfield.dword))
7400       {
7401         as_bad (_("`%s%s' not allowed with `%s%c'"),
7402                 register_prefix,
7403                 i.op[op].regs->reg_name,
7404                 i.tm.name,
7405                 i.suffix);
7406         return 0;
7407       }
7408     /* Error if the e or r prefix on a general reg is present.  */
7409     else if ((i.types[op].bitfield.dword
7410                  || i.types[op].bitfield.qword)
7411              && (i.tm.operand_types[op].bitfield.class == Reg
7412                  || i.tm.operand_types[op].bitfield.instance == Accum)
7413              && i.tm.operand_types[op].bitfield.word)
7414       {
7415         as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7416                 register_prefix, i.op[op].regs->reg_name,
7417                 i.suffix);
7418         return 0;
7419       }
7420   return 1;
7421 }
7422
7423 static int
7424 update_imm (unsigned int j)
7425 {
7426   i386_operand_type overlap = i.types[j];
7427   if ((overlap.bitfield.imm8
7428        || overlap.bitfield.imm8s
7429        || overlap.bitfield.imm16
7430        || overlap.bitfield.imm32
7431        || overlap.bitfield.imm32s
7432        || overlap.bitfield.imm64)
7433       && !operand_type_equal (&overlap, &imm8)
7434       && !operand_type_equal (&overlap, &imm8s)
7435       && !operand_type_equal (&overlap, &imm16)
7436       && !operand_type_equal (&overlap, &imm32)
7437       && !operand_type_equal (&overlap, &imm32s)
7438       && !operand_type_equal (&overlap, &imm64))
7439     {
7440       if (i.suffix)
7441         {
7442           i386_operand_type temp;
7443
7444           operand_type_set (&temp, 0);
7445           if (i.suffix == BYTE_MNEM_SUFFIX)
7446             {
7447               temp.bitfield.imm8 = overlap.bitfield.imm8;
7448               temp.bitfield.imm8s = overlap.bitfield.imm8s;
7449             }
7450           else if (i.suffix == WORD_MNEM_SUFFIX)
7451             temp.bitfield.imm16 = overlap.bitfield.imm16;
7452           else if (i.suffix == QWORD_MNEM_SUFFIX)
7453             {
7454               temp.bitfield.imm64 = overlap.bitfield.imm64;
7455               temp.bitfield.imm32s = overlap.bitfield.imm32s;
7456             }
7457           else
7458             temp.bitfield.imm32 = overlap.bitfield.imm32;
7459           overlap = temp;
7460         }
7461       else if (operand_type_equal (&overlap, &imm16_32_32s)
7462                || operand_type_equal (&overlap, &imm16_32)
7463                || operand_type_equal (&overlap, &imm16_32s))
7464         {
7465           if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
7466             overlap = imm16;
7467           else
7468             overlap = imm32s;
7469         }
7470       else if (i.prefix[REX_PREFIX] & REX_W)
7471         overlap = operand_type_and (overlap, imm32s);
7472       else if (i.prefix[DATA_PREFIX])
7473         overlap = operand_type_and (overlap,
7474                                     flag_code != CODE_16BIT ? imm16 : imm32);
7475       if (!operand_type_equal (&overlap, &imm8)
7476           && !operand_type_equal (&overlap, &imm8s)
7477           && !operand_type_equal (&overlap, &imm16)
7478           && !operand_type_equal (&overlap, &imm32)
7479           && !operand_type_equal (&overlap, &imm32s)
7480           && !operand_type_equal (&overlap, &imm64))
7481         {
7482           as_bad (_("no instruction mnemonic suffix given; "
7483                     "can't determine immediate size"));
7484           return 0;
7485         }
7486     }
7487   i.types[j] = overlap;
7488
7489   return 1;
7490 }
7491
7492 static int
7493 finalize_imm (void)
7494 {
7495   unsigned int j, n;
7496
7497   /* Update the first 2 immediate operands.  */
7498   n = i.operands > 2 ? 2 : i.operands;
7499   if (n)
7500     {
7501       for (j = 0; j < n; j++)
7502         if (update_imm (j) == 0)
7503           return 0;
7504
7505       /* The 3rd operand can't be immediate operand.  */
7506       gas_assert (operand_type_check (i.types[2], imm) == 0);
7507     }
7508
7509   return 1;
7510 }
7511
7512 static int
7513 process_operands (void)
7514 {
7515   /* Default segment register this instruction will use for memory
7516      accesses.  0 means unknown.  This is only for optimizing out
7517      unnecessary segment overrides.  */
7518   const seg_entry *default_seg = 0;
7519
7520   if (i.tm.opcode_modifier.sse2avx)
7521     {
7522       /* Legacy encoded insns allow explicit REX prefixes, so these prefixes
7523          need converting.  */
7524       i.rex |= i.prefix[REX_PREFIX] & (REX_W | REX_R | REX_X | REX_B);
7525       i.prefix[REX_PREFIX] = 0;
7526       i.rex_encoding = 0;
7527     }
7528   /* ImmExt should be processed after SSE2AVX.  */
7529   else if (i.tm.opcode_modifier.immext)
7530     process_immext ();
7531
7532   if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
7533     {
7534       unsigned int dupl = i.operands;
7535       unsigned int dest = dupl - 1;
7536       unsigned int j;
7537
7538       /* The destination must be an xmm register.  */
7539       gas_assert (i.reg_operands
7540                   && MAX_OPERANDS > dupl
7541                   && operand_type_equal (&i.types[dest], &regxmm));
7542
7543       if (i.tm.operand_types[0].bitfield.instance == Accum
7544           && i.tm.operand_types[0].bitfield.xmmword)
7545         {
7546           if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
7547             {
7548               /* Keep xmm0 for instructions with VEX prefix and 3
7549                  sources.  */
7550               i.tm.operand_types[0].bitfield.instance = InstanceNone;
7551               i.tm.operand_types[0].bitfield.class = RegSIMD;
7552               goto duplicate;
7553             }
7554           else
7555             {
7556               /* We remove the first xmm0 and keep the number of
7557                  operands unchanged, which in fact duplicates the
7558                  destination.  */
7559               for (j = 1; j < i.operands; j++)
7560                 {
7561                   i.op[j - 1] = i.op[j];
7562                   i.types[j - 1] = i.types[j];
7563                   i.tm.operand_types[j - 1] = i.tm.operand_types[j];
7564                   i.flags[j - 1] = i.flags[j];
7565                 }
7566             }
7567         }
7568       else if (i.tm.opcode_modifier.implicit1stxmm0)
7569         {
7570           gas_assert ((MAX_OPERANDS - 1) > dupl
7571                       && (i.tm.opcode_modifier.vexsources
7572                           == VEX3SOURCES));
7573
7574           /* Add the implicit xmm0 for instructions with VEX prefix
7575              and 3 sources.  */
7576           for (j = i.operands; j > 0; j--)
7577             {
7578               i.op[j] = i.op[j - 1];
7579               i.types[j] = i.types[j - 1];
7580               i.tm.operand_types[j] = i.tm.operand_types[j - 1];
7581               i.flags[j] = i.flags[j - 1];
7582             }
7583           i.op[0].regs
7584             = (const reg_entry *) str_hash_find (reg_hash, "xmm0");
7585           i.types[0] = regxmm;
7586           i.tm.operand_types[0] = regxmm;
7587
7588           i.operands += 2;
7589           i.reg_operands += 2;
7590           i.tm.operands += 2;
7591
7592           dupl++;
7593           dest++;
7594           i.op[dupl] = i.op[dest];
7595           i.types[dupl] = i.types[dest];
7596           i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7597           i.flags[dupl] = i.flags[dest];
7598         }
7599       else
7600         {
7601         duplicate:
7602           i.operands++;
7603           i.reg_operands++;
7604           i.tm.operands++;
7605
7606           i.op[dupl] = i.op[dest];
7607           i.types[dupl] = i.types[dest];
7608           i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7609           i.flags[dupl] = i.flags[dest];
7610         }
7611
7612        if (i.tm.opcode_modifier.immext)
7613          process_immext ();
7614     }
7615   else if (i.tm.operand_types[0].bitfield.instance == Accum
7616            && i.tm.operand_types[0].bitfield.xmmword)
7617     {
7618       unsigned int j;
7619
7620       for (j = 1; j < i.operands; j++)
7621         {
7622           i.op[j - 1] = i.op[j];
7623           i.types[j - 1] = i.types[j];
7624
7625           /* We need to adjust fields in i.tm since they are used by
7626              build_modrm_byte.  */
7627           i.tm.operand_types [j - 1] = i.tm.operand_types [j];
7628
7629           i.flags[j - 1] = i.flags[j];
7630         }
7631
7632       i.operands--;
7633       i.reg_operands--;
7634       i.tm.operands--;
7635     }
7636   else if (i.tm.opcode_modifier.implicitquadgroup)
7637     {
7638       unsigned int regnum, first_reg_in_group, last_reg_in_group;
7639
7640       /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
7641       gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
7642       regnum = register_number (i.op[1].regs);
7643       first_reg_in_group = regnum & ~3;
7644       last_reg_in_group = first_reg_in_group + 3;
7645       if (regnum != first_reg_in_group)
7646         as_warn (_("source register `%s%s' implicitly denotes"
7647                    " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
7648                  register_prefix, i.op[1].regs->reg_name,
7649                  register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
7650                  register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
7651                  i.tm.name);
7652     }
7653   else if (i.tm.opcode_modifier.regkludge)
7654     {
7655       /* The imul $imm, %reg instruction is converted into
7656          imul $imm, %reg, %reg, and the clr %reg instruction
7657          is converted into xor %reg, %reg.  */
7658
7659       unsigned int first_reg_op;
7660
7661       if (operand_type_check (i.types[0], reg))
7662         first_reg_op = 0;
7663       else
7664         first_reg_op = 1;
7665       /* Pretend we saw the extra register operand.  */
7666       gas_assert (i.reg_operands == 1
7667                   && i.op[first_reg_op + 1].regs == 0);
7668       i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7669       i.types[first_reg_op + 1] = i.types[first_reg_op];
7670       i.operands++;
7671       i.reg_operands++;
7672     }
7673
7674   if (i.tm.opcode_modifier.modrm)
7675     {
7676       /* The opcode is completed (modulo i.tm.extension_opcode which
7677          must be put into the modrm byte).  Now, we make the modrm and
7678          index base bytes based on all the info we've collected.  */
7679
7680       default_seg = build_modrm_byte ();
7681     }
7682   else if (i.types[0].bitfield.class == SReg)
7683     {
7684       if (flag_code != CODE_64BIT
7685           ? i.tm.base_opcode == POP_SEG_SHORT
7686             && i.op[0].regs->reg_num == 1
7687           : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
7688             && i.op[0].regs->reg_num < 4)
7689         {
7690           as_bad (_("you can't `%s %s%s'"),
7691                   i.tm.name, register_prefix, i.op[0].regs->reg_name);
7692           return 0;
7693         }
7694       if ( i.op[0].regs->reg_num > 3 && i.tm.opcode_length == 1 )
7695         {
7696           i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
7697           i.tm.opcode_length = 2;
7698         }
7699       i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
7700     }
7701   else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
7702     {
7703       default_seg = &ds;
7704     }
7705   else if (i.tm.opcode_modifier.isstring)
7706     {
7707       /* For the string instructions that allow a segment override
7708          on one of their operands, the default segment is ds.  */
7709       default_seg = &ds;
7710     }
7711   else if (i.short_form)
7712     {
7713       /* The register or float register operand is in operand
7714          0 or 1.  */
7715       unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
7716
7717       /* Register goes in low 3 bits of opcode.  */
7718       i.tm.base_opcode |= i.op[op].regs->reg_num;
7719       if ((i.op[op].regs->reg_flags & RegRex) != 0)
7720         i.rex |= REX_B;
7721       if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7722         {
7723           /* Warn about some common errors, but press on regardless.
7724              The first case can be generated by gcc (<= 2.8.1).  */
7725           if (i.operands == 2)
7726             {
7727               /* Reversed arguments on faddp, fsubp, etc.  */
7728               as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7729                        register_prefix, i.op[!intel_syntax].regs->reg_name,
7730                        register_prefix, i.op[intel_syntax].regs->reg_name);
7731             }
7732           else
7733             {
7734               /* Extraneous `l' suffix on fp insn.  */
7735               as_warn (_("translating to `%s %s%s'"), i.tm.name,
7736                        register_prefix, i.op[0].regs->reg_name);
7737             }
7738         }
7739     }
7740
7741   if ((i.seg[0] || i.prefix[SEG_PREFIX])
7742       && i.tm.base_opcode == 0x8d /* lea */
7743       && !is_any_vex_encoding(&i.tm))
7744     {
7745       if (!quiet_warnings)
7746         as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7747       if (optimize)
7748         {
7749           i.seg[0] = NULL;
7750           i.prefix[SEG_PREFIX] = 0;
7751         }
7752     }
7753
7754   /* If a segment was explicitly specified, and the specified segment
7755      is neither the default nor the one already recorded from a prefix,
7756      use an opcode prefix to select it.  If we never figured out what
7757      the default segment is, then default_seg will be zero at this
7758      point, and the specified segment prefix will always be used.  */
7759   if (i.seg[0]
7760       && i.seg[0] != default_seg
7761       && i.seg[0]->seg_prefix != i.prefix[SEG_PREFIX])
7762     {
7763       if (!add_prefix (i.seg[0]->seg_prefix))
7764         return 0;
7765     }
7766   return 1;
7767 }
7768
7769 static INLINE void set_rex_vrex (const reg_entry *r, unsigned int rex_bit,
7770                                  bfd_boolean do_sse2avx)
7771 {
7772   if (r->reg_flags & RegRex)
7773     {
7774       if (i.rex & rex_bit)
7775         as_bad (_("same type of prefix used twice"));
7776       i.rex |= rex_bit;
7777     }
7778   else if (do_sse2avx && (i.rex & rex_bit) && i.vex.register_specifier)
7779     {
7780       gas_assert (i.vex.register_specifier == r);
7781       i.vex.register_specifier += 8;
7782     }
7783
7784   if (r->reg_flags & RegVRex)
7785     i.vrex |= rex_bit;
7786 }
7787
7788 static const seg_entry *
7789 build_modrm_byte (void)
7790 {
7791   const seg_entry *default_seg = 0;
7792   unsigned int source, dest;
7793   int vex_3_sources;
7794
7795   vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
7796   if (vex_3_sources)
7797     {
7798       unsigned int nds, reg_slot;
7799       expressionS *exp;
7800
7801       dest = i.operands - 1;
7802       nds = dest - 1;
7803
7804       /* There are 2 kinds of instructions:
7805          1. 5 operands: 4 register operands or 3 register operands
7806          plus 1 memory operand plus one Imm4 operand, VexXDS, and
7807          VexW0 or VexW1.  The destination must be either XMM, YMM or
7808          ZMM register.
7809          2. 4 operands: 4 register operands or 3 register operands
7810          plus 1 memory operand, with VexXDS.  */
7811       gas_assert ((i.reg_operands == 4
7812                    || (i.reg_operands == 3 && i.mem_operands == 1))
7813                   && i.tm.opcode_modifier.vexvvvv == VEXXDS
7814                   && i.tm.opcode_modifier.vexw
7815                   && i.tm.operand_types[dest].bitfield.class == RegSIMD);
7816
7817       /* If VexW1 is set, the first non-immediate operand is the source and
7818          the second non-immediate one is encoded in the immediate operand.  */
7819       if (i.tm.opcode_modifier.vexw == VEXW1)
7820         {
7821           source = i.imm_operands;
7822           reg_slot = i.imm_operands + 1;
7823         }
7824       else
7825         {
7826           source = i.imm_operands + 1;
7827           reg_slot = i.imm_operands;
7828         }
7829
7830       if (i.imm_operands == 0)
7831         {
7832           /* When there is no immediate operand, generate an 8bit
7833              immediate operand to encode the first operand.  */
7834           exp = &im_expressions[i.imm_operands++];
7835           i.op[i.operands].imms = exp;
7836           i.types[i.operands] = imm8;
7837           i.operands++;
7838
7839           gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7840           exp->X_op = O_constant;
7841           exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
7842           gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7843         }
7844       else
7845         {
7846           gas_assert (i.imm_operands == 1);
7847           gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7848           gas_assert (!i.tm.opcode_modifier.immext);
7849
7850           /* Turn on Imm8 again so that output_imm will generate it.  */
7851           i.types[0].bitfield.imm8 = 1;
7852
7853           gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7854           i.op[0].imms->X_add_number
7855               |= register_number (i.op[reg_slot].regs) << 4;
7856           gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7857         }
7858
7859       gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
7860       i.vex.register_specifier = i.op[nds].regs;
7861     }
7862   else
7863     source = dest = 0;
7864
7865   /* i.reg_operands MUST be the number of real register operands;
7866      implicit registers do not count.  If there are 3 register
7867      operands, it must be a instruction with VexNDS.  For a
7868      instruction with VexNDD, the destination register is encoded
7869      in VEX prefix.  If there are 4 register operands, it must be
7870      a instruction with VEX prefix and 3 sources.  */
7871   if (i.mem_operands == 0
7872       && ((i.reg_operands == 2
7873            && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7874           || (i.reg_operands == 3
7875               && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7876           || (i.reg_operands == 4 && vex_3_sources)))
7877     {
7878       switch (i.operands)
7879         {
7880         case 2:
7881           source = 0;
7882           break;
7883         case 3:
7884           /* When there are 3 operands, one of them may be immediate,
7885              which may be the first or the last operand.  Otherwise,
7886              the first operand must be shift count register (cl) or it
7887              is an instruction with VexNDS. */
7888           gas_assert (i.imm_operands == 1
7889                       || (i.imm_operands == 0
7890                           && (i.tm.opcode_modifier.vexvvvv == VEXXDS
7891                               || (i.types[0].bitfield.instance == RegC
7892                                   && i.types[0].bitfield.byte))));
7893           if (operand_type_check (i.types[0], imm)
7894               || (i.types[0].bitfield.instance == RegC
7895                   && i.types[0].bitfield.byte))
7896             source = 1;
7897           else
7898             source = 0;
7899           break;
7900         case 4:
7901           /* When there are 4 operands, the first two must be 8bit
7902              immediate operands. The source operand will be the 3rd
7903              one.
7904
7905              For instructions with VexNDS, if the first operand
7906              an imm8, the source operand is the 2nd one.  If the last
7907              operand is imm8, the source operand is the first one.  */
7908           gas_assert ((i.imm_operands == 2
7909                        && i.types[0].bitfield.imm8
7910                        && i.types[1].bitfield.imm8)
7911                       || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7912                           && i.imm_operands == 1
7913                           && (i.types[0].bitfield.imm8
7914                               || i.types[i.operands - 1].bitfield.imm8
7915                               || i.rounding)));
7916           if (i.imm_operands == 2)
7917             source = 2;
7918           else
7919             {
7920               if (i.types[0].bitfield.imm8)
7921                 source = 1;
7922               else
7923                 source = 0;
7924             }
7925           break;
7926         case 5:
7927           if (is_evex_encoding (&i.tm))
7928             {
7929               /* For EVEX instructions, when there are 5 operands, the
7930                  first one must be immediate operand.  If the second one
7931                  is immediate operand, the source operand is the 3th
7932                  one.  If the last one is immediate operand, the source
7933                  operand is the 2nd one.  */
7934               gas_assert (i.imm_operands == 2
7935                           && i.tm.opcode_modifier.sae
7936                           && operand_type_check (i.types[0], imm));
7937               if (operand_type_check (i.types[1], imm))
7938                 source = 2;
7939               else if (operand_type_check (i.types[4], imm))
7940                 source = 1;
7941               else
7942                 abort ();
7943             }
7944           break;
7945         default:
7946           abort ();
7947         }
7948
7949       if (!vex_3_sources)
7950         {
7951           dest = source + 1;
7952
7953           /* RC/SAE operand could be between DEST and SRC.  That happens
7954              when one operand is GPR and the other one is XMM/YMM/ZMM
7955              register.  */
7956           if (i.rounding && i.rounding->operand == (int) dest)
7957             dest++;
7958
7959           if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7960             {
7961               /* For instructions with VexNDS, the register-only source
7962                  operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7963                  register.  It is encoded in VEX prefix.  */
7964
7965               i386_operand_type op;
7966               unsigned int vvvv;
7967
7968               /* Swap two source operands if needed.  */
7969               if (i.tm.opcode_modifier.swapsources)
7970                 {
7971                   vvvv = source;
7972                   source = dest;
7973                 }
7974               else
7975                 vvvv = dest;
7976
7977               op = i.tm.operand_types[vvvv];
7978               if ((dest + 1) >= i.operands
7979                   || ((op.bitfield.class != Reg
7980                        || (!op.bitfield.dword && !op.bitfield.qword))
7981                       && op.bitfield.class != RegSIMD
7982                       && !operand_type_equal (&op, &regmask)))
7983                 abort ();
7984               i.vex.register_specifier = i.op[vvvv].regs;
7985               dest++;
7986             }
7987         }
7988
7989       i.rm.mode = 3;
7990       /* One of the register operands will be encoded in the i.rm.reg
7991          field, the other in the combined i.rm.mode and i.rm.regmem
7992          fields.  If no form of this instruction supports a memory
7993          destination operand, then we assume the source operand may
7994          sometimes be a memory operand and so we need to store the
7995          destination in the i.rm.reg field.  */
7996       if (!i.tm.opcode_modifier.regmem
7997           && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
7998         {
7999           i.rm.reg = i.op[dest].regs->reg_num;
8000           i.rm.regmem = i.op[source].regs->reg_num;
8001           set_rex_vrex (i.op[dest].regs, REX_R, i.tm.opcode_modifier.sse2avx);
8002           set_rex_vrex (i.op[source].regs, REX_B, FALSE);
8003         }
8004       else
8005         {
8006           i.rm.reg = i.op[source].regs->reg_num;
8007           i.rm.regmem = i.op[dest].regs->reg_num;
8008           set_rex_vrex (i.op[dest].regs, REX_B, i.tm.opcode_modifier.sse2avx);
8009           set_rex_vrex (i.op[source].regs, REX_R, FALSE);
8010         }
8011       if (flag_code != CODE_64BIT && (i.rex & REX_R))
8012         {
8013           if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
8014             abort ();
8015           i.rex &= ~REX_R;
8016           add_prefix (LOCK_PREFIX_OPCODE);
8017         }
8018     }
8019   else
8020     {                   /* If it's not 2 reg operands...  */
8021       unsigned int mem;
8022
8023       if (i.mem_operands)
8024         {
8025           unsigned int fake_zero_displacement = 0;
8026           unsigned int op;
8027
8028           for (op = 0; op < i.operands; op++)
8029             if (i.flags[op] & Operand_Mem)
8030               break;
8031           gas_assert (op < i.operands);
8032
8033           if (i.tm.opcode_modifier.sib)
8034             {
8035               /* The index register of VSIB shouldn't be RegIZ.  */
8036               if (i.tm.opcode_modifier.sib != SIBMEM
8037                   && i.index_reg->reg_num == RegIZ)
8038                 abort ();
8039
8040               i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8041               if (!i.base_reg)
8042                 {
8043                   i.sib.base = NO_BASE_REGISTER;
8044                   i.sib.scale = i.log2_scale_factor;
8045                   i.types[op].bitfield.disp8 = 0;
8046                   i.types[op].bitfield.disp16 = 0;
8047                   i.types[op].bitfield.disp64 = 0;
8048                   if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
8049                     {
8050                       /* Must be 32 bit */
8051                       i.types[op].bitfield.disp32 = 1;
8052                       i.types[op].bitfield.disp32s = 0;
8053                     }
8054                   else
8055                     {
8056                       i.types[op].bitfield.disp32 = 0;
8057                       i.types[op].bitfield.disp32s = 1;
8058                     }
8059                 }
8060
8061               /* Since the mandatory SIB always has index register, so
8062                  the code logic remains unchanged. The non-mandatory SIB
8063                  without index register is allowed and will be handled
8064                  later.  */
8065               if (i.index_reg)
8066                 {
8067                   if (i.index_reg->reg_num == RegIZ)
8068                     i.sib.index = NO_INDEX_REGISTER;
8069                   else
8070                     i.sib.index = i.index_reg->reg_num;
8071                   set_rex_vrex (i.index_reg, REX_X, FALSE);
8072                 }
8073             }
8074
8075           default_seg = &ds;
8076
8077           if (i.base_reg == 0)
8078             {
8079               i.rm.mode = 0;
8080               if (!i.disp_operands)
8081                 fake_zero_displacement = 1;
8082               if (i.index_reg == 0)
8083                 {
8084                   i386_operand_type newdisp;
8085
8086                   /* Both check for VSIB and mandatory non-vector SIB. */
8087                   gas_assert (!i.tm.opcode_modifier.sib
8088                               || i.tm.opcode_modifier.sib == SIBMEM);
8089                   /* Operand is just <disp>  */
8090                   if (flag_code == CODE_64BIT)
8091                     {
8092                       /* 64bit mode overwrites the 32bit absolute
8093                          addressing by RIP relative addressing and
8094                          absolute addressing is encoded by one of the
8095                          redundant SIB forms.  */
8096                       i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8097                       i.sib.base = NO_BASE_REGISTER;
8098                       i.sib.index = NO_INDEX_REGISTER;
8099                       newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
8100                     }
8101                   else if ((flag_code == CODE_16BIT)
8102                            ^ (i.prefix[ADDR_PREFIX] != 0))
8103                     {
8104                       i.rm.regmem = NO_BASE_REGISTER_16;
8105                       newdisp = disp16;
8106                     }
8107                   else
8108                     {
8109                       i.rm.regmem = NO_BASE_REGISTER;
8110                       newdisp = disp32;
8111                     }
8112                   i.types[op] = operand_type_and_not (i.types[op], anydisp);
8113                   i.types[op] = operand_type_or (i.types[op], newdisp);
8114                 }
8115               else if (!i.tm.opcode_modifier.sib)
8116                 {
8117                   /* !i.base_reg && i.index_reg  */
8118                   if (i.index_reg->reg_num == RegIZ)
8119                     i.sib.index = NO_INDEX_REGISTER;
8120                   else
8121                     i.sib.index = i.index_reg->reg_num;
8122                   i.sib.base = NO_BASE_REGISTER;
8123                   i.sib.scale = i.log2_scale_factor;
8124                   i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8125                   i.types[op].bitfield.disp8 = 0;
8126                   i.types[op].bitfield.disp16 = 0;
8127                   i.types[op].bitfield.disp64 = 0;
8128                   if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
8129                     {
8130                       /* Must be 32 bit */
8131                       i.types[op].bitfield.disp32 = 1;
8132                       i.types[op].bitfield.disp32s = 0;
8133                     }
8134                   else
8135                     {
8136                       i.types[op].bitfield.disp32 = 0;
8137                       i.types[op].bitfield.disp32s = 1;
8138                     }
8139                   if ((i.index_reg->reg_flags & RegRex) != 0)
8140                     i.rex |= REX_X;
8141                 }
8142             }
8143           /* RIP addressing for 64bit mode.  */
8144           else if (i.base_reg->reg_num == RegIP)
8145             {
8146               gas_assert (!i.tm.opcode_modifier.sib);
8147               i.rm.regmem = NO_BASE_REGISTER;
8148               i.types[op].bitfield.disp8 = 0;
8149               i.types[op].bitfield.disp16 = 0;
8150               i.types[op].bitfield.disp32 = 0;
8151               i.types[op].bitfield.disp32s = 1;
8152               i.types[op].bitfield.disp64 = 0;
8153               i.flags[op] |= Operand_PCrel;
8154               if (! i.disp_operands)
8155                 fake_zero_displacement = 1;
8156             }
8157           else if (i.base_reg->reg_type.bitfield.word)
8158             {
8159               gas_assert (!i.tm.opcode_modifier.sib);
8160               switch (i.base_reg->reg_num)
8161                 {
8162                 case 3: /* (%bx)  */
8163                   if (i.index_reg == 0)
8164                     i.rm.regmem = 7;
8165                   else /* (%bx,%si) -> 0, or (%bx,%di) -> 1  */
8166                     i.rm.regmem = i.index_reg->reg_num - 6;
8167                   break;
8168                 case 5: /* (%bp)  */
8169                   default_seg = &ss;
8170                   if (i.index_reg == 0)
8171                     {
8172                       i.rm.regmem = 6;
8173                       if (operand_type_check (i.types[op], disp) == 0)
8174                         {
8175                           /* fake (%bp) into 0(%bp)  */
8176                           if (i.disp_encoding == disp_encoding_16bit)
8177                             i.types[op].bitfield.disp16 = 1;
8178                           else
8179                             i.types[op].bitfield.disp8 = 1;
8180                           fake_zero_displacement = 1;
8181                         }
8182                     }
8183                   else /* (%bp,%si) -> 2, or (%bp,%di) -> 3  */
8184                     i.rm.regmem = i.index_reg->reg_num - 6 + 2;
8185                   break;
8186                 default: /* (%si) -> 4 or (%di) -> 5  */
8187                   i.rm.regmem = i.base_reg->reg_num - 6 + 4;
8188                 }
8189               if (!fake_zero_displacement
8190                   && !i.disp_operands
8191                   && i.disp_encoding)
8192                 {
8193                   fake_zero_displacement = 1;
8194                   if (i.disp_encoding == disp_encoding_8bit)
8195                     i.types[op].bitfield.disp8 = 1;
8196                   else
8197                     i.types[op].bitfield.disp16 = 1;
8198                 }
8199               i.rm.mode = mode_from_disp_size (i.types[op]);
8200             }
8201           else /* i.base_reg and 32/64 bit mode  */
8202             {
8203               if (flag_code == CODE_64BIT
8204                   && operand_type_check (i.types[op], disp))
8205                 {
8206                   i.types[op].bitfield.disp16 = 0;
8207                   i.types[op].bitfield.disp64 = 0;
8208                   if (i.prefix[ADDR_PREFIX] == 0)
8209                     {
8210                       i.types[op].bitfield.disp32 = 0;
8211                       i.types[op].bitfield.disp32s = 1;
8212                     }
8213                   else
8214                     {
8215                       i.types[op].bitfield.disp32 = 1;
8216                       i.types[op].bitfield.disp32s = 0;
8217                     }
8218                 }
8219
8220               if (!i.tm.opcode_modifier.sib)
8221                 i.rm.regmem = i.base_reg->reg_num;
8222               if ((i.base_reg->reg_flags & RegRex) != 0)
8223                 i.rex |= REX_B;
8224               i.sib.base = i.base_reg->reg_num;
8225               /* x86-64 ignores REX prefix bit here to avoid decoder
8226                  complications.  */
8227               if (!(i.base_reg->reg_flags & RegRex)
8228                   && (i.base_reg->reg_num == EBP_REG_NUM
8229                    || i.base_reg->reg_num == ESP_REG_NUM))
8230                   default_seg = &ss;
8231               if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
8232                 {
8233                   fake_zero_displacement = 1;
8234                   if (i.disp_encoding == disp_encoding_32bit)
8235                     i.types[op].bitfield.disp32 = 1;
8236                   else
8237                     i.types[op].bitfield.disp8 = 1;
8238                 }
8239               i.sib.scale = i.log2_scale_factor;
8240               if (i.index_reg == 0)
8241                 {
8242                   /* Only check for VSIB. */
8243                   gas_assert (i.tm.opcode_modifier.sib != VECSIB128
8244                               && i.tm.opcode_modifier.sib != VECSIB256
8245                               && i.tm.opcode_modifier.sib != VECSIB512);
8246
8247                   /* <disp>(%esp) becomes two byte modrm with no index
8248                      register.  We've already stored the code for esp
8249                      in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
8250                      Any base register besides %esp will not use the
8251                      extra modrm byte.  */
8252                   i.sib.index = NO_INDEX_REGISTER;
8253                 }
8254               else if (!i.tm.opcode_modifier.sib)
8255                 {
8256                   if (i.index_reg->reg_num == RegIZ)
8257                     i.sib.index = NO_INDEX_REGISTER;
8258                   else
8259                     i.sib.index = i.index_reg->reg_num;
8260                   i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8261                   if ((i.index_reg->reg_flags & RegRex) != 0)
8262                     i.rex |= REX_X;
8263                 }
8264
8265               if (i.disp_operands
8266                   && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
8267                       || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
8268                 i.rm.mode = 0;
8269               else
8270                 {
8271                   if (!fake_zero_displacement
8272                       && !i.disp_operands
8273                       && i.disp_encoding)
8274                     {
8275                       fake_zero_displacement = 1;
8276                       if (i.disp_encoding == disp_encoding_8bit)
8277                         i.types[op].bitfield.disp8 = 1;
8278                       else
8279                         i.types[op].bitfield.disp32 = 1;
8280                     }
8281                   i.rm.mode = mode_from_disp_size (i.types[op]);
8282                 }
8283             }
8284
8285           if (fake_zero_displacement)
8286             {
8287               /* Fakes a zero displacement assuming that i.types[op]
8288                  holds the correct displacement size.  */
8289               expressionS *exp;
8290
8291               gas_assert (i.op[op].disps == 0);
8292               exp = &disp_expressions[i.disp_operands++];
8293               i.op[op].disps = exp;
8294               exp->X_op = O_constant;
8295               exp->X_add_number = 0;
8296               exp->X_add_symbol = (symbolS *) 0;
8297               exp->X_op_symbol = (symbolS *) 0;
8298             }
8299
8300           mem = op;
8301         }
8302       else
8303         mem = ~0;
8304
8305       if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
8306         {
8307           if (operand_type_check (i.types[0], imm))
8308             i.vex.register_specifier = NULL;
8309           else
8310             {
8311               /* VEX.vvvv encodes one of the sources when the first
8312                  operand is not an immediate.  */
8313               if (i.tm.opcode_modifier.vexw == VEXW0)
8314                 i.vex.register_specifier = i.op[0].regs;
8315               else
8316                 i.vex.register_specifier = i.op[1].regs;
8317             }
8318
8319           /* Destination is a XMM register encoded in the ModRM.reg
8320              and VEX.R bit.  */
8321           i.rm.reg = i.op[2].regs->reg_num;
8322           if ((i.op[2].regs->reg_flags & RegRex) != 0)
8323             i.rex |= REX_R;
8324
8325           /* ModRM.rm and VEX.B encodes the other source.  */
8326           if (!i.mem_operands)
8327             {
8328               i.rm.mode = 3;
8329
8330               if (i.tm.opcode_modifier.vexw == VEXW0)
8331                 i.rm.regmem = i.op[1].regs->reg_num;
8332               else
8333                 i.rm.regmem = i.op[0].regs->reg_num;
8334
8335               if ((i.op[1].regs->reg_flags & RegRex) != 0)
8336                 i.rex |= REX_B;
8337             }
8338         }
8339       else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
8340         {
8341           i.vex.register_specifier = i.op[2].regs;
8342           if (!i.mem_operands)
8343             {
8344               i.rm.mode = 3;
8345               i.rm.regmem = i.op[1].regs->reg_num;
8346               if ((i.op[1].regs->reg_flags & RegRex) != 0)
8347                 i.rex |= REX_B;
8348             }
8349         }
8350       /* Fill in i.rm.reg or i.rm.regmem field with register operand
8351          (if any) based on i.tm.extension_opcode.  Again, we must be
8352          careful to make sure that segment/control/debug/test/MMX
8353          registers are coded into the i.rm.reg field.  */
8354       else if (i.reg_operands)
8355         {
8356           unsigned int op;
8357           unsigned int vex_reg = ~0;
8358
8359           for (op = 0; op < i.operands; op++)
8360             if (i.types[op].bitfield.class == Reg
8361                 || i.types[op].bitfield.class == RegBND
8362                 || i.types[op].bitfield.class == RegMask
8363                 || i.types[op].bitfield.class == SReg
8364                 || i.types[op].bitfield.class == RegCR
8365                 || i.types[op].bitfield.class == RegDR
8366                 || i.types[op].bitfield.class == RegTR
8367                 || i.types[op].bitfield.class == RegSIMD
8368                 || i.types[op].bitfield.class == RegMMX)
8369               break;
8370
8371           if (vex_3_sources)
8372             op = dest;
8373           else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
8374             {
8375               /* For instructions with VexNDS, the register-only
8376                  source operand is encoded in VEX prefix. */
8377               gas_assert (mem != (unsigned int) ~0);
8378
8379               if (op > mem)
8380                 {
8381                   vex_reg = op++;
8382                   gas_assert (op < i.operands);
8383                 }
8384               else
8385                 {
8386                   /* Check register-only source operand when two source
8387                      operands are swapped.  */
8388                   if (!i.tm.operand_types[op].bitfield.baseindex
8389                       && i.tm.operand_types[op + 1].bitfield.baseindex)
8390                     {
8391                       vex_reg = op;
8392                       op += 2;
8393                       gas_assert (mem == (vex_reg + 1)
8394                                   && op < i.operands);
8395                     }
8396                   else
8397                     {
8398                       vex_reg = op + 1;
8399                       gas_assert (vex_reg < i.operands);
8400                     }
8401                 }
8402             }
8403           else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
8404             {
8405               /* For instructions with VexNDD, the register destination
8406                  is encoded in VEX prefix.  */
8407               if (i.mem_operands == 0)
8408                 {
8409                   /* There is no memory operand.  */
8410                   gas_assert ((op + 2) == i.operands);
8411                   vex_reg = op + 1;
8412                 }
8413               else
8414                 {
8415                   /* There are only 2 non-immediate operands.  */
8416                   gas_assert (op < i.imm_operands + 2
8417                               && i.operands == i.imm_operands + 2);
8418                   vex_reg = i.imm_operands + 1;
8419                 }
8420             }
8421           else
8422             gas_assert (op < i.operands);
8423
8424           if (vex_reg != (unsigned int) ~0)
8425             {
8426               i386_operand_type *type = &i.tm.operand_types[vex_reg];
8427
8428               if ((type->bitfield.class != Reg
8429                    || (!type->bitfield.dword && !type->bitfield.qword))
8430                   && type->bitfield.class != RegSIMD
8431                   && !operand_type_equal (type, &regmask))
8432                 abort ();
8433
8434               i.vex.register_specifier = i.op[vex_reg].regs;
8435             }
8436
8437           /* Don't set OP operand twice.  */
8438           if (vex_reg != op)
8439             {
8440               /* If there is an extension opcode to put here, the
8441                  register number must be put into the regmem field.  */
8442               if (i.tm.extension_opcode != None)
8443                 {
8444                   i.rm.regmem = i.op[op].regs->reg_num;
8445                   set_rex_vrex (i.op[op].regs, REX_B,
8446                                 i.tm.opcode_modifier.sse2avx);
8447                 }
8448               else
8449                 {
8450                   i.rm.reg = i.op[op].regs->reg_num;
8451                   set_rex_vrex (i.op[op].regs, REX_R,
8452                                 i.tm.opcode_modifier.sse2avx);
8453                 }
8454             }
8455
8456           /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
8457              must set it to 3 to indicate this is a register operand
8458              in the regmem field.  */
8459           if (!i.mem_operands)
8460             i.rm.mode = 3;
8461         }
8462
8463       /* Fill in i.rm.reg field with extension opcode (if any).  */
8464       if (i.tm.extension_opcode != None)
8465         i.rm.reg = i.tm.extension_opcode;
8466     }
8467   return default_seg;
8468 }
8469
8470 static INLINE void
8471 frag_opcode_byte (unsigned char byte)
8472 {
8473   if (now_seg != absolute_section)
8474     FRAG_APPEND_1_CHAR (byte);
8475   else
8476     ++abs_section_offset;
8477 }
8478
8479 static unsigned int
8480 flip_code16 (unsigned int code16)
8481 {
8482   gas_assert (i.tm.operands == 1);
8483
8484   return !(i.prefix[REX_PREFIX] & REX_W)
8485          && (code16 ? i.tm.operand_types[0].bitfield.disp32
8486                       || i.tm.operand_types[0].bitfield.disp32s
8487                     : i.tm.operand_types[0].bitfield.disp16)
8488          ? CODE16 : 0;
8489 }
8490
8491 static void
8492 output_branch (void)
8493 {
8494   char *p;
8495   int size;
8496   int code16;
8497   int prefix;
8498   relax_substateT subtype;
8499   symbolS *sym;
8500   offsetT off;
8501
8502   if (now_seg == absolute_section)
8503     {
8504       as_bad (_("relaxable branches not supported in absolute section"));
8505       return;
8506     }
8507
8508   code16 = flag_code == CODE_16BIT ? CODE16 : 0;
8509   size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
8510
8511   prefix = 0;
8512   if (i.prefix[DATA_PREFIX] != 0)
8513     {
8514       prefix = 1;
8515       i.prefixes -= 1;
8516       code16 ^= flip_code16(code16);
8517     }
8518   /* Pentium4 branch hints.  */
8519   if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8520       || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8521     {
8522       prefix++;
8523       i.prefixes--;
8524     }
8525   if (i.prefix[REX_PREFIX] != 0)
8526     {
8527       prefix++;
8528       i.prefixes--;
8529     }
8530
8531   /* BND prefixed jump.  */
8532   if (i.prefix[BND_PREFIX] != 0)
8533     {
8534       prefix++;
8535       i.prefixes--;
8536     }
8537
8538   if (i.prefixes != 0)
8539     as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8540
8541   /* It's always a symbol;  End frag & setup for relax.
8542      Make sure there is enough room in this frag for the largest
8543      instruction we may generate in md_convert_frag.  This is 2
8544      bytes for the opcode and room for the prefix and largest
8545      displacement.  */
8546   frag_grow (prefix + 2 + 4);
8547   /* Prefix and 1 opcode byte go in fr_fix.  */
8548   p = frag_more (prefix + 1);
8549   if (i.prefix[DATA_PREFIX] != 0)
8550     *p++ = DATA_PREFIX_OPCODE;
8551   if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
8552       || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
8553     *p++ = i.prefix[SEG_PREFIX];
8554   if (i.prefix[BND_PREFIX] != 0)
8555     *p++ = BND_PREFIX_OPCODE;
8556   if (i.prefix[REX_PREFIX] != 0)
8557     *p++ = i.prefix[REX_PREFIX];
8558   *p = i.tm.base_opcode;
8559
8560   if ((unsigned char) *p == JUMP_PC_RELATIVE)
8561     subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
8562   else if (cpu_arch_flags.bitfield.cpui386)
8563     subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
8564   else
8565     subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
8566   subtype |= code16;
8567
8568   sym = i.op[0].disps->X_add_symbol;
8569   off = i.op[0].disps->X_add_number;
8570
8571   if (i.op[0].disps->X_op != O_constant
8572       && i.op[0].disps->X_op != O_symbol)
8573     {
8574       /* Handle complex expressions.  */
8575       sym = make_expr_symbol (i.op[0].disps);
8576       off = 0;
8577     }
8578
8579   /* 1 possible extra opcode + 4 byte displacement go in var part.
8580      Pass reloc in fr_var.  */
8581   frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
8582 }
8583
8584 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8585 /* Return TRUE iff PLT32 relocation should be used for branching to
8586    symbol S.  */
8587
8588 static bfd_boolean
8589 need_plt32_p (symbolS *s)
8590 {
8591   /* PLT32 relocation is ELF only.  */
8592   if (!IS_ELF)
8593     return FALSE;
8594
8595 #ifdef TE_SOLARIS
8596   /* Don't emit PLT32 relocation on Solaris: neither native linker nor
8597      krtld support it.  */
8598   return FALSE;
8599 #endif
8600
8601   /* Since there is no need to prepare for PLT branch on x86-64, we
8602      can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
8603      be used as a marker for 32-bit PC-relative branches.  */
8604   if (!object_64bit)
8605     return FALSE;
8606
8607   if (s == NULL)
8608     return FALSE;
8609
8610   /* Weak or undefined symbol need PLT32 relocation.  */
8611   if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
8612     return TRUE;
8613
8614   /* Non-global symbol doesn't need PLT32 relocation.  */
8615   if (! S_IS_EXTERNAL (s))
8616     return FALSE;
8617
8618   /* Other global symbols need PLT32 relocation.  NB: Symbol with
8619      non-default visibilities are treated as normal global symbol
8620      so that PLT32 relocation can be used as a marker for 32-bit
8621      PC-relative branches.  It is useful for linker relaxation.  */
8622   return TRUE;
8623 }
8624 #endif
8625
8626 static void
8627 output_jump (void)
8628 {
8629   char *p;
8630   int size;
8631   fixS *fixP;
8632   bfd_reloc_code_real_type jump_reloc = i.reloc[0];
8633
8634   if (i.tm.opcode_modifier.jump == JUMP_BYTE)
8635     {
8636       /* This is a loop or jecxz type instruction.  */
8637       size = 1;
8638       if (i.prefix[ADDR_PREFIX] != 0)
8639         {
8640           frag_opcode_byte (ADDR_PREFIX_OPCODE);
8641           i.prefixes -= 1;
8642         }
8643       /* Pentium4 branch hints.  */
8644       if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8645           || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8646         {
8647           frag_opcode_byte (i.prefix[SEG_PREFIX]);
8648           i.prefixes--;
8649         }
8650     }
8651   else
8652     {
8653       int code16;
8654
8655       code16 = 0;
8656       if (flag_code == CODE_16BIT)
8657         code16 = CODE16;
8658
8659       if (i.prefix[DATA_PREFIX] != 0)
8660         {
8661           frag_opcode_byte (DATA_PREFIX_OPCODE);
8662           i.prefixes -= 1;
8663           code16 ^= flip_code16(code16);
8664         }
8665
8666       size = 4;
8667       if (code16)
8668         size = 2;
8669     }
8670
8671   /* BND prefixed jump.  */
8672   if (i.prefix[BND_PREFIX] != 0)
8673     {
8674       frag_opcode_byte (i.prefix[BND_PREFIX]);
8675       i.prefixes -= 1;
8676     }
8677
8678   if (i.prefix[REX_PREFIX] != 0)
8679     {
8680       frag_opcode_byte (i.prefix[REX_PREFIX]);
8681       i.prefixes -= 1;
8682     }
8683
8684   if (i.prefixes != 0)
8685     as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8686
8687   if (now_seg == absolute_section)
8688     {
8689       abs_section_offset += i.tm.opcode_length + size;
8690       return;
8691     }
8692
8693   p = frag_more (i.tm.opcode_length + size);
8694   switch (i.tm.opcode_length)
8695     {
8696     case 2:
8697       *p++ = i.tm.base_opcode >> 8;
8698       /* Fall through.  */
8699     case 1:
8700       *p++ = i.tm.base_opcode;
8701       break;
8702     default:
8703       abort ();
8704     }
8705
8706 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8707   if (size == 4
8708       && jump_reloc == NO_RELOC
8709       && need_plt32_p (i.op[0].disps->X_add_symbol))
8710     jump_reloc = BFD_RELOC_X86_64_PLT32;
8711 #endif
8712
8713   jump_reloc = reloc (size, 1, 1, jump_reloc);
8714
8715   fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8716                       i.op[0].disps, 1, jump_reloc);
8717
8718   /* All jumps handled here are signed, but don't use a signed limit
8719      check for 32 and 16 bit jumps as we want to allow wrap around at
8720      4G and 64k respectively.  */
8721   if (size == 1)
8722     fixP->fx_signed = 1;
8723 }
8724
8725 static void
8726 output_interseg_jump (void)
8727 {
8728   char *p;
8729   int size;
8730   int prefix;
8731   int code16;
8732
8733   code16 = 0;
8734   if (flag_code == CODE_16BIT)
8735     code16 = CODE16;
8736
8737   prefix = 0;
8738   if (i.prefix[DATA_PREFIX] != 0)
8739     {
8740       prefix = 1;
8741       i.prefixes -= 1;
8742       code16 ^= CODE16;
8743     }
8744
8745   gas_assert (!i.prefix[REX_PREFIX]);
8746
8747   size = 4;
8748   if (code16)
8749     size = 2;
8750
8751   if (i.prefixes != 0)
8752     as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8753
8754   if (now_seg == absolute_section)
8755     {
8756       abs_section_offset += prefix + 1 + 2 + size;
8757       return;
8758     }
8759
8760   /* 1 opcode; 2 segment; offset  */
8761   p = frag_more (prefix + 1 + 2 + size);
8762
8763   if (i.prefix[DATA_PREFIX] != 0)
8764     *p++ = DATA_PREFIX_OPCODE;
8765
8766   if (i.prefix[REX_PREFIX] != 0)
8767     *p++ = i.prefix[REX_PREFIX];
8768
8769   *p++ = i.tm.base_opcode;
8770   if (i.op[1].imms->X_op == O_constant)
8771     {
8772       offsetT n = i.op[1].imms->X_add_number;
8773
8774       if (size == 2
8775           && !fits_in_unsigned_word (n)
8776           && !fits_in_signed_word (n))
8777         {
8778           as_bad (_("16-bit jump out of range"));
8779           return;
8780         }
8781       md_number_to_chars (p, n, size);
8782     }
8783   else
8784     fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8785                  i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
8786
8787   p += size;
8788   if (i.op[0].imms->X_op == O_constant)
8789     md_number_to_chars (p, (valueT) i.op[0].imms->X_add_number, 2);
8790   else
8791     fix_new_exp (frag_now, p - frag_now->fr_literal, 2,
8792                  i.op[0].imms, 0, reloc (2, 0, 0, i.reloc[0]));
8793 }
8794
8795 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8796 void
8797 x86_cleanup (void)
8798 {
8799   char *p;
8800   asection *seg = now_seg;
8801   subsegT subseg = now_subseg;
8802   asection *sec;
8803   unsigned int alignment, align_size_1;
8804   unsigned int isa_1_descsz, feature_2_descsz, descsz;
8805   unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8806   unsigned int padding;
8807
8808   if (!IS_ELF || !x86_used_note)
8809     return;
8810
8811   x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8812
8813   /* The .note.gnu.property section layout:
8814
8815      Field      Length          Contents
8816      ----       ----            ----
8817      n_namsz    4               4
8818      n_descsz   4               The note descriptor size
8819      n_type     4               NT_GNU_PROPERTY_TYPE_0
8820      n_name     4               "GNU"
8821      n_desc     n_descsz        The program property array
8822      ....       ....            ....
8823    */
8824
8825   /* Create the .note.gnu.property section.  */
8826   sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
8827   bfd_set_section_flags (sec,
8828                          (SEC_ALLOC
8829                           | SEC_LOAD
8830                           | SEC_DATA
8831                           | SEC_HAS_CONTENTS
8832                           | SEC_READONLY));
8833
8834   if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8835     {
8836       align_size_1 = 7;
8837       alignment = 3;
8838     }
8839   else
8840     {
8841       align_size_1 = 3;
8842       alignment = 2;
8843     }
8844
8845   bfd_set_section_alignment (sec, alignment);
8846   elf_section_type (sec) = SHT_NOTE;
8847
8848   /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8849                                   + 4-byte data  */
8850   isa_1_descsz_raw = 4 + 4 + 4;
8851   /* Align GNU_PROPERTY_X86_ISA_1_USED.  */
8852   isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8853
8854   feature_2_descsz_raw = isa_1_descsz;
8855   /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8856                                       + 4-byte data  */
8857   feature_2_descsz_raw += 4 + 4 + 4;
8858   /* Align GNU_PROPERTY_X86_FEATURE_2_USED.  */
8859   feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8860                       & ~align_size_1);
8861
8862   descsz = feature_2_descsz;
8863   /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz.  */
8864   p = frag_more (4 + 4 + 4 + 4 + descsz);
8865
8866   /* Write n_namsz.  */
8867   md_number_to_chars (p, (valueT) 4, 4);
8868
8869   /* Write n_descsz.  */
8870   md_number_to_chars (p + 4, (valueT) descsz, 4);
8871
8872   /* Write n_type.  */
8873   md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8874
8875   /* Write n_name.  */
8876   memcpy (p + 4 * 3, "GNU", 4);
8877
8878   /* Write 4-byte type.  */
8879   md_number_to_chars (p + 4 * 4,
8880                       (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8881
8882   /* Write 4-byte data size.  */
8883   md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8884
8885   /* Write 4-byte data.  */
8886   md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8887
8888   /* Zero out paddings.  */
8889   padding = isa_1_descsz - isa_1_descsz_raw;
8890   if (padding)
8891     memset (p + 4 * 7, 0, padding);
8892
8893   /* Write 4-byte type.  */
8894   md_number_to_chars (p + isa_1_descsz + 4 * 4,
8895                       (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8896
8897   /* Write 4-byte data size.  */
8898   md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8899
8900   /* Write 4-byte data.  */
8901   md_number_to_chars (p + isa_1_descsz + 4 * 6,
8902                       (valueT) x86_feature_2_used, 4);
8903
8904   /* Zero out paddings.  */
8905   padding = feature_2_descsz - feature_2_descsz_raw;
8906   if (padding)
8907     memset (p + isa_1_descsz + 4 * 7, 0, padding);
8908
8909   /* We probably can't restore the current segment, for there likely
8910      isn't one yet...  */
8911   if (seg && subseg)
8912     subseg_set (seg, subseg);
8913 }
8914 #endif
8915
8916 static unsigned int
8917 encoding_length (const fragS *start_frag, offsetT start_off,
8918                  const char *frag_now_ptr)
8919 {
8920   unsigned int len = 0;
8921
8922   if (start_frag != frag_now)
8923     {
8924       const fragS *fr = start_frag;
8925
8926       do {
8927         len += fr->fr_fix;
8928         fr = fr->fr_next;
8929       } while (fr && fr != frag_now);
8930     }
8931
8932   return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8933 }
8934
8935 /* Return 1 for test, and, cmp, add, sub, inc and dec which may
8936    be macro-fused with conditional jumps.
8937    NB: If TEST/AND/CMP/ADD/SUB/INC/DEC is of RIP relative address,
8938    or is one of the following format:
8939
8940     cmp m, imm
8941     add m, imm
8942     sub m, imm
8943    test m, imm
8944     and m, imm
8945     inc m
8946     dec m
8947
8948    it is unfusible.  */
8949
8950 static int
8951 maybe_fused_with_jcc_p (enum mf_cmp_kind* mf_cmp_p)
8952 {
8953   /* No RIP address.  */
8954   if (i.base_reg && i.base_reg->reg_num == RegIP)
8955     return 0;
8956
8957   /* No VEX/EVEX encoding.  */
8958   if (is_any_vex_encoding (&i.tm))
8959     return 0;
8960
8961   /* add, sub without add/sub m, imm.  */
8962   if (i.tm.base_opcode <= 5
8963       || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
8964       || ((i.tm.base_opcode | 3) == 0x83
8965           && (i.tm.extension_opcode == 0x5
8966               || i.tm.extension_opcode == 0x0)))
8967     {
8968       *mf_cmp_p = mf_cmp_alu_cmp;
8969       return !(i.mem_operands && i.imm_operands);
8970     }
8971
8972   /* and without and m, imm.  */
8973   if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
8974       || ((i.tm.base_opcode | 3) == 0x83
8975           && i.tm.extension_opcode == 0x4))
8976     {
8977       *mf_cmp_p = mf_cmp_test_and;
8978       return !(i.mem_operands && i.imm_operands);
8979     }
8980
8981   /* test without test m imm.  */
8982   if ((i.tm.base_opcode | 1) == 0x85
8983       || (i.tm.base_opcode | 1) == 0xa9
8984       || ((i.tm.base_opcode | 1) == 0xf7
8985           && i.tm.extension_opcode == 0))
8986     {
8987       *mf_cmp_p = mf_cmp_test_and;
8988       return !(i.mem_operands && i.imm_operands);
8989     }
8990
8991   /* cmp without cmp m, imm.  */
8992   if ((i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
8993       || ((i.tm.base_opcode | 3) == 0x83
8994           && (i.tm.extension_opcode == 0x7)))
8995     {
8996       *mf_cmp_p = mf_cmp_alu_cmp;
8997       return !(i.mem_operands && i.imm_operands);
8998     }
8999
9000   /* inc, dec without inc/dec m.   */
9001   if ((i.tm.cpu_flags.bitfield.cpuno64
9002        && (i.tm.base_opcode | 0xf) == 0x4f)
9003       || ((i.tm.base_opcode | 1) == 0xff
9004           && i.tm.extension_opcode <= 0x1))
9005     {
9006       *mf_cmp_p = mf_cmp_incdec;
9007       return !i.mem_operands;
9008     }
9009
9010   return 0;
9011 }
9012
9013 /* Return 1 if a FUSED_JCC_PADDING frag should be generated.  */
9014
9015 static int
9016 add_fused_jcc_padding_frag_p (enum mf_cmp_kind* mf_cmp_p)
9017 {
9018   /* NB: Don't work with COND_JUMP86 without i386.  */
9019   if (!align_branch_power
9020       || now_seg == absolute_section
9021       || !cpu_arch_flags.bitfield.cpui386
9022       || !(align_branch & align_branch_fused_bit))
9023     return 0;
9024
9025   if (maybe_fused_with_jcc_p (mf_cmp_p))
9026     {
9027       if (last_insn.kind == last_insn_other
9028           || last_insn.seg != now_seg)
9029         return 1;
9030       if (flag_debug)
9031         as_warn_where (last_insn.file, last_insn.line,
9032                        _("`%s` skips -malign-branch-boundary on `%s`"),
9033                        last_insn.name, i.tm.name);
9034     }
9035
9036   return 0;
9037 }
9038
9039 /* Return 1 if a BRANCH_PREFIX frag should be generated.  */
9040
9041 static int
9042 add_branch_prefix_frag_p (void)
9043 {
9044   /* NB: Don't work with COND_JUMP86 without i386.  Don't add prefix
9045      to PadLock instructions since they include prefixes in opcode.  */
9046   if (!align_branch_power
9047       || !align_branch_prefix_size
9048       || now_seg == absolute_section
9049       || i.tm.cpu_flags.bitfield.cpupadlock
9050       || !cpu_arch_flags.bitfield.cpui386)
9051     return 0;
9052
9053   /* Don't add prefix if it is a prefix or there is no operand in case
9054      that segment prefix is special.  */
9055   if (!i.operands || i.tm.opcode_modifier.isprefix)
9056     return 0;
9057
9058   if (last_insn.kind == last_insn_other
9059       || last_insn.seg != now_seg)
9060     return 1;
9061
9062   if (flag_debug)
9063     as_warn_where (last_insn.file, last_insn.line,
9064                    _("`%s` skips -malign-branch-boundary on `%s`"),
9065                    last_insn.name, i.tm.name);
9066
9067   return 0;
9068 }
9069
9070 /* Return 1 if a BRANCH_PADDING frag should be generated.  */
9071
9072 static int
9073 add_branch_padding_frag_p (enum align_branch_kind *branch_p,
9074                            enum mf_jcc_kind *mf_jcc_p)
9075 {
9076   int add_padding;
9077
9078   /* NB: Don't work with COND_JUMP86 without i386.  */
9079   if (!align_branch_power
9080       || now_seg == absolute_section
9081       || !cpu_arch_flags.bitfield.cpui386)
9082     return 0;
9083
9084   add_padding = 0;
9085
9086   /* Check for jcc and direct jmp.  */
9087   if (i.tm.opcode_modifier.jump == JUMP)
9088     {
9089       if (i.tm.base_opcode == JUMP_PC_RELATIVE)
9090         {
9091           *branch_p = align_branch_jmp;
9092           add_padding = align_branch & align_branch_jmp_bit;
9093         }
9094       else
9095         {
9096           /* Because J<cc> and JN<cc> share same group in macro-fusible table,
9097              igore the lowest bit.  */
9098           *mf_jcc_p = (i.tm.base_opcode & 0x0e) >> 1;
9099           *branch_p = align_branch_jcc;
9100           if ((align_branch & align_branch_jcc_bit))
9101             add_padding = 1;
9102         }
9103     }
9104   else if (is_any_vex_encoding (&i.tm))
9105     return 0;
9106   else if ((i.tm.base_opcode | 1) == 0xc3)
9107     {
9108       /* Near ret.  */
9109       *branch_p = align_branch_ret;
9110       if ((align_branch & align_branch_ret_bit))
9111         add_padding = 1;
9112     }
9113   else
9114     {
9115       /* Check for indirect jmp, direct and indirect calls.  */
9116       if (i.tm.base_opcode == 0xe8)
9117         {
9118           /* Direct call.  */
9119           *branch_p = align_branch_call;
9120           if ((align_branch & align_branch_call_bit))
9121             add_padding = 1;
9122         }
9123       else if (i.tm.base_opcode == 0xff
9124                && (i.tm.extension_opcode == 2
9125                    || i.tm.extension_opcode == 4))
9126         {
9127           /* Indirect call and jmp.  */
9128           *branch_p = align_branch_indirect;
9129           if ((align_branch & align_branch_indirect_bit))
9130             add_padding = 1;
9131         }
9132
9133       if (add_padding
9134           && i.disp_operands
9135           && tls_get_addr
9136           && (i.op[0].disps->X_op == O_symbol
9137               || (i.op[0].disps->X_op == O_subtract
9138                   && i.op[0].disps->X_op_symbol == GOT_symbol)))
9139         {
9140           symbolS *s = i.op[0].disps->X_add_symbol;
9141           /* No padding to call to global or undefined tls_get_addr.  */
9142           if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
9143               && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
9144             return 0;
9145         }
9146     }
9147
9148   if (add_padding
9149       && last_insn.kind != last_insn_other
9150       && last_insn.seg == now_seg)
9151     {
9152       if (flag_debug)
9153         as_warn_where (last_insn.file, last_insn.line,
9154                        _("`%s` skips -malign-branch-boundary on `%s`"),
9155                        last_insn.name, i.tm.name);
9156       return 0;
9157     }
9158
9159   return add_padding;
9160 }
9161
9162 static void
9163 output_insn (void)
9164 {
9165   fragS *insn_start_frag;
9166   offsetT insn_start_off;
9167   fragS *fragP = NULL;
9168   enum align_branch_kind branch = align_branch_none;
9169   /* The initializer is arbitrary just to avoid uninitialized error.
9170      it's actually either assigned in add_branch_padding_frag_p
9171      or never be used.  */
9172   enum mf_jcc_kind mf_jcc = mf_jcc_jo;
9173
9174 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9175   if (IS_ELF && x86_used_note && now_seg != absolute_section)
9176     {
9177       if ((i.xstate & xstate_tmm) == xstate_tmm
9178           || i.tm.cpu_flags.bitfield.cpuamx_tile)
9179         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_TMM;
9180
9181       if (i.tm.cpu_flags.bitfield.cpu8087
9182           || i.tm.cpu_flags.bitfield.cpu287
9183           || i.tm.cpu_flags.bitfield.cpu387
9184           || i.tm.cpu_flags.bitfield.cpu687
9185           || i.tm.cpu_flags.bitfield.cpufisttp)
9186         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
9187
9188       if ((i.xstate & xstate_mmx)
9189           || i.tm.base_opcode == 0xf77 /* emms */
9190           || i.tm.base_opcode == 0xf0e /* femms */)
9191         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
9192
9193       if (i.index_reg)
9194         {
9195           if (i.index_reg->reg_type.bitfield.zmmword)
9196             i.xstate |= xstate_zmm;
9197           else if (i.index_reg->reg_type.bitfield.ymmword)
9198             i.xstate |= xstate_ymm;
9199           else if (i.index_reg->reg_type.bitfield.xmmword)
9200             i.xstate |= xstate_xmm;
9201         }
9202
9203       /* vzeroall / vzeroupper */
9204       if (i.tm.base_opcode == 0x77 && i.tm.cpu_flags.bitfield.cpuavx)
9205         i.xstate |= xstate_ymm;
9206
9207       if ((i.xstate & xstate_xmm)
9208           /* ldmxcsr / stmxcsr */
9209           || (i.tm.base_opcode == 0xfae && i.tm.cpu_flags.bitfield.cpusse)
9210           /* vldmxcsr / vstmxcsr */
9211           || (i.tm.base_opcode == 0xae && i.tm.cpu_flags.bitfield.cpuavx)
9212           || i.tm.cpu_flags.bitfield.cpuwidekl
9213           || i.tm.cpu_flags.bitfield.cpukl)
9214         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
9215
9216       if ((i.xstate & xstate_ymm) == xstate_ymm)
9217         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
9218       if ((i.xstate & xstate_zmm) == xstate_zmm)
9219         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
9220       if (i.mask || (i.xstate & xstate_mask) == xstate_mask)
9221         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MASK;
9222       if (i.tm.cpu_flags.bitfield.cpufxsr)
9223         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
9224       if (i.tm.cpu_flags.bitfield.cpuxsave)
9225         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
9226       if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
9227         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
9228       if (i.tm.cpu_flags.bitfield.cpuxsavec)
9229         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
9230
9231       if (x86_feature_2_used
9232           || i.tm.cpu_flags.bitfield.cpucmov
9233           || i.tm.cpu_flags.bitfield.cpusyscall
9234           || (i.tm.base_opcode == 0xfc7
9235               && i.tm.opcode_modifier.opcodeprefix == PREFIX_NONE
9236               && i.tm.extension_opcode == 1) /* cmpxchg8b */)
9237         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_BASELINE;
9238       if (i.tm.cpu_flags.bitfield.cpusse3
9239           || i.tm.cpu_flags.bitfield.cpussse3
9240           || i.tm.cpu_flags.bitfield.cpusse4_1
9241           || i.tm.cpu_flags.bitfield.cpusse4_2
9242           || i.tm.cpu_flags.bitfield.cpucx16
9243           || i.tm.cpu_flags.bitfield.cpupopcnt
9244           /* LAHF-SAHF insns in 64-bit mode.  */
9245           || (flag_code == CODE_64BIT
9246               && (i.tm.base_opcode | 1) == 0x9f))
9247         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_V2;
9248       if (i.tm.cpu_flags.bitfield.cpuavx
9249           || i.tm.cpu_flags.bitfield.cpuavx2
9250           /* Any VEX encoded insns execpt for CpuAVX512F, CpuAVX512BW,
9251              CpuAVX512DQ, LPW, TBM and AMX.  */
9252           || (i.tm.opcode_modifier.vex
9253               && !i.tm.cpu_flags.bitfield.cpuavx512f
9254               && !i.tm.cpu_flags.bitfield.cpuavx512bw
9255               && !i.tm.cpu_flags.bitfield.cpuavx512dq
9256               && !i.tm.cpu_flags.bitfield.cpulwp
9257               && !i.tm.cpu_flags.bitfield.cputbm
9258               && !(x86_feature_2_used & GNU_PROPERTY_X86_FEATURE_2_TMM))
9259           || i.tm.cpu_flags.bitfield.cpuf16c
9260           || i.tm.cpu_flags.bitfield.cpufma
9261           || i.tm.cpu_flags.bitfield.cpulzcnt
9262           || i.tm.cpu_flags.bitfield.cpumovbe
9263           || i.tm.cpu_flags.bitfield.cpuxsaves
9264           || (x86_feature_2_used
9265               & (GNU_PROPERTY_X86_FEATURE_2_XSAVE
9266                  | GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT
9267                  | GNU_PROPERTY_X86_FEATURE_2_XSAVEC)) != 0)
9268         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_V3;
9269       if (i.tm.cpu_flags.bitfield.cpuavx512f
9270           || i.tm.cpu_flags.bitfield.cpuavx512bw
9271           || i.tm.cpu_flags.bitfield.cpuavx512dq
9272           || i.tm.cpu_flags.bitfield.cpuavx512vl
9273           /* Any EVEX encoded insns except for AVX512ER, AVX512PF and
9274              VNNIW.  */
9275           || (i.tm.opcode_modifier.evex
9276               && !i.tm.cpu_flags.bitfield.cpuavx512er
9277               && !i.tm.cpu_flags.bitfield.cpuavx512pf
9278               && !i.tm.cpu_flags.bitfield.cpuavx512_4vnniw))
9279         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_V4;
9280     }
9281 #endif
9282
9283   /* Tie dwarf2 debug info to the address at the start of the insn.
9284      We can't do this after the insn has been output as the current
9285      frag may have been closed off.  eg. by frag_var.  */
9286   dwarf2_emit_insn (0);
9287
9288   insn_start_frag = frag_now;
9289   insn_start_off = frag_now_fix ();
9290
9291   if (add_branch_padding_frag_p (&branch, &mf_jcc))
9292     {
9293       char *p;
9294       /* Branch can be 8 bytes.  Leave some room for prefixes.  */
9295       unsigned int max_branch_padding_size = 14;
9296
9297       /* Align section to boundary.  */
9298       record_alignment (now_seg, align_branch_power);
9299
9300       /* Make room for padding.  */
9301       frag_grow (max_branch_padding_size);
9302
9303       /* Start of the padding.  */
9304       p = frag_more (0);
9305
9306       fragP = frag_now;
9307
9308       frag_var (rs_machine_dependent, max_branch_padding_size, 0,
9309                 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
9310                 NULL, 0, p);
9311
9312       fragP->tc_frag_data.mf_type = mf_jcc;
9313       fragP->tc_frag_data.branch_type = branch;
9314       fragP->tc_frag_data.max_bytes = max_branch_padding_size;
9315     }
9316
9317   /* Output jumps.  */
9318   if (i.tm.opcode_modifier.jump == JUMP)
9319     output_branch ();
9320   else if (i.tm.opcode_modifier.jump == JUMP_BYTE
9321            || i.tm.opcode_modifier.jump == JUMP_DWORD)
9322     output_jump ();
9323   else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
9324     output_interseg_jump ();
9325   else
9326     {
9327       /* Output normal instructions here.  */
9328       char *p;
9329       unsigned char *q;
9330       unsigned int j;
9331       enum mf_cmp_kind mf_cmp;
9332
9333       if (avoid_fence
9334           && (i.tm.base_opcode == 0xfaee8
9335               || i.tm.base_opcode == 0xfaef0
9336               || i.tm.base_opcode == 0xfaef8))
9337         {
9338           /* Encode lfence, mfence, and sfence as
9339              f0 83 04 24 00   lock addl $0x0, (%{re}sp).  */
9340           if (now_seg != absolute_section)
9341             {
9342               offsetT val = 0x240483f0ULL;
9343
9344               p = frag_more (5);
9345               md_number_to_chars (p, val, 5);
9346             }
9347           else
9348             abs_section_offset += 5;
9349           return;
9350         }
9351
9352       /* Some processors fail on LOCK prefix. This options makes
9353          assembler ignore LOCK prefix and serves as a workaround.  */
9354       if (omit_lock_prefix)
9355         {
9356           if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
9357             return;
9358           i.prefix[LOCK_PREFIX] = 0;
9359         }
9360
9361       if (branch)
9362         /* Skip if this is a branch.  */
9363         ;
9364       else if (add_fused_jcc_padding_frag_p (&mf_cmp))
9365         {
9366           /* Make room for padding.  */
9367           frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
9368           p = frag_more (0);
9369
9370           fragP = frag_now;
9371
9372           frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
9373                     ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
9374                     NULL, 0, p);
9375
9376           fragP->tc_frag_data.mf_type = mf_cmp;
9377           fragP->tc_frag_data.branch_type = align_branch_fused;
9378           fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
9379         }
9380       else if (add_branch_prefix_frag_p ())
9381         {
9382           unsigned int max_prefix_size = align_branch_prefix_size;
9383
9384           /* Make room for padding.  */
9385           frag_grow (max_prefix_size);
9386           p = frag_more (0);
9387
9388           fragP = frag_now;
9389
9390           frag_var (rs_machine_dependent, max_prefix_size, 0,
9391                     ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
9392                     NULL, 0, p);
9393
9394           fragP->tc_frag_data.max_bytes = max_prefix_size;
9395         }
9396
9397       /* Since the VEX/EVEX prefix contains the implicit prefix, we
9398          don't need the explicit prefix.  */
9399       if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
9400         {
9401           switch (i.tm.opcode_modifier.opcodeprefix)
9402             {
9403             case PREFIX_0X66:
9404               add_prefix (0x66);
9405               break;
9406             case PREFIX_0XF2:
9407               add_prefix (0xf2);
9408               break;
9409             case PREFIX_0XF3:
9410               if (!i.tm.cpu_flags.bitfield.cpupadlock
9411                   || (i.prefix[REP_PREFIX] != 0xf3))
9412                 add_prefix (0xf3);
9413               break;
9414             case PREFIX_NONE:
9415               switch (i.tm.opcode_length)
9416                 {
9417                 case 3:
9418                 case 2:
9419                 case 1:
9420                   break;
9421                 case 0:
9422                   /* Check for pseudo prefixes.  */
9423                   as_bad_where (insn_start_frag->fr_file,
9424                                 insn_start_frag->fr_line,
9425                                 _("pseudo prefix without instruction"));
9426                   return;
9427                 default:
9428                   abort ();
9429                 }
9430               break;
9431             default:
9432               abort ();
9433             }
9434
9435 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
9436           /* For x32, add a dummy REX_OPCODE prefix for mov/add with
9437              R_X86_64_GOTTPOFF relocation so that linker can safely
9438              perform IE->LE optimization.  A dummy REX_OPCODE prefix
9439              is also needed for lea with R_X86_64_GOTPC32_TLSDESC
9440              relocation for GDesc -> IE/LE optimization.  */
9441           if (x86_elf_abi == X86_64_X32_ABI
9442               && i.operands == 2
9443               && (i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
9444                   || i.reloc[0] == BFD_RELOC_X86_64_GOTPC32_TLSDESC)
9445               && i.prefix[REX_PREFIX] == 0)
9446             add_prefix (REX_OPCODE);
9447 #endif
9448
9449           /* The prefix bytes.  */
9450           for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
9451             if (*q)
9452               frag_opcode_byte (*q);
9453         }
9454       else
9455         {
9456           for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
9457             if (*q)
9458               switch (j)
9459                 {
9460                 case SEG_PREFIX:
9461                 case ADDR_PREFIX:
9462                   frag_opcode_byte (*q);
9463                   break;
9464                 default:
9465                   /* There should be no other prefixes for instructions
9466                      with VEX prefix.  */
9467                   abort ();
9468                 }
9469
9470           /* For EVEX instructions i.vrex should become 0 after
9471              build_evex_prefix.  For VEX instructions upper 16 registers
9472              aren't available, so VREX should be 0.  */
9473           if (i.vrex)
9474             abort ();
9475           /* Now the VEX prefix.  */
9476           if (now_seg != absolute_section)
9477             {
9478               p = frag_more (i.vex.length);
9479               for (j = 0; j < i.vex.length; j++)
9480                 p[j] = i.vex.bytes[j];
9481             }
9482           else
9483             abs_section_offset += i.vex.length;
9484         }
9485
9486       /* Now the opcode; be careful about word order here!  */
9487       if (now_seg == absolute_section)
9488         abs_section_offset += i.tm.opcode_length;
9489       else if (i.tm.opcode_length == 1)
9490         {
9491           FRAG_APPEND_1_CHAR (i.tm.base_opcode);
9492         }
9493       else
9494         {
9495           switch (i.tm.opcode_length)
9496             {
9497             case 4:
9498               p = frag_more (4);
9499               *p++ = (i.tm.base_opcode >> 24) & 0xff;
9500               *p++ = (i.tm.base_opcode >> 16) & 0xff;
9501               break;
9502             case 3:
9503               p = frag_more (3);
9504               *p++ = (i.tm.base_opcode >> 16) & 0xff;
9505               break;
9506             case 2:
9507               p = frag_more (2);
9508               break;
9509             default:
9510               abort ();
9511               break;
9512             }
9513
9514           /* Put out high byte first: can't use md_number_to_chars!  */
9515           *p++ = (i.tm.base_opcode >> 8) & 0xff;
9516           *p = i.tm.base_opcode & 0xff;
9517         }
9518
9519       /* Now the modrm byte and sib byte (if present).  */
9520       if (i.tm.opcode_modifier.modrm)
9521         {
9522           frag_opcode_byte ((i.rm.regmem << 0)
9523                              | (i.rm.reg << 3)
9524                              | (i.rm.mode << 6));
9525           /* If i.rm.regmem == ESP (4)
9526              && i.rm.mode != (Register mode)
9527              && not 16 bit
9528              ==> need second modrm byte.  */
9529           if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
9530               && i.rm.mode != 3
9531               && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
9532             frag_opcode_byte ((i.sib.base << 0)
9533                               | (i.sib.index << 3)
9534                               | (i.sib.scale << 6));
9535         }
9536
9537       if (i.disp_operands)
9538         output_disp (insn_start_frag, insn_start_off);
9539
9540       if (i.imm_operands)
9541         output_imm (insn_start_frag, insn_start_off);
9542
9543       /*
9544        * frag_now_fix () returning plain abs_section_offset when we're in the
9545        * absolute section, and abs_section_offset not getting updated as data
9546        * gets added to the frag breaks the logic below.
9547        */
9548       if (now_seg != absolute_section)
9549         {
9550           j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
9551           if (j > 15)
9552             as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
9553                      j);
9554           else if (fragP)
9555             {
9556               /* NB: Don't add prefix with GOTPC relocation since
9557                  output_disp() above depends on the fixed encoding
9558                  length.  Can't add prefix with TLS relocation since
9559                  it breaks TLS linker optimization.  */
9560               unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
9561               /* Prefix count on the current instruction.  */
9562               unsigned int count = i.vex.length;
9563               unsigned int k;
9564               for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
9565                 /* REX byte is encoded in VEX/EVEX prefix.  */
9566                 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
9567                   count++;
9568
9569               /* Count prefixes for extended opcode maps.  */
9570               if (!i.vex.length)
9571                 switch (i.tm.opcode_length)
9572                   {
9573                   case 3:
9574                     if (((i.tm.base_opcode >> 16) & 0xff) == 0xf)
9575                       {
9576                         count++;
9577                         switch ((i.tm.base_opcode >> 8) & 0xff)
9578                           {
9579                           case 0x38:
9580                           case 0x3a:
9581                             count++;
9582                             break;
9583                           default:
9584                             break;
9585                           }
9586                       }
9587                     break;
9588                   case 2:
9589                     if (((i.tm.base_opcode >> 8) & 0xff) == 0xf)
9590                       count++;
9591                     break;
9592                   case 1:
9593                     break;
9594                   default:
9595                     abort ();
9596                   }
9597
9598               if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
9599                   == BRANCH_PREFIX)
9600                 {
9601                   /* Set the maximum prefix size in BRANCH_PREFIX
9602                      frag.  */
9603                   if (fragP->tc_frag_data.max_bytes > max)
9604                     fragP->tc_frag_data.max_bytes = max;
9605                   if (fragP->tc_frag_data.max_bytes > count)
9606                     fragP->tc_frag_data.max_bytes -= count;
9607                   else
9608                     fragP->tc_frag_data.max_bytes = 0;
9609                 }
9610               else
9611                 {
9612                   /* Remember the maximum prefix size in FUSED_JCC_PADDING
9613                      frag.  */
9614                   unsigned int max_prefix_size;
9615                   if (align_branch_prefix_size > max)
9616                     max_prefix_size = max;
9617                   else
9618                     max_prefix_size = align_branch_prefix_size;
9619                   if (max_prefix_size > count)
9620                     fragP->tc_frag_data.max_prefix_length
9621                       = max_prefix_size - count;
9622                 }
9623
9624               /* Use existing segment prefix if possible.  Use CS
9625                  segment prefix in 64-bit mode.  In 32-bit mode, use SS
9626                  segment prefix with ESP/EBP base register and use DS
9627                  segment prefix without ESP/EBP base register.  */
9628               if (i.prefix[SEG_PREFIX])
9629                 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
9630               else if (flag_code == CODE_64BIT)
9631                 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
9632               else if (i.base_reg
9633                        && (i.base_reg->reg_num == 4
9634                            || i.base_reg->reg_num == 5))
9635                 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
9636               else
9637                 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
9638             }
9639         }
9640     }
9641
9642   /* NB: Don't work with COND_JUMP86 without i386.  */
9643   if (align_branch_power
9644       && now_seg != absolute_section
9645       && cpu_arch_flags.bitfield.cpui386)
9646     {
9647       /* Terminate each frag so that we can add prefix and check for
9648          fused jcc.  */
9649       frag_wane (frag_now);
9650       frag_new (0);
9651     }
9652
9653 #ifdef DEBUG386
9654   if (flag_debug)
9655     {
9656       pi ("" /*line*/, &i);
9657     }
9658 #endif /* DEBUG386  */
9659 }
9660
9661 /* Return the size of the displacement operand N.  */
9662
9663 static int
9664 disp_size (unsigned int n)
9665 {
9666   int size = 4;
9667
9668   if (i.types[n].bitfield.disp64)
9669     size = 8;
9670   else if (i.types[n].bitfield.disp8)
9671     size = 1;
9672   else if (i.types[n].bitfield.disp16)
9673     size = 2;
9674   return size;
9675 }
9676
9677 /* Return the size of the immediate operand N.  */
9678
9679 static int
9680 imm_size (unsigned int n)
9681 {
9682   int size = 4;
9683   if (i.types[n].bitfield.imm64)
9684     size = 8;
9685   else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
9686     size = 1;
9687   else if (i.types[n].bitfield.imm16)
9688     size = 2;
9689   return size;
9690 }
9691
9692 static void
9693 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
9694 {
9695   char *p;
9696   unsigned int n;
9697
9698   for (n = 0; n < i.operands; n++)
9699     {
9700       if (operand_type_check (i.types[n], disp))
9701         {
9702           int size = disp_size (n);
9703
9704           if (now_seg == absolute_section)
9705             abs_section_offset += size;
9706           else if (i.op[n].disps->X_op == O_constant)
9707             {
9708               offsetT val = i.op[n].disps->X_add_number;
9709
9710               val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
9711                                      size);
9712               p = frag_more (size);
9713               md_number_to_chars (p, val, size);
9714             }
9715           else
9716             {
9717               enum bfd_reloc_code_real reloc_type;
9718               int sign = i.types[n].bitfield.disp32s;
9719               int pcrel = (i.flags[n] & Operand_PCrel) != 0;
9720               fixS *fixP;
9721
9722               /* We can't have 8 bit displacement here.  */
9723               gas_assert (!i.types[n].bitfield.disp8);
9724
9725               /* The PC relative address is computed relative
9726                  to the instruction boundary, so in case immediate
9727                  fields follows, we need to adjust the value.  */
9728               if (pcrel && i.imm_operands)
9729                 {
9730                   unsigned int n1;
9731                   int sz = 0;
9732
9733                   for (n1 = 0; n1 < i.operands; n1++)
9734                     if (operand_type_check (i.types[n1], imm))
9735                       {
9736                         /* Only one immediate is allowed for PC
9737                            relative address.  */
9738                         gas_assert (sz == 0);
9739                         sz = imm_size (n1);
9740                         i.op[n].disps->X_add_number -= sz;
9741                       }
9742                   /* We should find the immediate.  */
9743                   gas_assert (sz != 0);
9744                 }
9745
9746               p = frag_more (size);
9747               reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
9748               if (GOT_symbol
9749                   && GOT_symbol == i.op[n].disps->X_add_symbol
9750                   && (((reloc_type == BFD_RELOC_32
9751                         || reloc_type == BFD_RELOC_X86_64_32S
9752                         || (reloc_type == BFD_RELOC_64
9753                             && object_64bit))
9754                        && (i.op[n].disps->X_op == O_symbol
9755                            || (i.op[n].disps->X_op == O_add
9756                                && ((symbol_get_value_expression
9757                                     (i.op[n].disps->X_op_symbol)->X_op)
9758                                    == O_subtract))))
9759                       || reloc_type == BFD_RELOC_32_PCREL))
9760                 {
9761                   if (!object_64bit)
9762                     {
9763                       reloc_type = BFD_RELOC_386_GOTPC;
9764                       i.has_gotpc_tls_reloc = TRUE;
9765                       i.op[n].imms->X_add_number +=
9766                         encoding_length (insn_start_frag, insn_start_off, p);
9767                     }
9768                   else if (reloc_type == BFD_RELOC_64)
9769                     reloc_type = BFD_RELOC_X86_64_GOTPC64;
9770                   else
9771                     /* Don't do the adjustment for x86-64, as there
9772                        the pcrel addressing is relative to the _next_
9773                        insn, and that is taken care of in other code.  */
9774                     reloc_type = BFD_RELOC_X86_64_GOTPC32;
9775                 }
9776               else if (align_branch_power)
9777                 {
9778                   switch (reloc_type)
9779                     {
9780                     case BFD_RELOC_386_TLS_GD:
9781                     case BFD_RELOC_386_TLS_LDM:
9782                     case BFD_RELOC_386_TLS_IE:
9783                     case BFD_RELOC_386_TLS_IE_32:
9784                     case BFD_RELOC_386_TLS_GOTIE:
9785                     case BFD_RELOC_386_TLS_GOTDESC:
9786                     case BFD_RELOC_386_TLS_DESC_CALL:
9787                     case BFD_RELOC_X86_64_TLSGD:
9788                     case BFD_RELOC_X86_64_TLSLD:
9789                     case BFD_RELOC_X86_64_GOTTPOFF:
9790                     case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9791                     case BFD_RELOC_X86_64_TLSDESC_CALL:
9792                       i.has_gotpc_tls_reloc = TRUE;
9793                     default:
9794                       break;
9795                     }
9796                 }
9797               fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
9798                                   size, i.op[n].disps, pcrel,
9799                                   reloc_type);
9800               /* Check for "call/jmp *mem", "mov mem, %reg",
9801                  "test %reg, mem" and "binop mem, %reg" where binop
9802                  is one of adc, add, and, cmp, or, sbb, sub, xor
9803                  instructions without data prefix.  Always generate
9804                  R_386_GOT32X for "sym*GOT" operand in 32-bit mode.  */
9805               if (i.prefix[DATA_PREFIX] == 0
9806                   && (generate_relax_relocations
9807                       || (!object_64bit
9808                           && i.rm.mode == 0
9809                           && i.rm.regmem == 5))
9810                   && (i.rm.mode == 2
9811                       || (i.rm.mode == 0 && i.rm.regmem == 5))
9812                   && !is_any_vex_encoding(&i.tm)
9813                   && ((i.operands == 1
9814                        && i.tm.base_opcode == 0xff
9815                        && (i.rm.reg == 2 || i.rm.reg == 4))
9816                       || (i.operands == 2
9817                           && (i.tm.base_opcode == 0x8b
9818                               || i.tm.base_opcode == 0x85
9819                               || (i.tm.base_opcode & ~0x38) == 0x03))))
9820                 {
9821                   if (object_64bit)
9822                     {
9823                       fixP->fx_tcbit = i.rex != 0;
9824                       if (i.base_reg
9825                           && (i.base_reg->reg_num == RegIP))
9826                       fixP->fx_tcbit2 = 1;
9827                     }
9828                   else
9829                     fixP->fx_tcbit2 = 1;
9830                 }
9831             }
9832         }
9833     }
9834 }
9835
9836 static void
9837 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
9838 {
9839   char *p;
9840   unsigned int n;
9841
9842   for (n = 0; n < i.operands; n++)
9843     {
9844       /* Skip SAE/RC Imm operand in EVEX.  They are already handled.  */
9845       if (i.rounding && (int) n == i.rounding->operand)
9846         continue;
9847
9848       if (operand_type_check (i.types[n], imm))
9849         {
9850           int size = imm_size (n);
9851
9852           if (now_seg == absolute_section)
9853             abs_section_offset += size;
9854           else if (i.op[n].imms->X_op == O_constant)
9855             {
9856               offsetT val;
9857
9858               val = offset_in_range (i.op[n].imms->X_add_number,
9859                                      size);
9860               p = frag_more (size);
9861               md_number_to_chars (p, val, size);
9862             }
9863           else
9864             {
9865               /* Not absolute_section.
9866                  Need a 32-bit fixup (don't support 8bit
9867                  non-absolute imms).  Try to support other
9868                  sizes ...  */
9869               enum bfd_reloc_code_real reloc_type;
9870               int sign;
9871
9872               if (i.types[n].bitfield.imm32s
9873                   && (i.suffix == QWORD_MNEM_SUFFIX
9874                       || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
9875                 sign = 1;
9876               else
9877                 sign = 0;
9878
9879               p = frag_more (size);
9880               reloc_type = reloc (size, 0, sign, i.reloc[n]);
9881
9882               /*   This is tough to explain.  We end up with this one if we
9883                * have operands that look like
9884                * "_GLOBAL_OFFSET_TABLE_+[.-.L284]".  The goal here is to
9885                * obtain the absolute address of the GOT, and it is strongly
9886                * preferable from a performance point of view to avoid using
9887                * a runtime relocation for this.  The actual sequence of
9888                * instructions often look something like:
9889                *
9890                *        call    .L66
9891                * .L66:
9892                *        popl    %ebx
9893                *        addl    $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
9894                *
9895                *   The call and pop essentially return the absolute address
9896                * of the label .L66 and store it in %ebx.  The linker itself
9897                * will ultimately change the first operand of the addl so
9898                * that %ebx points to the GOT, but to keep things simple, the
9899                * .o file must have this operand set so that it generates not
9900                * the absolute address of .L66, but the absolute address of
9901                * itself.  This allows the linker itself simply treat a GOTPC
9902                * relocation as asking for a pcrel offset to the GOT to be
9903                * added in, and the addend of the relocation is stored in the
9904                * operand field for the instruction itself.
9905                *
9906                *   Our job here is to fix the operand so that it would add
9907                * the correct offset so that %ebx would point to itself.  The
9908                * thing that is tricky is that .-.L66 will point to the
9909                * beginning of the instruction, so we need to further modify
9910                * the operand so that it will point to itself.  There are
9911                * other cases where you have something like:
9912                *
9913                *        .long   $_GLOBAL_OFFSET_TABLE_+[.-.L66]
9914                *
9915                * and here no correction would be required.  Internally in
9916                * the assembler we treat operands of this form as not being
9917                * pcrel since the '.' is explicitly mentioned, and I wonder
9918                * whether it would simplify matters to do it this way.  Who
9919                * knows.  In earlier versions of the PIC patches, the
9920                * pcrel_adjust field was used to store the correction, but
9921                * since the expression is not pcrel, I felt it would be
9922                * confusing to do it this way.  */
9923
9924               if ((reloc_type == BFD_RELOC_32
9925                    || reloc_type == BFD_RELOC_X86_64_32S
9926                    || reloc_type == BFD_RELOC_64)
9927                   && GOT_symbol
9928                   && GOT_symbol == i.op[n].imms->X_add_symbol
9929                   && (i.op[n].imms->X_op == O_symbol
9930                       || (i.op[n].imms->X_op == O_add
9931                           && ((symbol_get_value_expression
9932                                (i.op[n].imms->X_op_symbol)->X_op)
9933                               == O_subtract))))
9934                 {
9935                   if (!object_64bit)
9936                     reloc_type = BFD_RELOC_386_GOTPC;
9937                   else if (size == 4)
9938                     reloc_type = BFD_RELOC_X86_64_GOTPC32;
9939                   else if (size == 8)
9940                     reloc_type = BFD_RELOC_X86_64_GOTPC64;
9941                   i.has_gotpc_tls_reloc = TRUE;
9942                   i.op[n].imms->X_add_number +=
9943                     encoding_length (insn_start_frag, insn_start_off, p);
9944                 }
9945               fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9946                            i.op[n].imms, 0, reloc_type);
9947             }
9948         }
9949     }
9950 }
9951 \f
9952 /* x86_cons_fix_new is called via the expression parsing code when a
9953    reloc is needed.  We use this hook to get the correct .got reloc.  */
9954 static int cons_sign = -1;
9955
9956 void
9957 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
9958                   expressionS *exp, bfd_reloc_code_real_type r)
9959 {
9960   r = reloc (len, 0, cons_sign, r);
9961
9962 #ifdef TE_PE
9963   if (exp->X_op == O_secrel)
9964     {
9965       exp->X_op = O_symbol;
9966       r = BFD_RELOC_32_SECREL;
9967     }
9968 #endif
9969
9970   fix_new_exp (frag, off, len, exp, 0, r);
9971 }
9972
9973 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
9974    purpose of the `.dc.a' internal pseudo-op.  */
9975
9976 int
9977 x86_address_bytes (void)
9978 {
9979   if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
9980     return 4;
9981   return stdoutput->arch_info->bits_per_address / 8;
9982 }
9983
9984 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
9985     || defined (LEX_AT)
9986 # define lex_got(reloc, adjust, types) NULL
9987 #else
9988 /* Parse operands of the form
9989    <symbol>@GOTOFF+<nnn>
9990    and similar .plt or .got references.
9991
9992    If we find one, set up the correct relocation in RELOC and copy the
9993    input string, minus the `@GOTOFF' into a malloc'd buffer for
9994    parsing by the calling routine.  Return this buffer, and if ADJUST
9995    is non-null set it to the length of the string we removed from the
9996    input line.  Otherwise return NULL.  */
9997 static char *
9998 lex_got (enum bfd_reloc_code_real *rel,
9999          int *adjust,
10000          i386_operand_type *types)
10001 {
10002   /* Some of the relocations depend on the size of what field is to
10003      be relocated.  But in our callers i386_immediate and i386_displacement
10004      we don't yet know the operand size (this will be set by insn
10005      matching).  Hence we record the word32 relocation here,
10006      and adjust the reloc according to the real size in reloc().  */
10007   static const struct {
10008     const char *str;
10009     int len;
10010     const enum bfd_reloc_code_real rel[2];
10011     const i386_operand_type types64;
10012     bfd_boolean need_GOT_symbol;
10013   } gotrel[] = {
10014 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10015     { STRING_COMMA_LEN ("SIZE"),      { BFD_RELOC_SIZE32,
10016                                         BFD_RELOC_SIZE32 },
10017       OPERAND_TYPE_IMM32_64, FALSE },
10018 #endif
10019     { STRING_COMMA_LEN ("PLTOFF"),   { _dummy_first_bfd_reloc_code_real,
10020                                        BFD_RELOC_X86_64_PLTOFF64 },
10021       OPERAND_TYPE_IMM64, TRUE },
10022     { STRING_COMMA_LEN ("PLT"),      { BFD_RELOC_386_PLT32,
10023                                        BFD_RELOC_X86_64_PLT32    },
10024       OPERAND_TYPE_IMM32_32S_DISP32, FALSE },
10025     { STRING_COMMA_LEN ("GOTPLT"),   { _dummy_first_bfd_reloc_code_real,
10026                                        BFD_RELOC_X86_64_GOTPLT64 },
10027       OPERAND_TYPE_IMM64_DISP64, TRUE },
10028     { STRING_COMMA_LEN ("GOTOFF"),   { BFD_RELOC_386_GOTOFF,
10029                                        BFD_RELOC_X86_64_GOTOFF64 },
10030       OPERAND_TYPE_IMM64_DISP64, TRUE },
10031     { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
10032                                        BFD_RELOC_X86_64_GOTPCREL },
10033       OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10034     { STRING_COMMA_LEN ("TLSGD"),    { BFD_RELOC_386_TLS_GD,
10035                                        BFD_RELOC_X86_64_TLSGD    },
10036       OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10037     { STRING_COMMA_LEN ("TLSLDM"),   { BFD_RELOC_386_TLS_LDM,
10038                                        _dummy_first_bfd_reloc_code_real },
10039       OPERAND_TYPE_NONE, TRUE },
10040     { STRING_COMMA_LEN ("TLSLD"),    { _dummy_first_bfd_reloc_code_real,
10041                                        BFD_RELOC_X86_64_TLSLD    },
10042       OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10043     { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
10044                                        BFD_RELOC_X86_64_GOTTPOFF },
10045       OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10046     { STRING_COMMA_LEN ("TPOFF"),    { BFD_RELOC_386_TLS_LE_32,
10047                                        BFD_RELOC_X86_64_TPOFF32  },
10048       OPERAND_TYPE_IMM32_32S_64_DISP32_64, TRUE },
10049     { STRING_COMMA_LEN ("NTPOFF"),   { BFD_RELOC_386_TLS_LE,
10050                                        _dummy_first_bfd_reloc_code_real },
10051       OPERAND_TYPE_NONE, TRUE },
10052     { STRING_COMMA_LEN ("DTPOFF"),   { BFD_RELOC_386_TLS_LDO_32,
10053                                        BFD_RELOC_X86_64_DTPOFF32 },
10054       OPERAND_TYPE_IMM32_32S_64_DISP32_64, TRUE },
10055     { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
10056                                        _dummy_first_bfd_reloc_code_real },
10057       OPERAND_TYPE_NONE, TRUE },
10058     { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
10059                                        _dummy_first_bfd_reloc_code_real },
10060       OPERAND_TYPE_NONE, TRUE },
10061     { STRING_COMMA_LEN ("GOT"),      { BFD_RELOC_386_GOT32,
10062                                        BFD_RELOC_X86_64_GOT32    },
10063       OPERAND_TYPE_IMM32_32S_64_DISP32, TRUE },
10064     { STRING_COMMA_LEN ("TLSDESC"),  { BFD_RELOC_386_TLS_GOTDESC,
10065                                        BFD_RELOC_X86_64_GOTPC32_TLSDESC },
10066       OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10067     { STRING_COMMA_LEN ("TLSCALL"),  { BFD_RELOC_386_TLS_DESC_CALL,
10068                                        BFD_RELOC_X86_64_TLSDESC_CALL },
10069       OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10070   };
10071   char *cp;
10072   unsigned int j;
10073
10074 #if defined (OBJ_MAYBE_ELF)
10075   if (!IS_ELF)
10076     return NULL;
10077 #endif
10078
10079   for (cp = input_line_pointer; *cp != '@'; cp++)
10080     if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
10081       return NULL;
10082
10083   for (j = 0; j < ARRAY_SIZE (gotrel); j++)
10084     {
10085       int len = gotrel[j].len;
10086       if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
10087         {
10088           if (gotrel[j].rel[object_64bit] != 0)
10089             {
10090               int first, second;
10091               char *tmpbuf, *past_reloc;
10092
10093               *rel = gotrel[j].rel[object_64bit];
10094
10095               if (types)
10096                 {
10097                   if (flag_code != CODE_64BIT)
10098                     {
10099                       types->bitfield.imm32 = 1;
10100                       types->bitfield.disp32 = 1;
10101                     }
10102                   else
10103                     *types = gotrel[j].types64;
10104                 }
10105
10106               if (gotrel[j].need_GOT_symbol && GOT_symbol == NULL)
10107                 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
10108
10109               /* The length of the first part of our input line.  */
10110               first = cp - input_line_pointer;
10111
10112               /* The second part goes from after the reloc token until
10113                  (and including) an end_of_line char or comma.  */
10114               past_reloc = cp + 1 + len;
10115               cp = past_reloc;
10116               while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10117                 ++cp;
10118               second = cp + 1 - past_reloc;
10119
10120               /* Allocate and copy string.  The trailing NUL shouldn't
10121                  be necessary, but be safe.  */
10122               tmpbuf = XNEWVEC (char, first + second + 2);
10123               memcpy (tmpbuf, input_line_pointer, first);
10124               if (second != 0 && *past_reloc != ' ')
10125                 /* Replace the relocation token with ' ', so that
10126                    errors like foo@GOTOFF1 will be detected.  */
10127                 tmpbuf[first++] = ' ';
10128               else
10129                 /* Increment length by 1 if the relocation token is
10130                    removed.  */
10131                 len++;
10132               if (adjust)
10133                 *adjust = len;
10134               memcpy (tmpbuf + first, past_reloc, second);
10135               tmpbuf[first + second] = '\0';
10136               return tmpbuf;
10137             }
10138
10139           as_bad (_("@%s reloc is not supported with %d-bit output format"),
10140                   gotrel[j].str, 1 << (5 + object_64bit));
10141           return NULL;
10142         }
10143     }
10144
10145   /* Might be a symbol version string.  Don't as_bad here.  */
10146   return NULL;
10147 }
10148 #endif
10149
10150 #ifdef TE_PE
10151 #ifdef lex_got
10152 #undef lex_got
10153 #endif
10154 /* Parse operands of the form
10155    <symbol>@SECREL32+<nnn>
10156
10157    If we find one, set up the correct relocation in RELOC and copy the
10158    input string, minus the `@SECREL32' into a malloc'd buffer for
10159    parsing by the calling routine.  Return this buffer, and if ADJUST
10160    is non-null set it to the length of the string we removed from the
10161    input line.  Otherwise return NULL.
10162
10163    This function is copied from the ELF version above adjusted for PE targets.  */
10164
10165 static char *
10166 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
10167          int *adjust ATTRIBUTE_UNUSED,
10168          i386_operand_type *types)
10169 {
10170   static const struct
10171   {
10172     const char *str;
10173     int len;
10174     const enum bfd_reloc_code_real rel[2];
10175     const i386_operand_type types64;
10176   }
10177   gotrel[] =
10178   {
10179     { STRING_COMMA_LEN ("SECREL32"),    { BFD_RELOC_32_SECREL,
10180                                           BFD_RELOC_32_SECREL },
10181       OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
10182   };
10183
10184   char *cp;
10185   unsigned j;
10186
10187   for (cp = input_line_pointer; *cp != '@'; cp++)
10188     if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
10189       return NULL;
10190
10191   for (j = 0; j < ARRAY_SIZE (gotrel); j++)
10192     {
10193       int len = gotrel[j].len;
10194
10195       if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
10196         {
10197           if (gotrel[j].rel[object_64bit] != 0)
10198             {
10199               int first, second;
10200               char *tmpbuf, *past_reloc;
10201
10202               *rel = gotrel[j].rel[object_64bit];
10203               if (adjust)
10204                 *adjust = len;
10205
10206               if (types)
10207                 {
10208                   if (flag_code != CODE_64BIT)
10209                     {
10210                       types->bitfield.imm32 = 1;
10211                       types->bitfield.disp32 = 1;
10212                     }
10213                   else
10214                     *types = gotrel[j].types64;
10215                 }
10216
10217               /* The length of the first part of our input line.  */
10218               first = cp - input_line_pointer;
10219
10220               /* The second part goes from after the reloc token until
10221                  (and including) an end_of_line char or comma.  */
10222               past_reloc = cp + 1 + len;
10223               cp = past_reloc;
10224               while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10225                 ++cp;
10226               second = cp + 1 - past_reloc;
10227
10228               /* Allocate and copy string.  The trailing NUL shouldn't
10229                  be necessary, but be safe.  */
10230               tmpbuf = XNEWVEC (char, first + second + 2);
10231               memcpy (tmpbuf, input_line_pointer, first);
10232               if (second != 0 && *past_reloc != ' ')
10233                 /* Replace the relocation token with ' ', so that
10234                    errors like foo@SECLREL321 will be detected.  */
10235                 tmpbuf[first++] = ' ';
10236               memcpy (tmpbuf + first, past_reloc, second);
10237               tmpbuf[first + second] = '\0';
10238               return tmpbuf;
10239             }
10240
10241           as_bad (_("@%s reloc is not supported with %d-bit output format"),
10242                   gotrel[j].str, 1 << (5 + object_64bit));
10243           return NULL;
10244         }
10245     }
10246
10247   /* Might be a symbol version string.  Don't as_bad here.  */
10248   return NULL;
10249 }
10250
10251 #endif /* TE_PE */
10252
10253 bfd_reloc_code_real_type
10254 x86_cons (expressionS *exp, int size)
10255 {
10256   bfd_reloc_code_real_type got_reloc = NO_RELOC;
10257
10258   intel_syntax = -intel_syntax;
10259
10260   exp->X_md = 0;
10261   if (size == 4 || (object_64bit && size == 8))
10262     {
10263       /* Handle @GOTOFF and the like in an expression.  */
10264       char *save;
10265       char *gotfree_input_line;
10266       int adjust = 0;
10267
10268       save = input_line_pointer;
10269       gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
10270       if (gotfree_input_line)
10271         input_line_pointer = gotfree_input_line;
10272
10273       expression (exp);
10274
10275       if (gotfree_input_line)
10276         {
10277           /* expression () has merrily parsed up to the end of line,
10278              or a comma - in the wrong buffer.  Transfer how far
10279              input_line_pointer has moved to the right buffer.  */
10280           input_line_pointer = (save
10281                                 + (input_line_pointer - gotfree_input_line)
10282                                 + adjust);
10283           free (gotfree_input_line);
10284           if (exp->X_op == O_constant
10285               || exp->X_op == O_absent
10286               || exp->X_op == O_illegal
10287               || exp->X_op == O_register
10288               || exp->X_op == O_big)
10289             {
10290               char c = *input_line_pointer;
10291               *input_line_pointer = 0;
10292               as_bad (_("missing or invalid expression `%s'"), save);
10293               *input_line_pointer = c;
10294             }
10295           else if ((got_reloc == BFD_RELOC_386_PLT32
10296                     || got_reloc == BFD_RELOC_X86_64_PLT32)
10297                    && exp->X_op != O_symbol)
10298             {
10299               char c = *input_line_pointer;
10300               *input_line_pointer = 0;
10301               as_bad (_("invalid PLT expression `%s'"), save);
10302               *input_line_pointer = c;
10303             }
10304         }
10305     }
10306   else
10307     expression (exp);
10308
10309   intel_syntax = -intel_syntax;
10310
10311   if (intel_syntax)
10312     i386_intel_simplify (exp);
10313
10314   return got_reloc;
10315 }
10316
10317 static void
10318 signed_cons (int size)
10319 {
10320   if (flag_code == CODE_64BIT)
10321     cons_sign = 1;
10322   cons (size);
10323   cons_sign = -1;
10324 }
10325
10326 #ifdef TE_PE
10327 static void
10328 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
10329 {
10330   expressionS exp;
10331
10332   do
10333     {
10334       expression (&exp);
10335       if (exp.X_op == O_symbol)
10336         exp.X_op = O_secrel;
10337
10338       emit_expr (&exp, 4);
10339     }
10340   while (*input_line_pointer++ == ',');
10341
10342   input_line_pointer--;
10343   demand_empty_rest_of_line ();
10344 }
10345 #endif
10346
10347 /* Handle Vector operations.  */
10348
10349 static char *
10350 check_VecOperations (char *op_string, char *op_end)
10351 {
10352   const reg_entry *mask;
10353   const char *saved;
10354   char *end_op;
10355
10356   while (*op_string
10357          && (op_end == NULL || op_string < op_end))
10358     {
10359       saved = op_string;
10360       if (*op_string == '{')
10361         {
10362           op_string++;
10363
10364           /* Check broadcasts.  */
10365           if (strncmp (op_string, "1to", 3) == 0)
10366             {
10367               int bcst_type;
10368
10369               if (i.broadcast)
10370                 goto duplicated_vec_op;
10371
10372               op_string += 3;
10373               if (*op_string == '8')
10374                 bcst_type = 8;
10375               else if (*op_string == '4')
10376                 bcst_type = 4;
10377               else if (*op_string == '2')
10378                 bcst_type = 2;
10379               else if (*op_string == '1'
10380                        && *(op_string+1) == '6')
10381                 {
10382                   bcst_type = 16;
10383                   op_string++;
10384                 }
10385               else
10386                 {
10387                   as_bad (_("Unsupported broadcast: `%s'"), saved);
10388                   return NULL;
10389                 }
10390               op_string++;
10391
10392               broadcast_op.type = bcst_type;
10393               broadcast_op.operand = this_operand;
10394               broadcast_op.bytes = 0;
10395               i.broadcast = &broadcast_op;
10396             }
10397           /* Check masking operation.  */
10398           else if ((mask = parse_register (op_string, &end_op)) != NULL)
10399             {
10400               if (mask == &bad_reg)
10401                 return NULL;
10402
10403               /* k0 can't be used for write mask.  */
10404               if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
10405                 {
10406                   as_bad (_("`%s%s' can't be used for write mask"),
10407                           register_prefix, mask->reg_name);
10408                   return NULL;
10409                 }
10410
10411               if (!i.mask)
10412                 {
10413                   mask_op.mask = mask;
10414                   mask_op.zeroing = 0;
10415                   mask_op.operand = this_operand;
10416                   i.mask = &mask_op;
10417                 }
10418               else
10419                 {
10420                   if (i.mask->mask)
10421                     goto duplicated_vec_op;
10422
10423                   i.mask->mask = mask;
10424
10425                   /* Only "{z}" is allowed here.  No need to check
10426                      zeroing mask explicitly.  */
10427                   if (i.mask->operand != this_operand)
10428                     {
10429                       as_bad (_("invalid write mask `%s'"), saved);
10430                       return NULL;
10431                     }
10432                 }
10433
10434               op_string = end_op;
10435             }
10436           /* Check zeroing-flag for masking operation.  */
10437           else if (*op_string == 'z')
10438             {
10439               if (!i.mask)
10440                 {
10441                   mask_op.mask = NULL;
10442                   mask_op.zeroing = 1;
10443                   mask_op.operand = this_operand;
10444                   i.mask = &mask_op;
10445                 }
10446               else
10447                 {
10448                   if (i.mask->zeroing)
10449                     {
10450                     duplicated_vec_op:
10451                       as_bad (_("duplicated `%s'"), saved);
10452                       return NULL;
10453                     }
10454
10455                   i.mask->zeroing = 1;
10456
10457                   /* Only "{%k}" is allowed here.  No need to check mask
10458                      register explicitly.  */
10459                   if (i.mask->operand != this_operand)
10460                     {
10461                       as_bad (_("invalid zeroing-masking `%s'"),
10462                               saved);
10463                       return NULL;
10464                     }
10465                 }
10466
10467               op_string++;
10468             }
10469           else
10470             goto unknown_vec_op;
10471
10472           if (*op_string != '}')
10473             {
10474               as_bad (_("missing `}' in `%s'"), saved);
10475               return NULL;
10476             }
10477           op_string++;
10478
10479           /* Strip whitespace since the addition of pseudo prefixes
10480              changed how the scrubber treats '{'.  */
10481           if (is_space_char (*op_string))
10482             ++op_string;
10483
10484           continue;
10485         }
10486     unknown_vec_op:
10487       /* We don't know this one.  */
10488       as_bad (_("unknown vector operation: `%s'"), saved);
10489       return NULL;
10490     }
10491
10492   if (i.mask && i.mask->zeroing && !i.mask->mask)
10493     {
10494       as_bad (_("zeroing-masking only allowed with write mask"));
10495       return NULL;
10496     }
10497
10498   return op_string;
10499 }
10500
10501 static int
10502 i386_immediate (char *imm_start)
10503 {
10504   char *save_input_line_pointer;
10505   char *gotfree_input_line;
10506   segT exp_seg = 0;
10507   expressionS *exp;
10508   i386_operand_type types;
10509
10510   operand_type_set (&types, ~0);
10511
10512   if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
10513     {
10514       as_bad (_("at most %d immediate operands are allowed"),
10515               MAX_IMMEDIATE_OPERANDS);
10516       return 0;
10517     }
10518
10519   exp = &im_expressions[i.imm_operands++];
10520   i.op[this_operand].imms = exp;
10521
10522   if (is_space_char (*imm_start))
10523     ++imm_start;
10524
10525   save_input_line_pointer = input_line_pointer;
10526   input_line_pointer = imm_start;
10527
10528   gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10529   if (gotfree_input_line)
10530     input_line_pointer = gotfree_input_line;
10531
10532   exp_seg = expression (exp);
10533
10534   SKIP_WHITESPACE ();
10535
10536   /* Handle vector operations.  */
10537   if (*input_line_pointer == '{')
10538     {
10539       input_line_pointer = check_VecOperations (input_line_pointer,
10540                                                 NULL);
10541       if (input_line_pointer == NULL)
10542         return 0;
10543     }
10544
10545   if (*input_line_pointer)
10546     as_bad (_("junk `%s' after expression"), input_line_pointer);
10547
10548   input_line_pointer = save_input_line_pointer;
10549   if (gotfree_input_line)
10550     {
10551       free (gotfree_input_line);
10552
10553       if (exp->X_op == O_constant || exp->X_op == O_register)
10554         exp->X_op = O_illegal;
10555     }
10556
10557   return i386_finalize_immediate (exp_seg, exp, types, imm_start);
10558 }
10559
10560 static int
10561 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10562                          i386_operand_type types, const char *imm_start)
10563 {
10564   if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
10565     {
10566       if (imm_start)
10567         as_bad (_("missing or invalid immediate expression `%s'"),
10568                 imm_start);
10569       return 0;
10570     }
10571   else if (exp->X_op == O_constant)
10572     {
10573       /* Size it properly later.  */
10574       i.types[this_operand].bitfield.imm64 = 1;
10575       /* If not 64bit, sign extend val.  */
10576       if (flag_code != CODE_64BIT
10577           && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
10578         exp->X_add_number
10579           = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
10580     }
10581 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10582   else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
10583            && exp_seg != absolute_section
10584            && exp_seg != text_section
10585            && exp_seg != data_section
10586            && exp_seg != bss_section
10587            && exp_seg != undefined_section
10588            && !bfd_is_com_section (exp_seg))
10589     {
10590       as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10591       return 0;
10592     }
10593 #endif
10594   else if (!intel_syntax && exp_seg == reg_section)
10595     {
10596       if (imm_start)
10597         as_bad (_("illegal immediate register operand %s"), imm_start);
10598       return 0;
10599     }
10600   else
10601     {
10602       /* This is an address.  The size of the address will be
10603          determined later, depending on destination register,
10604          suffix, or the default for the section.  */
10605       i.types[this_operand].bitfield.imm8 = 1;
10606       i.types[this_operand].bitfield.imm16 = 1;
10607       i.types[this_operand].bitfield.imm32 = 1;
10608       i.types[this_operand].bitfield.imm32s = 1;
10609       i.types[this_operand].bitfield.imm64 = 1;
10610       i.types[this_operand] = operand_type_and (i.types[this_operand],
10611                                                 types);
10612     }
10613
10614   return 1;
10615 }
10616
10617 static char *
10618 i386_scale (char *scale)
10619 {
10620   offsetT val;
10621   char *save = input_line_pointer;
10622
10623   input_line_pointer = scale;
10624   val = get_absolute_expression ();
10625
10626   switch (val)
10627     {
10628     case 1:
10629       i.log2_scale_factor = 0;
10630       break;
10631     case 2:
10632       i.log2_scale_factor = 1;
10633       break;
10634     case 4:
10635       i.log2_scale_factor = 2;
10636       break;
10637     case 8:
10638       i.log2_scale_factor = 3;
10639       break;
10640     default:
10641       {
10642         char sep = *input_line_pointer;
10643
10644         *input_line_pointer = '\0';
10645         as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
10646                 scale);
10647         *input_line_pointer = sep;
10648         input_line_pointer = save;
10649         return NULL;
10650       }
10651     }
10652   if (i.log2_scale_factor != 0 && i.index_reg == 0)
10653     {
10654       as_warn (_("scale factor of %d without an index register"),
10655                1 << i.log2_scale_factor);
10656       i.log2_scale_factor = 0;
10657     }
10658   scale = input_line_pointer;
10659   input_line_pointer = save;
10660   return scale;
10661 }
10662
10663 static int
10664 i386_displacement (char *disp_start, char *disp_end)
10665 {
10666   expressionS *exp;
10667   segT exp_seg = 0;
10668   char *save_input_line_pointer;
10669   char *gotfree_input_line;
10670   int override;
10671   i386_operand_type bigdisp, types = anydisp;
10672   int ret;
10673
10674   if (i.disp_operands == MAX_MEMORY_OPERANDS)
10675     {
10676       as_bad (_("at most %d displacement operands are allowed"),
10677               MAX_MEMORY_OPERANDS);
10678       return 0;
10679     }
10680
10681   operand_type_set (&bigdisp, 0);
10682   if (i.jumpabsolute
10683       || i.types[this_operand].bitfield.baseindex
10684       || (current_templates->start->opcode_modifier.jump != JUMP
10685           && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
10686     {
10687       i386_addressing_mode ();
10688       override = (i.prefix[ADDR_PREFIX] != 0);
10689       if (flag_code == CODE_64BIT)
10690         {
10691           if (!override)
10692             {
10693               bigdisp.bitfield.disp32s = 1;
10694               bigdisp.bitfield.disp64 = 1;
10695             }
10696           else
10697             bigdisp.bitfield.disp32 = 1;
10698         }
10699       else if ((flag_code == CODE_16BIT) ^ override)
10700           bigdisp.bitfield.disp16 = 1;
10701       else
10702           bigdisp.bitfield.disp32 = 1;
10703     }
10704   else
10705     {
10706       /* For PC-relative branches, the width of the displacement may be
10707          dependent upon data size, but is never dependent upon address size.
10708          Also make sure to not unintentionally match against a non-PC-relative
10709          branch template.  */
10710       static templates aux_templates;
10711       const insn_template *t = current_templates->start;
10712       bfd_boolean has_intel64 = FALSE;
10713
10714       aux_templates.start = t;
10715       while (++t < current_templates->end)
10716         {
10717           if (t->opcode_modifier.jump
10718               != current_templates->start->opcode_modifier.jump)
10719             break;
10720           if ((t->opcode_modifier.isa64 >= INTEL64))
10721             has_intel64 = TRUE;
10722         }
10723       if (t < current_templates->end)
10724         {
10725           aux_templates.end = t;
10726           current_templates = &aux_templates;
10727         }
10728
10729       override = (i.prefix[DATA_PREFIX] != 0);
10730       if (flag_code == CODE_64BIT)
10731         {
10732           if ((override || i.suffix == WORD_MNEM_SUFFIX)
10733               && (!intel64 || !has_intel64))
10734             bigdisp.bitfield.disp16 = 1;
10735           else
10736             bigdisp.bitfield.disp32s = 1;
10737         }
10738       else
10739         {
10740           if (!override)
10741             override = (i.suffix == (flag_code != CODE_16BIT
10742                                      ? WORD_MNEM_SUFFIX
10743                                      : LONG_MNEM_SUFFIX));
10744           bigdisp.bitfield.disp32 = 1;
10745           if ((flag_code == CODE_16BIT) ^ override)
10746             {
10747               bigdisp.bitfield.disp32 = 0;
10748               bigdisp.bitfield.disp16 = 1;
10749             }
10750         }
10751     }
10752   i.types[this_operand] = operand_type_or (i.types[this_operand],
10753                                            bigdisp);
10754
10755   exp = &disp_expressions[i.disp_operands];
10756   i.op[this_operand].disps = exp;
10757   i.disp_operands++;
10758   save_input_line_pointer = input_line_pointer;
10759   input_line_pointer = disp_start;
10760   END_STRING_AND_SAVE (disp_end);
10761
10762 #ifndef GCC_ASM_O_HACK
10763 #define GCC_ASM_O_HACK 0
10764 #endif
10765 #if GCC_ASM_O_HACK
10766   END_STRING_AND_SAVE (disp_end + 1);
10767   if (i.types[this_operand].bitfield.baseIndex
10768       && displacement_string_end[-1] == '+')
10769     {
10770       /* This hack is to avoid a warning when using the "o"
10771          constraint within gcc asm statements.
10772          For instance:
10773
10774          #define _set_tssldt_desc(n,addr,limit,type) \
10775          __asm__ __volatile__ ( \
10776          "movw %w2,%0\n\t" \
10777          "movw %w1,2+%0\n\t" \
10778          "rorl $16,%1\n\t" \
10779          "movb %b1,4+%0\n\t" \
10780          "movb %4,5+%0\n\t" \
10781          "movb $0,6+%0\n\t" \
10782          "movb %h1,7+%0\n\t" \
10783          "rorl $16,%1" \
10784          : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
10785
10786          This works great except that the output assembler ends
10787          up looking a bit weird if it turns out that there is
10788          no offset.  You end up producing code that looks like:
10789
10790          #APP
10791          movw $235,(%eax)
10792          movw %dx,2+(%eax)
10793          rorl $16,%edx
10794          movb %dl,4+(%eax)
10795          movb $137,5+(%eax)
10796          movb $0,6+(%eax)
10797          movb %dh,7+(%eax)
10798          rorl $16,%edx
10799          #NO_APP
10800
10801          So here we provide the missing zero.  */
10802
10803       *displacement_string_end = '0';
10804     }
10805 #endif
10806   gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10807   if (gotfree_input_line)
10808     input_line_pointer = gotfree_input_line;
10809
10810   exp_seg = expression (exp);
10811
10812   SKIP_WHITESPACE ();
10813   if (*input_line_pointer)
10814     as_bad (_("junk `%s' after expression"), input_line_pointer);
10815 #if GCC_ASM_O_HACK
10816   RESTORE_END_STRING (disp_end + 1);
10817 #endif
10818   input_line_pointer = save_input_line_pointer;
10819   if (gotfree_input_line)
10820     {
10821       free (gotfree_input_line);
10822
10823       if (exp->X_op == O_constant || exp->X_op == O_register)
10824         exp->X_op = O_illegal;
10825     }
10826
10827   ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
10828
10829   RESTORE_END_STRING (disp_end);
10830
10831   return ret;
10832 }
10833
10834 static int
10835 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10836                             i386_operand_type types, const char *disp_start)
10837 {
10838   i386_operand_type bigdisp;
10839   int ret = 1;
10840
10841   /* We do this to make sure that the section symbol is in
10842      the symbol table.  We will ultimately change the relocation
10843      to be relative to the beginning of the section.  */
10844   if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
10845       || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
10846       || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10847     {
10848       if (exp->X_op != O_symbol)
10849         goto inv_disp;
10850
10851       if (S_IS_LOCAL (exp->X_add_symbol)
10852           && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
10853           && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
10854         section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
10855       exp->X_op = O_subtract;
10856       exp->X_op_symbol = GOT_symbol;
10857       if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
10858         i.reloc[this_operand] = BFD_RELOC_32_PCREL;
10859       else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10860         i.reloc[this_operand] = BFD_RELOC_64;
10861       else
10862         i.reloc[this_operand] = BFD_RELOC_32;
10863     }
10864
10865   else if (exp->X_op == O_absent
10866            || exp->X_op == O_illegal
10867            || exp->X_op == O_big)
10868     {
10869     inv_disp:
10870       as_bad (_("missing or invalid displacement expression `%s'"),
10871               disp_start);
10872       ret = 0;
10873     }
10874
10875   else if (flag_code == CODE_64BIT
10876            && !i.prefix[ADDR_PREFIX]
10877            && exp->X_op == O_constant)
10878     {
10879       /* Since displacement is signed extended to 64bit, don't allow
10880          disp32 and turn off disp32s if they are out of range.  */
10881       i.types[this_operand].bitfield.disp32 = 0;
10882       if (!fits_in_signed_long (exp->X_add_number))
10883         {
10884           i.types[this_operand].bitfield.disp32s = 0;
10885           if (i.types[this_operand].bitfield.baseindex)
10886             {
10887               as_bad (_("0x%lx out range of signed 32bit displacement"),
10888                       (long) exp->X_add_number);
10889               ret = 0;
10890             }
10891         }
10892     }
10893
10894 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10895   else if (exp->X_op != O_constant
10896            && OUTPUT_FLAVOR == bfd_target_aout_flavour
10897            && exp_seg != absolute_section
10898            && exp_seg != text_section
10899            && exp_seg != data_section
10900            && exp_seg != bss_section
10901            && exp_seg != undefined_section
10902            && !bfd_is_com_section (exp_seg))
10903     {
10904       as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10905       ret = 0;
10906     }
10907 #endif
10908
10909   if (current_templates->start->opcode_modifier.jump == JUMP_BYTE
10910       /* Constants get taken care of by optimize_disp().  */
10911       && exp->X_op != O_constant)
10912     i.types[this_operand].bitfield.disp8 = 1;
10913
10914   /* Check if this is a displacement only operand.  */
10915   bigdisp = i.types[this_operand];
10916   bigdisp.bitfield.disp8 = 0;
10917   bigdisp.bitfield.disp16 = 0;
10918   bigdisp.bitfield.disp32 = 0;
10919   bigdisp.bitfield.disp32s = 0;
10920   bigdisp.bitfield.disp64 = 0;
10921   if (operand_type_all_zero (&bigdisp))
10922     i.types[this_operand] = operand_type_and (i.types[this_operand],
10923                                               types);
10924
10925   return ret;
10926 }
10927
10928 /* Return the active addressing mode, taking address override and
10929    registers forming the address into consideration.  Update the
10930    address override prefix if necessary.  */
10931
10932 static enum flag_code
10933 i386_addressing_mode (void)
10934 {
10935   enum flag_code addr_mode;
10936
10937   if (i.prefix[ADDR_PREFIX])
10938     addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
10939   else if (flag_code == CODE_16BIT
10940            && current_templates->start->cpu_flags.bitfield.cpumpx
10941            /* Avoid replacing the "16-bit addressing not allowed" diagnostic
10942               from md_assemble() by "is not a valid base/index expression"
10943               when there is a base and/or index.  */
10944            && !i.types[this_operand].bitfield.baseindex)
10945     {
10946       /* MPX insn memory operands with neither base nor index must be forced
10947          to use 32-bit addressing in 16-bit mode.  */
10948       addr_mode = CODE_32BIT;
10949       i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10950       ++i.prefixes;
10951       gas_assert (!i.types[this_operand].bitfield.disp16);
10952       gas_assert (!i.types[this_operand].bitfield.disp32);
10953     }
10954   else
10955     {
10956       addr_mode = flag_code;
10957
10958 #if INFER_ADDR_PREFIX
10959       if (i.mem_operands == 0)
10960         {
10961           /* Infer address prefix from the first memory operand.  */
10962           const reg_entry *addr_reg = i.base_reg;
10963
10964           if (addr_reg == NULL)
10965             addr_reg = i.index_reg;
10966
10967           if (addr_reg)
10968             {
10969               if (addr_reg->reg_type.bitfield.dword)
10970                 addr_mode = CODE_32BIT;
10971               else if (flag_code != CODE_64BIT
10972                        && addr_reg->reg_type.bitfield.word)
10973                 addr_mode = CODE_16BIT;
10974
10975               if (addr_mode != flag_code)
10976                 {
10977                   i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10978                   i.prefixes += 1;
10979                   /* Change the size of any displacement too.  At most one
10980                      of Disp16 or Disp32 is set.
10981                      FIXME.  There doesn't seem to be any real need for
10982                      separate Disp16 and Disp32 flags.  The same goes for
10983                      Imm16 and Imm32.  Removing them would probably clean
10984                      up the code quite a lot.  */
10985                   if (flag_code != CODE_64BIT
10986                       && (i.types[this_operand].bitfield.disp16
10987                           || i.types[this_operand].bitfield.disp32))
10988                     i.types[this_operand]
10989                       = operand_type_xor (i.types[this_operand], disp16_32);
10990                 }
10991             }
10992         }
10993 #endif
10994     }
10995
10996   return addr_mode;
10997 }
10998
10999 /* Make sure the memory operand we've been dealt is valid.
11000    Return 1 on success, 0 on a failure.  */
11001
11002 static int
11003 i386_index_check (const char *operand_string)
11004 {
11005   const char *kind = "base/index";
11006   enum flag_code addr_mode = i386_addressing_mode ();
11007   const insn_template *t = current_templates->start;
11008
11009   if (t->opcode_modifier.isstring
11010       && !t->cpu_flags.bitfield.cpupadlock
11011       && (current_templates->end[-1].opcode_modifier.isstring
11012           || i.mem_operands))
11013     {
11014       /* Memory operands of string insns are special in that they only allow
11015          a single register (rDI, rSI, or rBX) as their memory address.  */
11016       const reg_entry *expected_reg;
11017       static const char *di_si[][2] =
11018         {
11019           { "esi", "edi" },
11020           { "si", "di" },
11021           { "rsi", "rdi" }
11022         };
11023       static const char *bx[] = { "ebx", "bx", "rbx" };
11024
11025       kind = "string address";
11026
11027       if (t->opcode_modifier.prefixok == PrefixRep)
11028         {
11029           int es_op = current_templates->end[-1].opcode_modifier.isstring
11030                       - IS_STRING_ES_OP0;
11031           int op = 0;
11032
11033           if (!current_templates->end[-1].operand_types[0].bitfield.baseindex
11034               || ((!i.mem_operands != !intel_syntax)
11035                   && current_templates->end[-1].operand_types[1]
11036                      .bitfield.baseindex))
11037             op = 1;
11038           expected_reg
11039             = (const reg_entry *) str_hash_find (reg_hash,
11040                                                  di_si[addr_mode][op == es_op]);
11041         }
11042       else
11043         expected_reg
11044           = (const reg_entry *)str_hash_find (reg_hash, bx[addr_mode]);
11045
11046       if (i.base_reg != expected_reg
11047           || i.index_reg
11048           || operand_type_check (i.types[this_operand], disp))
11049         {
11050           /* The second memory operand must have the same size as
11051              the first one.  */
11052           if (i.mem_operands
11053               && i.base_reg
11054               && !((addr_mode == CODE_64BIT
11055                     && i.base_reg->reg_type.bitfield.qword)
11056                    || (addr_mode == CODE_32BIT
11057                        ? i.base_reg->reg_type.bitfield.dword
11058                        : i.base_reg->reg_type.bitfield.word)))
11059             goto bad_address;
11060
11061           as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
11062                    operand_string,
11063                    intel_syntax ? '[' : '(',
11064                    register_prefix,
11065                    expected_reg->reg_name,
11066                    intel_syntax ? ']' : ')');
11067           return 1;
11068         }
11069       else
11070         return 1;
11071
11072     bad_address:
11073       as_bad (_("`%s' is not a valid %s expression"),
11074               operand_string, kind);
11075       return 0;
11076     }
11077   else
11078     {
11079       if (addr_mode != CODE_16BIT)
11080         {
11081           /* 32-bit/64-bit checks.  */
11082           if (i.disp_encoding == disp_encoding_16bit)
11083             {
11084             bad_disp:
11085               as_bad (_("invalid `%s' prefix"),
11086                       addr_mode == CODE_16BIT ? "{disp32}" : "{disp16}");
11087               return 0;
11088             }
11089
11090           if ((i.base_reg
11091                && ((addr_mode == CODE_64BIT
11092                     ? !i.base_reg->reg_type.bitfield.qword
11093                     : !i.base_reg->reg_type.bitfield.dword)
11094                    || (i.index_reg && i.base_reg->reg_num == RegIP)
11095                    || i.base_reg->reg_num == RegIZ))
11096               || (i.index_reg
11097                   && !i.index_reg->reg_type.bitfield.xmmword
11098                   && !i.index_reg->reg_type.bitfield.ymmword
11099                   && !i.index_reg->reg_type.bitfield.zmmword
11100                   && ((addr_mode == CODE_64BIT
11101                        ? !i.index_reg->reg_type.bitfield.qword
11102                        : !i.index_reg->reg_type.bitfield.dword)
11103                       || !i.index_reg->reg_type.bitfield.baseindex)))
11104             goto bad_address;
11105
11106           /* bndmk, bndldx, bndstx and mandatory non-vector SIB have special restrictions. */
11107           if ((t->opcode_modifier.opcodeprefix == PREFIX_0XF3
11108                && t->base_opcode == 0x0f1b)
11109               || (t->opcode_modifier.opcodeprefix == PREFIX_NONE
11110                   && (t->base_opcode & ~1) == 0x0f1a)
11111               || t->opcode_modifier.sib == SIBMEM)
11112             {
11113               /* They cannot use RIP-relative addressing. */
11114               if (i.base_reg && i.base_reg->reg_num == RegIP)
11115                 {
11116                   as_bad (_("`%s' cannot be used here"), operand_string);
11117                   return 0;
11118                 }
11119
11120               /* bndldx and bndstx ignore their scale factor. */
11121               if (t->opcode_modifier.opcodeprefix == PREFIX_NONE
11122                   && (t->base_opcode & ~1) == 0x0f1a
11123                   && i.log2_scale_factor)
11124                 as_warn (_("register scaling is being ignored here"));
11125             }
11126         }
11127       else
11128         {
11129           /* 16-bit checks.  */
11130           if (i.disp_encoding == disp_encoding_32bit)
11131             goto bad_disp;
11132
11133           if ((i.base_reg
11134                && (!i.base_reg->reg_type.bitfield.word
11135                    || !i.base_reg->reg_type.bitfield.baseindex))
11136               || (i.index_reg
11137                   && (!i.index_reg->reg_type.bitfield.word
11138                       || !i.index_reg->reg_type.bitfield.baseindex
11139                       || !(i.base_reg
11140                            && i.base_reg->reg_num < 6
11141                            && i.index_reg->reg_num >= 6
11142                            && i.log2_scale_factor == 0))))
11143             goto bad_address;
11144         }
11145     }
11146   return 1;
11147 }
11148
11149 /* Handle vector immediates.  */
11150
11151 static int
11152 RC_SAE_immediate (const char *imm_start)
11153 {
11154   unsigned int match_found, j;
11155   const char *pstr = imm_start;
11156   expressionS *exp;
11157
11158   if (*pstr != '{')
11159     return 0;
11160
11161   pstr++;
11162   match_found = 0;
11163   for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
11164     {
11165       if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
11166         {
11167           if (!i.rounding)
11168             {
11169               rc_op.type = RC_NamesTable[j].type;
11170               rc_op.operand = this_operand;
11171               i.rounding = &rc_op;
11172             }
11173           else
11174             {
11175               as_bad (_("duplicated `%s'"), imm_start);
11176               return 0;
11177             }
11178           pstr += RC_NamesTable[j].len;
11179           match_found = 1;
11180           break;
11181         }
11182     }
11183   if (!match_found)
11184     return 0;
11185
11186   if (*pstr++ != '}')
11187     {
11188       as_bad (_("Missing '}': '%s'"), imm_start);
11189       return 0;
11190     }
11191   /* RC/SAE immediate string should contain nothing more.  */;
11192   if (*pstr != 0)
11193     {
11194       as_bad (_("Junk after '}': '%s'"), imm_start);
11195       return 0;
11196     }
11197
11198   exp = &im_expressions[i.imm_operands++];
11199   i.op[this_operand].imms = exp;
11200
11201   exp->X_op = O_constant;
11202   exp->X_add_number = 0;
11203   exp->X_add_symbol = (symbolS *) 0;
11204   exp->X_op_symbol = (symbolS *) 0;
11205
11206   i.types[this_operand].bitfield.imm8 = 1;
11207   return 1;
11208 }
11209
11210 /* Only string instructions can have a second memory operand, so
11211    reduce current_templates to just those if it contains any.  */
11212 static int
11213 maybe_adjust_templates (void)
11214 {
11215   const insn_template *t;
11216
11217   gas_assert (i.mem_operands == 1);
11218
11219   for (t = current_templates->start; t < current_templates->end; ++t)
11220     if (t->opcode_modifier.isstring)
11221       break;
11222
11223   if (t < current_templates->end)
11224     {
11225       static templates aux_templates;
11226       bfd_boolean recheck;
11227
11228       aux_templates.start = t;
11229       for (; t < current_templates->end; ++t)
11230         if (!t->opcode_modifier.isstring)
11231           break;
11232       aux_templates.end = t;
11233
11234       /* Determine whether to re-check the first memory operand.  */
11235       recheck = (aux_templates.start != current_templates->start
11236                  || t != current_templates->end);
11237
11238       current_templates = &aux_templates;
11239
11240       if (recheck)
11241         {
11242           i.mem_operands = 0;
11243           if (i.memop1_string != NULL
11244               && i386_index_check (i.memop1_string) == 0)
11245             return 0;
11246           i.mem_operands = 1;
11247         }
11248     }
11249
11250   return 1;
11251 }
11252
11253 /* Parse OPERAND_STRING into the i386_insn structure I.  Returns zero
11254    on error.  */
11255
11256 static int
11257 i386_att_operand (char *operand_string)
11258 {
11259   const reg_entry *r;
11260   char *end_op;
11261   char *op_string = operand_string;
11262
11263   if (is_space_char (*op_string))
11264     ++op_string;
11265
11266   /* We check for an absolute prefix (differentiating,
11267      for example, 'jmp pc_relative_label' from 'jmp *absolute_label'.  */
11268   if (*op_string == ABSOLUTE_PREFIX)
11269     {
11270       ++op_string;
11271       if (is_space_char (*op_string))
11272         ++op_string;
11273       i.jumpabsolute = TRUE;
11274     }
11275
11276   /* Check if operand is a register.  */
11277   if ((r = parse_register (op_string, &end_op)) != NULL)
11278     {
11279       i386_operand_type temp;
11280
11281       if (r == &bad_reg)
11282         return 0;
11283
11284       /* Check for a segment override by searching for ':' after a
11285          segment register.  */
11286       op_string = end_op;
11287       if (is_space_char (*op_string))
11288         ++op_string;
11289       if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
11290         {
11291           switch (r->reg_num)
11292             {
11293             case 0:
11294               i.seg[i.mem_operands] = &es;
11295               break;
11296             case 1:
11297               i.seg[i.mem_operands] = &cs;
11298               break;
11299             case 2:
11300               i.seg[i.mem_operands] = &ss;
11301               break;
11302             case 3:
11303               i.seg[i.mem_operands] = &ds;
11304               break;
11305             case 4:
11306               i.seg[i.mem_operands] = &fs;
11307               break;
11308             case 5:
11309               i.seg[i.mem_operands] = &gs;
11310               break;
11311             }
11312
11313           /* Skip the ':' and whitespace.  */
11314           ++op_string;
11315           if (is_space_char (*op_string))
11316             ++op_string;
11317
11318           if (!is_digit_char (*op_string)
11319               && !is_identifier_char (*op_string)
11320               && *op_string != '('
11321               && *op_string != ABSOLUTE_PREFIX)
11322             {
11323               as_bad (_("bad memory operand `%s'"), op_string);
11324               return 0;
11325             }
11326           /* Handle case of %es:*foo.  */
11327           if (*op_string == ABSOLUTE_PREFIX)
11328             {
11329               ++op_string;
11330               if (is_space_char (*op_string))
11331                 ++op_string;
11332               i.jumpabsolute = TRUE;
11333             }
11334           goto do_memory_reference;
11335         }
11336
11337       /* Handle vector operations.  */
11338       if (*op_string == '{')
11339         {
11340           op_string = check_VecOperations (op_string, NULL);
11341           if (op_string == NULL)
11342             return 0;
11343         }
11344
11345       if (*op_string)
11346         {
11347           as_bad (_("junk `%s' after register"), op_string);
11348           return 0;
11349         }
11350       temp = r->reg_type;
11351       temp.bitfield.baseindex = 0;
11352       i.types[this_operand] = operand_type_or (i.types[this_operand],
11353                                                temp);
11354       i.types[this_operand].bitfield.unspecified = 0;
11355       i.op[this_operand].regs = r;
11356       i.reg_operands++;
11357     }
11358   else if (*op_string == REGISTER_PREFIX)
11359     {
11360       as_bad (_("bad register name `%s'"), op_string);
11361       return 0;
11362     }
11363   else if (*op_string == IMMEDIATE_PREFIX)
11364     {
11365       ++op_string;
11366       if (i.jumpabsolute)
11367         {
11368           as_bad (_("immediate operand illegal with absolute jump"));
11369           return 0;
11370         }
11371       if (!i386_immediate (op_string))
11372         return 0;
11373     }
11374   else if (RC_SAE_immediate (operand_string))
11375     {
11376       /* If it is a RC or SAE immediate, do nothing.  */
11377       ;
11378     }
11379   else if (is_digit_char (*op_string)
11380            || is_identifier_char (*op_string)
11381            || *op_string == '"'
11382            || *op_string == '(')
11383     {
11384       /* This is a memory reference of some sort.  */
11385       char *base_string;
11386
11387       /* Start and end of displacement string expression (if found).  */
11388       char *displacement_string_start;
11389       char *displacement_string_end;
11390       char *vop_start;
11391
11392     do_memory_reference:
11393       if (i.mem_operands == 1 && !maybe_adjust_templates ())
11394         return 0;
11395       if ((i.mem_operands == 1
11396            && !current_templates->start->opcode_modifier.isstring)
11397           || i.mem_operands == 2)
11398         {
11399           as_bad (_("too many memory references for `%s'"),
11400                   current_templates->start->name);
11401           return 0;
11402         }
11403
11404       /* Check for base index form.  We detect the base index form by
11405          looking for an ')' at the end of the operand, searching
11406          for the '(' matching it, and finding a REGISTER_PREFIX or ','
11407          after the '('.  */
11408       base_string = op_string + strlen (op_string);
11409
11410       /* Handle vector operations.  */
11411       vop_start = strchr (op_string, '{');
11412       if (vop_start && vop_start < base_string)
11413         {
11414           if (check_VecOperations (vop_start, base_string) == NULL)
11415             return 0;
11416           base_string = vop_start;
11417         }
11418
11419       --base_string;
11420       if (is_space_char (*base_string))
11421         --base_string;
11422
11423       /* If we only have a displacement, set-up for it to be parsed later.  */
11424       displacement_string_start = op_string;
11425       displacement_string_end = base_string + 1;
11426
11427       if (*base_string == ')')
11428         {
11429           char *temp_string;
11430           unsigned int parens_balanced = 1;
11431           /* We've already checked that the number of left & right ()'s are
11432              equal, so this loop will not be infinite.  */
11433           do
11434             {
11435               base_string--;
11436               if (*base_string == ')')
11437                 parens_balanced++;
11438               if (*base_string == '(')
11439                 parens_balanced--;
11440             }
11441           while (parens_balanced);
11442
11443           temp_string = base_string;
11444
11445           /* Skip past '(' and whitespace.  */
11446           ++base_string;
11447           if (is_space_char (*base_string))
11448             ++base_string;
11449
11450           if (*base_string == ','
11451               || ((i.base_reg = parse_register (base_string, &end_op))
11452                   != NULL))
11453             {
11454               displacement_string_end = temp_string;
11455
11456               i.types[this_operand].bitfield.baseindex = 1;
11457
11458               if (i.base_reg)
11459                 {
11460                   if (i.base_reg == &bad_reg)
11461                     return 0;
11462                   base_string = end_op;
11463                   if (is_space_char (*base_string))
11464                     ++base_string;
11465                 }
11466
11467               /* There may be an index reg or scale factor here.  */
11468               if (*base_string == ',')
11469                 {
11470                   ++base_string;
11471                   if (is_space_char (*base_string))
11472                     ++base_string;
11473
11474                   if ((i.index_reg = parse_register (base_string, &end_op))
11475                       != NULL)
11476                     {
11477                       if (i.index_reg == &bad_reg)
11478                         return 0;
11479                       base_string = end_op;
11480                       if (is_space_char (*base_string))
11481                         ++base_string;
11482                       if (*base_string == ',')
11483                         {
11484                           ++base_string;
11485                           if (is_space_char (*base_string))
11486                             ++base_string;
11487                         }
11488                       else if (*base_string != ')')
11489                         {
11490                           as_bad (_("expecting `,' or `)' "
11491                                     "after index register in `%s'"),
11492                                   operand_string);
11493                           return 0;
11494                         }
11495                     }
11496                   else if (*base_string == REGISTER_PREFIX)
11497                     {
11498                       end_op = strchr (base_string, ',');
11499                       if (end_op)
11500                         *end_op = '\0';
11501                       as_bad (_("bad register name `%s'"), base_string);
11502                       return 0;
11503                     }
11504
11505                   /* Check for scale factor.  */
11506                   if (*base_string != ')')
11507                     {
11508                       char *end_scale = i386_scale (base_string);
11509
11510                       if (!end_scale)
11511                         return 0;
11512
11513                       base_string = end_scale;
11514                       if (is_space_char (*base_string))
11515                         ++base_string;
11516                       if (*base_string != ')')
11517                         {
11518                           as_bad (_("expecting `)' "
11519                                     "after scale factor in `%s'"),
11520                                   operand_string);
11521                           return 0;
11522                         }
11523                     }
11524                   else if (!i.index_reg)
11525                     {
11526                       as_bad (_("expecting index register or scale factor "
11527                                 "after `,'; got '%c'"),
11528                               *base_string);
11529                       return 0;
11530                     }
11531                 }
11532               else if (*base_string != ')')
11533                 {
11534                   as_bad (_("expecting `,' or `)' "
11535                             "after base register in `%s'"),
11536                           operand_string);
11537                   return 0;
11538                 }
11539             }
11540           else if (*base_string == REGISTER_PREFIX)
11541             {
11542               end_op = strchr (base_string, ',');
11543               if (end_op)
11544                 *end_op = '\0';
11545               as_bad (_("bad register name `%s'"), base_string);
11546               return 0;
11547             }
11548         }
11549
11550       /* If there's an expression beginning the operand, parse it,
11551          assuming displacement_string_start and
11552          displacement_string_end are meaningful.  */
11553       if (displacement_string_start != displacement_string_end)
11554         {
11555           if (!i386_displacement (displacement_string_start,
11556                                   displacement_string_end))
11557             return 0;
11558         }
11559
11560       /* Special case for (%dx) while doing input/output op.  */
11561       if (i.base_reg
11562           && i.base_reg->reg_type.bitfield.instance == RegD
11563           && i.base_reg->reg_type.bitfield.word
11564           && i.index_reg == 0
11565           && i.log2_scale_factor == 0
11566           && i.seg[i.mem_operands] == 0
11567           && !operand_type_check (i.types[this_operand], disp))
11568         {
11569           i.types[this_operand] = i.base_reg->reg_type;
11570           return 1;
11571         }
11572
11573       if (i386_index_check (operand_string) == 0)
11574         return 0;
11575       i.flags[this_operand] |= Operand_Mem;
11576       if (i.mem_operands == 0)
11577         i.memop1_string = xstrdup (operand_string);
11578       i.mem_operands++;
11579     }
11580   else
11581     {
11582       /* It's not a memory operand; argh!  */
11583       as_bad (_("invalid char %s beginning operand %d `%s'"),
11584               output_invalid (*op_string),
11585               this_operand + 1,
11586               op_string);
11587       return 0;
11588     }
11589   return 1;                     /* Normal return.  */
11590 }
11591 \f
11592 /* Calculate the maximum variable size (i.e., excluding fr_fix)
11593    that an rs_machine_dependent frag may reach.  */
11594
11595 unsigned int
11596 i386_frag_max_var (fragS *frag)
11597 {
11598   /* The only relaxable frags are for jumps.
11599      Unconditional jumps can grow by 4 bytes and others by 5 bytes.  */
11600   gas_assert (frag->fr_type == rs_machine_dependent);
11601   return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
11602 }
11603
11604 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11605 static int
11606 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
11607 {
11608   /* STT_GNU_IFUNC symbol must go through PLT.  */
11609   if ((symbol_get_bfdsym (fr_symbol)->flags
11610        & BSF_GNU_INDIRECT_FUNCTION) != 0)
11611     return 0;
11612
11613   if (!S_IS_EXTERNAL (fr_symbol))
11614     /* Symbol may be weak or local.  */
11615     return !S_IS_WEAK (fr_symbol);
11616
11617   /* Global symbols with non-default visibility can't be preempted. */
11618   if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
11619     return 1;
11620
11621   if (fr_var != NO_RELOC)
11622     switch ((enum bfd_reloc_code_real) fr_var)
11623       {
11624       case BFD_RELOC_386_PLT32:
11625       case BFD_RELOC_X86_64_PLT32:
11626         /* Symbol with PLT relocation may be preempted. */
11627         return 0;
11628       default:
11629         abort ();
11630       }
11631
11632   /* Global symbols with default visibility in a shared library may be
11633      preempted by another definition.  */
11634   return !shared;
11635 }
11636 #endif
11637
11638 /* Table 3-2. Macro-Fusible Instructions in Haswell Microarchitecture
11639    Note also work for Skylake and Cascadelake.
11640 ---------------------------------------------------------------------
11641 |   JCC   | ADD/SUB/CMP | INC/DEC | TEST/AND |
11642 | ------  | ----------- | ------- | -------- |
11643 |   Jo    |      N      |    N    |     Y    |
11644 |   Jno   |      N      |    N    |     Y    |
11645 |  Jc/Jb  |      Y      |    N    |     Y    |
11646 | Jae/Jnb |      Y      |    N    |     Y    |
11647 |  Je/Jz  |      Y      |    Y    |     Y    |
11648 | Jne/Jnz |      Y      |    Y    |     Y    |
11649 | Jna/Jbe |      Y      |    N    |     Y    |
11650 | Ja/Jnbe |      Y      |    N    |     Y    |
11651 |   Js    |      N      |    N    |     Y    |
11652 |   Jns   |      N      |    N    |     Y    |
11653 |  Jp/Jpe |      N      |    N    |     Y    |
11654 | Jnp/Jpo |      N      |    N    |     Y    |
11655 | Jl/Jnge |      Y      |    Y    |     Y    |
11656 | Jge/Jnl |      Y      |    Y    |     Y    |
11657 | Jle/Jng |      Y      |    Y    |     Y    |
11658 | Jg/Jnle |      Y      |    Y    |     Y    |
11659 ---------------------------------------------------------------------  */
11660 static int
11661 i386_macro_fusible_p (enum mf_cmp_kind mf_cmp, enum mf_jcc_kind mf_jcc)
11662 {
11663   if (mf_cmp == mf_cmp_alu_cmp)
11664     return ((mf_jcc >= mf_jcc_jc && mf_jcc <= mf_jcc_jna)
11665             || mf_jcc == mf_jcc_jl || mf_jcc == mf_jcc_jle);
11666   if (mf_cmp == mf_cmp_incdec)
11667     return (mf_jcc == mf_jcc_je || mf_jcc == mf_jcc_jl
11668             || mf_jcc == mf_jcc_jle);
11669   if (mf_cmp == mf_cmp_test_and)
11670     return 1;
11671   return 0;
11672 }
11673
11674 /* Return the next non-empty frag.  */
11675
11676 static fragS *
11677 i386_next_non_empty_frag (fragS *fragP)
11678 {
11679   /* There may be a frag with a ".fill 0" when there is no room in
11680      the current frag for frag_grow in output_insn.  */
11681   for (fragP = fragP->fr_next;
11682        (fragP != NULL
11683         && fragP->fr_type == rs_fill
11684         && fragP->fr_fix == 0);
11685        fragP = fragP->fr_next)
11686     ;
11687   return fragP;
11688 }
11689
11690 /* Return the next jcc frag after BRANCH_PADDING.  */
11691
11692 static fragS *
11693 i386_next_fusible_jcc_frag (fragS *maybe_cmp_fragP, fragS *pad_fragP)
11694 {
11695   fragS *branch_fragP;
11696   if (!pad_fragP)
11697     return NULL;
11698
11699   if (pad_fragP->fr_type == rs_machine_dependent
11700       && (TYPE_FROM_RELAX_STATE (pad_fragP->fr_subtype)
11701           == BRANCH_PADDING))
11702     {
11703       branch_fragP = i386_next_non_empty_frag (pad_fragP);
11704       if (branch_fragP->fr_type != rs_machine_dependent)
11705         return NULL;
11706       if (TYPE_FROM_RELAX_STATE (branch_fragP->fr_subtype) == COND_JUMP
11707           && i386_macro_fusible_p (maybe_cmp_fragP->tc_frag_data.mf_type,
11708                                    pad_fragP->tc_frag_data.mf_type))
11709         return branch_fragP;
11710     }
11711
11712   return NULL;
11713 }
11714
11715 /* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags.  */
11716
11717 static void
11718 i386_classify_machine_dependent_frag (fragS *fragP)
11719 {
11720   fragS *cmp_fragP;
11721   fragS *pad_fragP;
11722   fragS *branch_fragP;
11723   fragS *next_fragP;
11724   unsigned int max_prefix_length;
11725
11726   if (fragP->tc_frag_data.classified)
11727     return;
11728
11729   /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING.  Convert
11730      FUSED_JCC_PADDING and merge BRANCH_PADDING.  */
11731   for (next_fragP = fragP;
11732        next_fragP != NULL;
11733        next_fragP = next_fragP->fr_next)
11734     {
11735       next_fragP->tc_frag_data.classified = 1;
11736       if (next_fragP->fr_type == rs_machine_dependent)
11737         switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
11738           {
11739           case BRANCH_PADDING:
11740             /* The BRANCH_PADDING frag must be followed by a branch
11741                frag.  */
11742             branch_fragP = i386_next_non_empty_frag (next_fragP);
11743             next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11744             break;
11745           case FUSED_JCC_PADDING:
11746             /* Check if this is a fused jcc:
11747                FUSED_JCC_PADDING
11748                CMP like instruction
11749                BRANCH_PADDING
11750                COND_JUMP
11751                */
11752             cmp_fragP = i386_next_non_empty_frag (next_fragP);
11753             pad_fragP = i386_next_non_empty_frag (cmp_fragP);
11754             branch_fragP = i386_next_fusible_jcc_frag (next_fragP, pad_fragP);
11755             if (branch_fragP)
11756               {
11757                 /* The BRANCH_PADDING frag is merged with the
11758                    FUSED_JCC_PADDING frag.  */
11759                 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11760                 /* CMP like instruction size.  */
11761                 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
11762                 frag_wane (pad_fragP);
11763                 /* Skip to branch_fragP.  */
11764                 next_fragP = branch_fragP;
11765               }
11766             else if (next_fragP->tc_frag_data.max_prefix_length)
11767               {
11768                 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
11769                    a fused jcc.  */
11770                 next_fragP->fr_subtype
11771                   = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
11772                 next_fragP->tc_frag_data.max_bytes
11773                   = next_fragP->tc_frag_data.max_prefix_length;
11774                 /* This will be updated in the BRANCH_PREFIX scan.  */
11775                 next_fragP->tc_frag_data.max_prefix_length = 0;
11776               }
11777             else
11778               frag_wane (next_fragP);
11779             break;
11780           }
11781     }
11782
11783   /* Stop if there is no BRANCH_PREFIX.  */
11784   if (!align_branch_prefix_size)
11785     return;
11786
11787   /* Scan for BRANCH_PREFIX.  */
11788   for (; fragP != NULL; fragP = fragP->fr_next)
11789     {
11790       if (fragP->fr_type != rs_machine_dependent
11791           || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11792               != BRANCH_PREFIX))
11793         continue;
11794
11795       /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
11796          COND_JUMP_PREFIX.  */
11797       max_prefix_length = 0;
11798       for (next_fragP = fragP;
11799            next_fragP != NULL;
11800            next_fragP = next_fragP->fr_next)
11801         {
11802           if (next_fragP->fr_type == rs_fill)
11803             /* Skip rs_fill frags.  */
11804             continue;
11805           else if (next_fragP->fr_type != rs_machine_dependent)
11806             /* Stop for all other frags.  */
11807             break;
11808
11809           /* rs_machine_dependent frags.  */
11810           if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11811               == BRANCH_PREFIX)
11812             {
11813               /* Count BRANCH_PREFIX frags.  */
11814               if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
11815                 {
11816                   max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
11817                   frag_wane (next_fragP);
11818                 }
11819               else
11820                 max_prefix_length
11821                   += next_fragP->tc_frag_data.max_bytes;
11822             }
11823           else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11824                     == BRANCH_PADDING)
11825                    || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11826                        == FUSED_JCC_PADDING))
11827             {
11828               /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING.  */
11829               fragP->tc_frag_data.u.padding_fragP = next_fragP;
11830               break;
11831             }
11832           else
11833             /* Stop for other rs_machine_dependent frags.  */
11834             break;
11835         }
11836
11837       fragP->tc_frag_data.max_prefix_length = max_prefix_length;
11838
11839       /* Skip to the next frag.  */
11840       fragP = next_fragP;
11841     }
11842 }
11843
11844 /* Compute padding size for
11845
11846         FUSED_JCC_PADDING
11847         CMP like instruction
11848         BRANCH_PADDING
11849         COND_JUMP/UNCOND_JUMP
11850
11851    or
11852
11853         BRANCH_PADDING
11854         COND_JUMP/UNCOND_JUMP
11855  */
11856
11857 static int
11858 i386_branch_padding_size (fragS *fragP, offsetT address)
11859 {
11860   unsigned int offset, size, padding_size;
11861   fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
11862
11863   /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag.  */
11864   if (!address)
11865     address = fragP->fr_address;
11866   address += fragP->fr_fix;
11867
11868   /* CMP like instrunction size.  */
11869   size = fragP->tc_frag_data.cmp_size;
11870
11871   /* The base size of the branch frag.  */
11872   size += branch_fragP->fr_fix;
11873
11874   /* Add opcode and displacement bytes for the rs_machine_dependent
11875      branch frag.  */
11876   if (branch_fragP->fr_type == rs_machine_dependent)
11877     size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
11878
11879   /* Check if branch is within boundary and doesn't end at the last
11880      byte.  */
11881   offset = address & ((1U << align_branch_power) - 1);
11882   if ((offset + size) >= (1U << align_branch_power))
11883     /* Padding needed to avoid crossing boundary.  */
11884     padding_size = (1U << align_branch_power) - offset;
11885   else
11886     /* No padding needed.  */
11887     padding_size = 0;
11888
11889   /* The return value may be saved in tc_frag_data.length which is
11890      unsigned byte.  */
11891   if (!fits_in_unsigned_byte (padding_size))
11892     abort ();
11893
11894   return padding_size;
11895 }
11896
11897 /* i386_generic_table_relax_frag()
11898
11899    Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
11900    grow/shrink padding to align branch frags.  Hand others to
11901    relax_frag().  */
11902
11903 long
11904 i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
11905 {
11906   if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11907       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11908     {
11909       long padding_size = i386_branch_padding_size (fragP, 0);
11910       long grow = padding_size - fragP->tc_frag_data.length;
11911
11912       /* When the BRANCH_PREFIX frag is used, the computed address
11913          must match the actual address and there should be no padding.  */
11914       if (fragP->tc_frag_data.padding_address
11915           && (fragP->tc_frag_data.padding_address != fragP->fr_address
11916               || padding_size))
11917         abort ();
11918
11919       /* Update the padding size.  */
11920       if (grow)
11921         fragP->tc_frag_data.length = padding_size;
11922
11923       return grow;
11924     }
11925   else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11926     {
11927       fragS *padding_fragP, *next_fragP;
11928       long padding_size, left_size, last_size;
11929
11930       padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11931       if (!padding_fragP)
11932         /* Use the padding set by the leading BRANCH_PREFIX frag.  */
11933         return (fragP->tc_frag_data.length
11934                 - fragP->tc_frag_data.last_length);
11935
11936       /* Compute the relative address of the padding frag in the very
11937         first time where the BRANCH_PREFIX frag sizes are zero.  */
11938       if (!fragP->tc_frag_data.padding_address)
11939         fragP->tc_frag_data.padding_address
11940           = padding_fragP->fr_address - (fragP->fr_address - stretch);
11941
11942       /* First update the last length from the previous interation.  */
11943       left_size = fragP->tc_frag_data.prefix_length;
11944       for (next_fragP = fragP;
11945            next_fragP != padding_fragP;
11946            next_fragP = next_fragP->fr_next)
11947         if (next_fragP->fr_type == rs_machine_dependent
11948             && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11949                 == BRANCH_PREFIX))
11950           {
11951             if (left_size)
11952               {
11953                 int max = next_fragP->tc_frag_data.max_bytes;
11954                 if (max)
11955                   {
11956                     int size;
11957                     if (max > left_size)
11958                       size = left_size;
11959                     else
11960                       size = max;
11961                     left_size -= size;
11962                     next_fragP->tc_frag_data.last_length = size;
11963                   }
11964               }
11965             else
11966               next_fragP->tc_frag_data.last_length = 0;
11967           }
11968
11969       /* Check the padding size for the padding frag.  */
11970       padding_size = i386_branch_padding_size
11971         (padding_fragP, (fragP->fr_address
11972                          + fragP->tc_frag_data.padding_address));
11973
11974       last_size = fragP->tc_frag_data.prefix_length;
11975       /* Check if there is change from the last interation.  */
11976       if (padding_size == last_size)
11977         {
11978           /* Update the expected address of the padding frag.  */
11979           padding_fragP->tc_frag_data.padding_address
11980             = (fragP->fr_address + padding_size
11981                + fragP->tc_frag_data.padding_address);
11982           return 0;
11983         }
11984
11985       if (padding_size > fragP->tc_frag_data.max_prefix_length)
11986         {
11987           /* No padding if there is no sufficient room.  Clear the
11988              expected address of the padding frag.  */
11989           padding_fragP->tc_frag_data.padding_address = 0;
11990           padding_size = 0;
11991         }
11992       else
11993         /* Store the expected address of the padding frag.  */
11994         padding_fragP->tc_frag_data.padding_address
11995           = (fragP->fr_address + padding_size
11996              + fragP->tc_frag_data.padding_address);
11997
11998       fragP->tc_frag_data.prefix_length = padding_size;
11999
12000       /* Update the length for the current interation.  */
12001       left_size = padding_size;
12002       for (next_fragP = fragP;
12003            next_fragP != padding_fragP;
12004            next_fragP = next_fragP->fr_next)
12005         if (next_fragP->fr_type == rs_machine_dependent
12006             && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
12007                 == BRANCH_PREFIX))
12008           {
12009             if (left_size)
12010               {
12011                 int max = next_fragP->tc_frag_data.max_bytes;
12012                 if (max)
12013                   {
12014                     int size;
12015                     if (max > left_size)
12016                       size = left_size;
12017                     else
12018                       size = max;
12019                     left_size -= size;
12020                     next_fragP->tc_frag_data.length = size;
12021                   }
12022               }
12023             else
12024               next_fragP->tc_frag_data.length = 0;
12025           }
12026
12027       return (fragP->tc_frag_data.length
12028               - fragP->tc_frag_data.last_length);
12029     }
12030   return relax_frag (segment, fragP, stretch);
12031 }
12032
12033 /* md_estimate_size_before_relax()
12034
12035    Called just before relax() for rs_machine_dependent frags.  The x86
12036    assembler uses these frags to handle variable size jump
12037    instructions.
12038
12039    Any symbol that is now undefined will not become defined.
12040    Return the correct fr_subtype in the frag.
12041    Return the initial "guess for variable size of frag" to caller.
12042    The guess is actually the growth beyond the fixed part.  Whatever
12043    we do to grow the fixed or variable part contributes to our
12044    returned value.  */
12045
12046 int
12047 md_estimate_size_before_relax (fragS *fragP, segT segment)
12048 {
12049   if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12050       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
12051       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
12052     {
12053       i386_classify_machine_dependent_frag (fragP);
12054       return fragP->tc_frag_data.length;
12055     }
12056
12057   /* We've already got fragP->fr_subtype right;  all we have to do is
12058      check for un-relaxable symbols.  On an ELF system, we can't relax
12059      an externally visible symbol, because it may be overridden by a
12060      shared library.  */
12061   if (S_GET_SEGMENT (fragP->fr_symbol) != segment
12062 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12063       || (IS_ELF
12064           && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
12065                                                 fragP->fr_var))
12066 #endif
12067 #if defined (OBJ_COFF) && defined (TE_PE)
12068       || (OUTPUT_FLAVOR == bfd_target_coff_flavour
12069           && S_IS_WEAK (fragP->fr_symbol))
12070 #endif
12071       )
12072     {
12073       /* Symbol is undefined in this segment, or we need to keep a
12074          reloc so that weak symbols can be overridden.  */
12075       int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
12076       enum bfd_reloc_code_real reloc_type;
12077       unsigned char *opcode;
12078       int old_fr_fix;
12079
12080       if (fragP->fr_var != NO_RELOC)
12081         reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
12082       else if (size == 2)
12083         reloc_type = BFD_RELOC_16_PCREL;
12084 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12085       else if (need_plt32_p (fragP->fr_symbol))
12086         reloc_type = BFD_RELOC_X86_64_PLT32;
12087 #endif
12088       else
12089         reloc_type = BFD_RELOC_32_PCREL;
12090
12091       old_fr_fix = fragP->fr_fix;
12092       opcode = (unsigned char *) fragP->fr_opcode;
12093
12094       switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
12095         {
12096         case UNCOND_JUMP:
12097           /* Make jmp (0xeb) a (d)word displacement jump.  */
12098           opcode[0] = 0xe9;
12099           fragP->fr_fix += size;
12100           fix_new (fragP, old_fr_fix, size,
12101                    fragP->fr_symbol,
12102                    fragP->fr_offset, 1,
12103                    reloc_type);
12104           break;
12105
12106         case COND_JUMP86:
12107           if (size == 2
12108               && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
12109             {
12110               /* Negate the condition, and branch past an
12111                  unconditional jump.  */
12112               opcode[0] ^= 1;
12113               opcode[1] = 3;
12114               /* Insert an unconditional jump.  */
12115               opcode[2] = 0xe9;
12116               /* We added two extra opcode bytes, and have a two byte
12117                  offset.  */
12118               fragP->fr_fix += 2 + 2;
12119               fix_new (fragP, old_fr_fix + 2, 2,
12120                        fragP->fr_symbol,
12121                        fragP->fr_offset, 1,
12122                        reloc_type);
12123               break;
12124             }
12125           /* Fall through.  */
12126
12127         case COND_JUMP:
12128           if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
12129             {
12130               fixS *fixP;
12131
12132               fragP->fr_fix += 1;
12133               fixP = fix_new (fragP, old_fr_fix, 1,
12134                               fragP->fr_symbol,
12135                               fragP->fr_offset, 1,
12136                               BFD_RELOC_8_PCREL);
12137               fixP->fx_signed = 1;
12138               break;
12139             }
12140
12141           /* This changes the byte-displacement jump 0x7N
12142              to the (d)word-displacement jump 0x0f,0x8N.  */
12143           opcode[1] = opcode[0] + 0x10;
12144           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12145           /* We've added an opcode byte.  */
12146           fragP->fr_fix += 1 + size;
12147           fix_new (fragP, old_fr_fix + 1, size,
12148                    fragP->fr_symbol,
12149                    fragP->fr_offset, 1,
12150                    reloc_type);
12151           break;
12152
12153         default:
12154           BAD_CASE (fragP->fr_subtype);
12155           break;
12156         }
12157       frag_wane (fragP);
12158       return fragP->fr_fix - old_fr_fix;
12159     }
12160
12161   /* Guess size depending on current relax state.  Initially the relax
12162      state will correspond to a short jump and we return 1, because
12163      the variable part of the frag (the branch offset) is one byte
12164      long.  However, we can relax a section more than once and in that
12165      case we must either set fr_subtype back to the unrelaxed state,
12166      or return the value for the appropriate branch.  */
12167   return md_relax_table[fragP->fr_subtype].rlx_length;
12168 }
12169
12170 /* Called after relax() is finished.
12171
12172    In:  Address of frag.
12173         fr_type == rs_machine_dependent.
12174         fr_subtype is what the address relaxed to.
12175
12176    Out: Any fixSs and constants are set up.
12177         Caller will turn frag into a ".space 0".  */
12178
12179 void
12180 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
12181                  fragS *fragP)
12182 {
12183   unsigned char *opcode;
12184   unsigned char *where_to_put_displacement = NULL;
12185   offsetT target_address;
12186   offsetT opcode_address;
12187   unsigned int extension = 0;
12188   offsetT displacement_from_opcode_start;
12189
12190   if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12191       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
12192       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12193     {
12194       /* Generate nop padding.  */
12195       unsigned int size = fragP->tc_frag_data.length;
12196       if (size)
12197         {
12198           if (size > fragP->tc_frag_data.max_bytes)
12199             abort ();
12200
12201           if (flag_debug)
12202             {
12203               const char *msg;
12204               const char *branch = "branch";
12205               const char *prefix = "";
12206               fragS *padding_fragP;
12207               if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
12208                   == BRANCH_PREFIX)
12209                 {
12210                   padding_fragP = fragP->tc_frag_data.u.padding_fragP;
12211                   switch (fragP->tc_frag_data.default_prefix)
12212                     {
12213                     default:
12214                       abort ();
12215                       break;
12216                     case CS_PREFIX_OPCODE:
12217                       prefix = " cs";
12218                       break;
12219                     case DS_PREFIX_OPCODE:
12220                       prefix = " ds";
12221                       break;
12222                     case ES_PREFIX_OPCODE:
12223                       prefix = " es";
12224                       break;
12225                     case FS_PREFIX_OPCODE:
12226                       prefix = " fs";
12227                       break;
12228                     case GS_PREFIX_OPCODE:
12229                       prefix = " gs";
12230                       break;
12231                     case SS_PREFIX_OPCODE:
12232                       prefix = " ss";
12233                       break;
12234                     }
12235                   if (padding_fragP)
12236                     msg = _("%s:%u: add %d%s at 0x%llx to align "
12237                             "%s within %d-byte boundary\n");
12238                   else
12239                     msg = _("%s:%u: add additional %d%s at 0x%llx to "
12240                             "align %s within %d-byte boundary\n");
12241                 }
12242               else
12243                 {
12244                   padding_fragP = fragP;
12245                   msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
12246                           "%s within %d-byte boundary\n");
12247                 }
12248
12249               if (padding_fragP)
12250                 switch (padding_fragP->tc_frag_data.branch_type)
12251                   {
12252                   case align_branch_jcc:
12253                     branch = "jcc";
12254                     break;
12255                   case align_branch_fused:
12256                     branch = "fused jcc";
12257                     break;
12258                   case align_branch_jmp:
12259                     branch = "jmp";
12260                     break;
12261                   case align_branch_call:
12262                     branch = "call";
12263                     break;
12264                   case align_branch_indirect:
12265                     branch = "indiret branch";
12266                     break;
12267                   case align_branch_ret:
12268                     branch = "ret";
12269                     break;
12270                   default:
12271                     break;
12272                   }
12273
12274               fprintf (stdout, msg,
12275                        fragP->fr_file, fragP->fr_line, size, prefix,
12276                        (long long) fragP->fr_address, branch,
12277                        1 << align_branch_power);
12278             }
12279           if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12280             memset (fragP->fr_opcode,
12281                     fragP->tc_frag_data.default_prefix, size);
12282           else
12283             i386_generate_nops (fragP, (char *) fragP->fr_opcode,
12284                                 size, 0);
12285           fragP->fr_fix += size;
12286         }
12287       return;
12288     }
12289
12290   opcode = (unsigned char *) fragP->fr_opcode;
12291
12292   /* Address we want to reach in file space.  */
12293   target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
12294
12295   /* Address opcode resides at in file space.  */
12296   opcode_address = fragP->fr_address + fragP->fr_fix;
12297
12298   /* Displacement from opcode start to fill into instruction.  */
12299   displacement_from_opcode_start = target_address - opcode_address;
12300
12301   if ((fragP->fr_subtype & BIG) == 0)
12302     {
12303       /* Don't have to change opcode.  */
12304       extension = 1;            /* 1 opcode + 1 displacement  */
12305       where_to_put_displacement = &opcode[1];
12306     }
12307   else
12308     {
12309       if (no_cond_jump_promotion
12310           && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
12311         as_warn_where (fragP->fr_file, fragP->fr_line,
12312                        _("long jump required"));
12313
12314       switch (fragP->fr_subtype)
12315         {
12316         case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
12317           extension = 4;                /* 1 opcode + 4 displacement  */
12318           opcode[0] = 0xe9;
12319           where_to_put_displacement = &opcode[1];
12320           break;
12321
12322         case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
12323           extension = 2;                /* 1 opcode + 2 displacement  */
12324           opcode[0] = 0xe9;
12325           where_to_put_displacement = &opcode[1];
12326           break;
12327
12328         case ENCODE_RELAX_STATE (COND_JUMP, BIG):
12329         case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
12330           extension = 5;                /* 2 opcode + 4 displacement  */
12331           opcode[1] = opcode[0] + 0x10;
12332           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12333           where_to_put_displacement = &opcode[2];
12334           break;
12335
12336         case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
12337           extension = 3;                /* 2 opcode + 2 displacement  */
12338           opcode[1] = opcode[0] + 0x10;
12339           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12340           where_to_put_displacement = &opcode[2];
12341           break;
12342
12343         case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
12344           extension = 4;
12345           opcode[0] ^= 1;
12346           opcode[1] = 3;
12347           opcode[2] = 0xe9;
12348           where_to_put_displacement = &opcode[3];
12349           break;
12350
12351         default:
12352           BAD_CASE (fragP->fr_subtype);
12353           break;
12354         }
12355     }
12356
12357   /* If size if less then four we are sure that the operand fits,
12358      but if it's 4, then it could be that the displacement is larger
12359      then -/+ 2GB.  */
12360   if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
12361       && object_64bit
12362       && ((addressT) (displacement_from_opcode_start - extension
12363                       + ((addressT) 1 << 31))
12364           > (((addressT) 2 << 31) - 1)))
12365     {
12366       as_bad_where (fragP->fr_file, fragP->fr_line,
12367                     _("jump target out of range"));
12368       /* Make us emit 0.  */
12369       displacement_from_opcode_start = extension;
12370     }
12371   /* Now put displacement after opcode.  */
12372   md_number_to_chars ((char *) where_to_put_displacement,
12373                       (valueT) (displacement_from_opcode_start - extension),
12374                       DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
12375   fragP->fr_fix += extension;
12376 }
12377 \f
12378 /* Apply a fixup (fixP) to segment data, once it has been determined
12379    by our caller that we have all the info we need to fix it up.
12380
12381    Parameter valP is the pointer to the value of the bits.
12382
12383    On the 386, immediates, displacements, and data pointers are all in
12384    the same (little-endian) format, so we don't need to care about which
12385    we are handling.  */
12386
12387 void
12388 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
12389 {
12390   char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
12391   valueT value = *valP;
12392
12393 #if !defined (TE_Mach)
12394   if (fixP->fx_pcrel)
12395     {
12396       switch (fixP->fx_r_type)
12397         {
12398         default:
12399           break;
12400
12401         case BFD_RELOC_64:
12402           fixP->fx_r_type = BFD_RELOC_64_PCREL;
12403           break;
12404         case BFD_RELOC_32:
12405         case BFD_RELOC_X86_64_32S:
12406           fixP->fx_r_type = BFD_RELOC_32_PCREL;
12407           break;
12408         case BFD_RELOC_16:
12409           fixP->fx_r_type = BFD_RELOC_16_PCREL;
12410           break;
12411         case BFD_RELOC_8:
12412           fixP->fx_r_type = BFD_RELOC_8_PCREL;
12413           break;
12414         }
12415     }
12416
12417   if (fixP->fx_addsy != NULL
12418       && (fixP->fx_r_type == BFD_RELOC_32_PCREL
12419           || fixP->fx_r_type == BFD_RELOC_64_PCREL
12420           || fixP->fx_r_type == BFD_RELOC_16_PCREL
12421           || fixP->fx_r_type == BFD_RELOC_8_PCREL)
12422       && !use_rela_relocations)
12423     {
12424       /* This is a hack.  There should be a better way to handle this.
12425          This covers for the fact that bfd_install_relocation will
12426          subtract the current location (for partial_inplace, PC relative
12427          relocations); see more below.  */
12428 #ifndef OBJ_AOUT
12429       if (IS_ELF
12430 #ifdef TE_PE
12431           || OUTPUT_FLAVOR == bfd_target_coff_flavour
12432 #endif
12433           )
12434         value += fixP->fx_where + fixP->fx_frag->fr_address;
12435 #endif
12436 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12437       if (IS_ELF)
12438         {
12439           segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
12440
12441           if ((sym_seg == seg
12442                || (symbol_section_p (fixP->fx_addsy)
12443                    && sym_seg != absolute_section))
12444               && !generic_force_reloc (fixP))
12445             {
12446               /* Yes, we add the values in twice.  This is because
12447                  bfd_install_relocation subtracts them out again.  I think
12448                  bfd_install_relocation is broken, but I don't dare change
12449                  it.  FIXME.  */
12450               value += fixP->fx_where + fixP->fx_frag->fr_address;
12451             }
12452         }
12453 #endif
12454 #if defined (OBJ_COFF) && defined (TE_PE)
12455       /* For some reason, the PE format does not store a
12456          section address offset for a PC relative symbol.  */
12457       if (S_GET_SEGMENT (fixP->fx_addsy) != seg
12458           || S_IS_WEAK (fixP->fx_addsy))
12459         value += md_pcrel_from (fixP);
12460 #endif
12461     }
12462 #if defined (OBJ_COFF) && defined (TE_PE)
12463   if (fixP->fx_addsy != NULL
12464       && S_IS_WEAK (fixP->fx_addsy)
12465       /* PR 16858: Do not modify weak function references.  */
12466       && ! fixP->fx_pcrel)
12467     {
12468 #if !defined (TE_PEP)
12469       /* For x86 PE weak function symbols are neither PC-relative
12470          nor do they set S_IS_FUNCTION.  So the only reliable way
12471          to detect them is to check the flags of their containing
12472          section.  */
12473       if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
12474           && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
12475         ;
12476       else
12477 #endif
12478       value -= S_GET_VALUE (fixP->fx_addsy);
12479     }
12480 #endif
12481
12482   /* Fix a few things - the dynamic linker expects certain values here,
12483      and we must not disappoint it.  */
12484 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12485   if (IS_ELF && fixP->fx_addsy)
12486     switch (fixP->fx_r_type)
12487       {
12488       case BFD_RELOC_386_PLT32:
12489       case BFD_RELOC_X86_64_PLT32:
12490         /* Make the jump instruction point to the address of the operand.
12491            At runtime we merely add the offset to the actual PLT entry.
12492            NB: Subtract the offset size only for jump instructions.  */
12493         if (fixP->fx_pcrel)
12494           value = -4;
12495         break;
12496
12497       case BFD_RELOC_386_TLS_GD:
12498       case BFD_RELOC_386_TLS_LDM:
12499       case BFD_RELOC_386_TLS_IE_32:
12500       case BFD_RELOC_386_TLS_IE:
12501       case BFD_RELOC_386_TLS_GOTIE:
12502       case BFD_RELOC_386_TLS_GOTDESC:
12503       case BFD_RELOC_X86_64_TLSGD:
12504       case BFD_RELOC_X86_64_TLSLD:
12505       case BFD_RELOC_X86_64_GOTTPOFF:
12506       case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
12507         value = 0; /* Fully resolved at runtime.  No addend.  */
12508         /* Fallthrough */
12509       case BFD_RELOC_386_TLS_LE:
12510       case BFD_RELOC_386_TLS_LDO_32:
12511       case BFD_RELOC_386_TLS_LE_32:
12512       case BFD_RELOC_X86_64_DTPOFF32:
12513       case BFD_RELOC_X86_64_DTPOFF64:
12514       case BFD_RELOC_X86_64_TPOFF32:
12515       case BFD_RELOC_X86_64_TPOFF64:
12516         S_SET_THREAD_LOCAL (fixP->fx_addsy);
12517         break;
12518
12519       case BFD_RELOC_386_TLS_DESC_CALL:
12520       case BFD_RELOC_X86_64_TLSDESC_CALL:
12521         value = 0; /* Fully resolved at runtime.  No addend.  */
12522         S_SET_THREAD_LOCAL (fixP->fx_addsy);
12523         fixP->fx_done = 0;
12524         return;
12525
12526       case BFD_RELOC_VTABLE_INHERIT:
12527       case BFD_RELOC_VTABLE_ENTRY:
12528         fixP->fx_done = 0;
12529         return;
12530
12531       default:
12532         break;
12533       }
12534 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)  */
12535   *valP = value;
12536 #endif /* !defined (TE_Mach)  */
12537
12538   /* Are we finished with this relocation now?  */
12539   if (fixP->fx_addsy == NULL)
12540     fixP->fx_done = 1;
12541 #if defined (OBJ_COFF) && defined (TE_PE)
12542   else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
12543     {
12544       fixP->fx_done = 0;
12545       /* Remember value for tc_gen_reloc.  */
12546       fixP->fx_addnumber = value;
12547       /* Clear out the frag for now.  */
12548       value = 0;
12549     }
12550 #endif
12551   else if (use_rela_relocations)
12552     {
12553       fixP->fx_no_overflow = 1;
12554       /* Remember value for tc_gen_reloc.  */
12555       fixP->fx_addnumber = value;
12556       value = 0;
12557     }
12558
12559   md_number_to_chars (p, value, fixP->fx_size);
12560 }
12561 \f
12562 const char *
12563 md_atof (int type, char *litP, int *sizeP)
12564 {
12565   /* This outputs the LITTLENUMs in REVERSE order;
12566      in accord with the bigendian 386.  */
12567   return ieee_md_atof (type, litP, sizeP, FALSE);
12568 }
12569 \f
12570 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
12571
12572 static char *
12573 output_invalid (int c)
12574 {
12575   if (ISPRINT (c))
12576     snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12577               "'%c'", c);
12578   else
12579     snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12580               "(0x%x)", (unsigned char) c);
12581   return output_invalid_buf;
12582 }
12583
12584 /* Verify that @r can be used in the current context.  */
12585
12586 static bfd_boolean check_register (const reg_entry *r)
12587 {
12588   if (allow_pseudo_reg)
12589     return TRUE;
12590
12591   if (operand_type_all_zero (&r->reg_type))
12592     return FALSE;
12593
12594   if ((r->reg_type.bitfield.dword
12595        || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
12596        || r->reg_type.bitfield.class == RegCR
12597        || r->reg_type.bitfield.class == RegDR)
12598       && !cpu_arch_flags.bitfield.cpui386)
12599     return FALSE;
12600
12601   if (r->reg_type.bitfield.class == RegTR
12602       && (flag_code == CODE_64BIT
12603           || !cpu_arch_flags.bitfield.cpui386
12604           || cpu_arch_isa_flags.bitfield.cpui586
12605           || cpu_arch_isa_flags.bitfield.cpui686))
12606     return FALSE;
12607
12608   if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
12609     return FALSE;
12610
12611   if (!cpu_arch_flags.bitfield.cpuavx512f)
12612     {
12613       if (r->reg_type.bitfield.zmmword
12614           || r->reg_type.bitfield.class == RegMask)
12615         return FALSE;
12616
12617       if (!cpu_arch_flags.bitfield.cpuavx)
12618         {
12619           if (r->reg_type.bitfield.ymmword)
12620             return FALSE;
12621
12622           if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
12623             return FALSE;
12624         }
12625     }
12626
12627   if (r->reg_type.bitfield.tmmword
12628       && (!cpu_arch_flags.bitfield.cpuamx_tile
12629           || flag_code != CODE_64BIT))
12630     return FALSE;
12631
12632   if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
12633     return FALSE;
12634
12635   /* Don't allow fake index register unless allow_index_reg isn't 0. */
12636   if (!allow_index_reg && r->reg_num == RegIZ)
12637     return FALSE;
12638
12639   /* Upper 16 vector registers are only available with VREX in 64bit
12640      mode, and require EVEX encoding.  */
12641   if (r->reg_flags & RegVRex)
12642     {
12643       if (!cpu_arch_flags.bitfield.cpuavx512f
12644           || flag_code != CODE_64BIT)
12645         return FALSE;
12646
12647       if (i.vec_encoding == vex_encoding_default)
12648         i.vec_encoding = vex_encoding_evex;
12649       else if (i.vec_encoding != vex_encoding_evex)
12650         i.vec_encoding = vex_encoding_error;
12651     }
12652
12653   if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
12654       && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
12655       && flag_code != CODE_64BIT)
12656     return FALSE;
12657
12658   if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
12659       && !intel_syntax)
12660     return FALSE;
12661
12662   return TRUE;
12663 }
12664
12665 /* REG_STRING starts *before* REGISTER_PREFIX.  */
12666
12667 static const reg_entry *
12668 parse_real_register (char *reg_string, char **end_op)
12669 {
12670   char *s = reg_string;
12671   char *p;
12672   char reg_name_given[MAX_REG_NAME_SIZE + 1];
12673   const reg_entry *r;
12674
12675   /* Skip possible REGISTER_PREFIX and possible whitespace.  */
12676   if (*s == REGISTER_PREFIX)
12677     ++s;
12678
12679   if (is_space_char (*s))
12680     ++s;
12681
12682   p = reg_name_given;
12683   while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
12684     {
12685       if (p >= reg_name_given + MAX_REG_NAME_SIZE)
12686         return (const reg_entry *) NULL;
12687       s++;
12688     }
12689
12690   /* For naked regs, make sure that we are not dealing with an identifier.
12691      This prevents confusing an identifier like `eax_var' with register
12692      `eax'.  */
12693   if (allow_naked_reg && identifier_chars[(unsigned char) *s])
12694     return (const reg_entry *) NULL;
12695
12696   *end_op = s;
12697
12698   r = (const reg_entry *) str_hash_find (reg_hash, reg_name_given);
12699
12700   /* Handle floating point regs, allowing spaces in the (i) part.  */
12701   if (r == i386_regtab /* %st is first entry of table  */)
12702     {
12703       if (!cpu_arch_flags.bitfield.cpu8087
12704           && !cpu_arch_flags.bitfield.cpu287
12705           && !cpu_arch_flags.bitfield.cpu387
12706           && !allow_pseudo_reg)
12707         return (const reg_entry *) NULL;
12708
12709       if (is_space_char (*s))
12710         ++s;
12711       if (*s == '(')
12712         {
12713           ++s;
12714           if (is_space_char (*s))
12715             ++s;
12716           if (*s >= '0' && *s <= '7')
12717             {
12718               int fpr = *s - '0';
12719               ++s;
12720               if (is_space_char (*s))
12721                 ++s;
12722               if (*s == ')')
12723                 {
12724                   *end_op = s + 1;
12725                   r = (const reg_entry *) str_hash_find (reg_hash, "st(0)");
12726                   know (r);
12727                   return r + fpr;
12728                 }
12729             }
12730           /* We have "%st(" then garbage.  */
12731           return (const reg_entry *) NULL;
12732         }
12733     }
12734
12735   return r && check_register (r) ? r : NULL;
12736 }
12737
12738 /* REG_STRING starts *before* REGISTER_PREFIX.  */
12739
12740 static const reg_entry *
12741 parse_register (char *reg_string, char **end_op)
12742 {
12743   const reg_entry *r;
12744
12745   if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
12746     r = parse_real_register (reg_string, end_op);
12747   else
12748     r = NULL;
12749   if (!r)
12750     {
12751       char *save = input_line_pointer;
12752       char c;
12753       symbolS *symbolP;
12754
12755       input_line_pointer = reg_string;
12756       c = get_symbol_name (&reg_string);
12757       symbolP = symbol_find (reg_string);
12758       if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
12759         {
12760           const expressionS *e = symbol_get_value_expression (symbolP);
12761
12762           know (e->X_op == O_register);
12763           know (e->X_add_number >= 0
12764                 && (valueT) e->X_add_number < i386_regtab_size);
12765           r = i386_regtab + e->X_add_number;
12766           if (!check_register (r))
12767             {
12768               as_bad (_("register '%s%s' cannot be used here"),
12769                       register_prefix, r->reg_name);
12770               r = &bad_reg;
12771             }
12772           *end_op = input_line_pointer;
12773         }
12774       *input_line_pointer = c;
12775       input_line_pointer = save;
12776     }
12777   return r;
12778 }
12779
12780 int
12781 i386_parse_name (char *name, expressionS *e, char *nextcharP)
12782 {
12783   const reg_entry *r;
12784   char *end = input_line_pointer;
12785
12786   *end = *nextcharP;
12787   r = parse_register (name, &input_line_pointer);
12788   if (r && end <= input_line_pointer)
12789     {
12790       *nextcharP = *input_line_pointer;
12791       *input_line_pointer = 0;
12792       if (r != &bad_reg)
12793         {
12794           e->X_op = O_register;
12795           e->X_add_number = r - i386_regtab;
12796         }
12797       else
12798           e->X_op = O_illegal;
12799       return 1;
12800     }
12801   input_line_pointer = end;
12802   *end = 0;
12803   return intel_syntax ? i386_intel_parse_name (name, e) : 0;
12804 }
12805
12806 void
12807 md_operand (expressionS *e)
12808 {
12809   char *end;
12810   const reg_entry *r;
12811
12812   switch (*input_line_pointer)
12813     {
12814     case REGISTER_PREFIX:
12815       r = parse_real_register (input_line_pointer, &end);
12816       if (r)
12817         {
12818           e->X_op = O_register;
12819           e->X_add_number = r - i386_regtab;
12820           input_line_pointer = end;
12821         }
12822       break;
12823
12824     case '[':
12825       gas_assert (intel_syntax);
12826       end = input_line_pointer++;
12827       expression (e);
12828       if (*input_line_pointer == ']')
12829         {
12830           ++input_line_pointer;
12831           e->X_op_symbol = make_expr_symbol (e);
12832           e->X_add_symbol = NULL;
12833           e->X_add_number = 0;
12834           e->X_op = O_index;
12835         }
12836       else
12837         {
12838           e->X_op = O_absent;
12839           input_line_pointer = end;
12840         }
12841       break;
12842     }
12843 }
12844
12845 \f
12846 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12847 const char *md_shortopts = "kVQ:sqnO::";
12848 #else
12849 const char *md_shortopts = "qnO::";
12850 #endif
12851
12852 #define OPTION_32 (OPTION_MD_BASE + 0)
12853 #define OPTION_64 (OPTION_MD_BASE + 1)
12854 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
12855 #define OPTION_MARCH (OPTION_MD_BASE + 3)
12856 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
12857 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
12858 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
12859 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
12860 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
12861 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
12862 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
12863 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
12864 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
12865 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
12866 #define OPTION_X32 (OPTION_MD_BASE + 14)
12867 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
12868 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
12869 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
12870 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
12871 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
12872 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
12873 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
12874 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
12875 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
12876 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
12877 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
12878 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
12879 #define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
12880 #define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
12881 #define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
12882 #define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
12883 #define OPTION_MLFENCE_AFTER_LOAD (OPTION_MD_BASE + 31)
12884 #define OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH (OPTION_MD_BASE + 32)
12885 #define OPTION_MLFENCE_BEFORE_RET (OPTION_MD_BASE + 33)
12886
12887 struct option md_longopts[] =
12888 {
12889   {"32", no_argument, NULL, OPTION_32},
12890 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12891      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12892   {"64", no_argument, NULL, OPTION_64},
12893 #endif
12894 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12895   {"x32", no_argument, NULL, OPTION_X32},
12896   {"mshared", no_argument, NULL, OPTION_MSHARED},
12897   {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
12898 #endif
12899   {"divide", no_argument, NULL, OPTION_DIVIDE},
12900   {"march", required_argument, NULL, OPTION_MARCH},
12901   {"mtune", required_argument, NULL, OPTION_MTUNE},
12902   {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
12903   {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
12904   {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
12905   {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
12906   {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
12907   {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
12908   {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
12909   {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
12910   {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
12911   {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
12912   {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
12913   {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
12914 # if defined (TE_PE) || defined (TE_PEP)
12915   {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
12916 #endif
12917   {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
12918   {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
12919   {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
12920   {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
12921   {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
12922   {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
12923   {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
12924   {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
12925   {"mlfence-after-load", required_argument, NULL, OPTION_MLFENCE_AFTER_LOAD},
12926   {"mlfence-before-indirect-branch", required_argument, NULL,
12927    OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH},
12928   {"mlfence-before-ret", required_argument, NULL, OPTION_MLFENCE_BEFORE_RET},
12929   {"mamd64", no_argument, NULL, OPTION_MAMD64},
12930   {"mintel64", no_argument, NULL, OPTION_MINTEL64},
12931   {NULL, no_argument, NULL, 0}
12932 };
12933 size_t md_longopts_size = sizeof (md_longopts);
12934
12935 int
12936 md_parse_option (int c, const char *arg)
12937 {
12938   unsigned int j;
12939   char *arch, *next, *saved, *type;
12940
12941   switch (c)
12942     {
12943     case 'n':
12944       optimize_align_code = 0;
12945       break;
12946
12947     case 'q':
12948       quiet_warnings = 1;
12949       break;
12950
12951 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12952       /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
12953          should be emitted or not.  FIXME: Not implemented.  */
12954     case 'Q':
12955       if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
12956         return 0;
12957       break;
12958
12959       /* -V: SVR4 argument to print version ID.  */
12960     case 'V':
12961       print_version_id ();
12962       break;
12963
12964       /* -k: Ignore for FreeBSD compatibility.  */
12965     case 'k':
12966       break;
12967
12968     case 's':
12969       /* -s: On i386 Solaris, this tells the native assembler to use
12970          .stab instead of .stab.excl.  We always use .stab anyhow.  */
12971       break;
12972
12973     case OPTION_MSHARED:
12974       shared = 1;
12975       break;
12976
12977     case OPTION_X86_USED_NOTE:
12978       if (strcasecmp (arg, "yes") == 0)
12979         x86_used_note = 1;
12980       else if (strcasecmp (arg, "no") == 0)
12981         x86_used_note = 0;
12982       else
12983         as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
12984       break;
12985
12986
12987 #endif
12988 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12989      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12990     case OPTION_64:
12991       {
12992         const char **list, **l;
12993
12994         list = bfd_target_list ();
12995         for (l = list; *l != NULL; l++)
12996           if (startswith (*l, "elf64-x86-64")
12997               || strcmp (*l, "coff-x86-64") == 0
12998               || strcmp (*l, "pe-x86-64") == 0
12999               || strcmp (*l, "pei-x86-64") == 0
13000               || strcmp (*l, "mach-o-x86-64") == 0)
13001             {
13002               default_arch = "x86_64";
13003               break;
13004             }
13005         if (*l == NULL)
13006           as_fatal (_("no compiled in support for x86_64"));
13007         free (list);
13008       }
13009       break;
13010 #endif
13011
13012 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13013     case OPTION_X32:
13014       if (IS_ELF)
13015         {
13016           const char **list, **l;
13017
13018           list = bfd_target_list ();
13019           for (l = list; *l != NULL; l++)
13020             if (startswith (*l, "elf32-x86-64"))
13021               {
13022                 default_arch = "x86_64:32";
13023                 break;
13024               }
13025           if (*l == NULL)
13026             as_fatal (_("no compiled in support for 32bit x86_64"));
13027           free (list);
13028         }
13029       else
13030         as_fatal (_("32bit x86_64 is only supported for ELF"));
13031       break;
13032 #endif
13033
13034     case OPTION_32:
13035       default_arch = "i386";
13036       break;
13037
13038     case OPTION_DIVIDE:
13039 #ifdef SVR4_COMMENT_CHARS
13040       {
13041         char *n, *t;
13042         const char *s;
13043
13044         n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
13045         t = n;
13046         for (s = i386_comment_chars; *s != '\0'; s++)
13047           if (*s != '/')
13048             *t++ = *s;
13049         *t = '\0';
13050         i386_comment_chars = n;
13051       }
13052 #endif
13053       break;
13054
13055     case OPTION_MARCH:
13056       saved = xstrdup (arg);
13057       arch = saved;
13058       /* Allow -march=+nosse.  */
13059       if (*arch == '+')
13060         arch++;
13061       do
13062         {
13063           if (*arch == '.')
13064             as_fatal (_("invalid -march= option: `%s'"), arg);
13065           next = strchr (arch, '+');
13066           if (next)
13067             *next++ = '\0';
13068           for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13069             {
13070               if (strcmp (arch, cpu_arch [j].name) == 0)
13071                 {
13072                   /* Processor.  */
13073                   if (! cpu_arch[j].flags.bitfield.cpui386)
13074                     continue;
13075
13076                   cpu_arch_name = cpu_arch[j].name;
13077                   cpu_sub_arch_name = NULL;
13078                   cpu_arch_flags = cpu_arch[j].flags;
13079                   cpu_arch_isa = cpu_arch[j].type;
13080                   cpu_arch_isa_flags = cpu_arch[j].flags;
13081                   if (!cpu_arch_tune_set)
13082                     {
13083                       cpu_arch_tune = cpu_arch_isa;
13084                       cpu_arch_tune_flags = cpu_arch_isa_flags;
13085                     }
13086                   break;
13087                 }
13088               else if (*cpu_arch [j].name == '.'
13089                        && strcmp (arch, cpu_arch [j].name + 1) == 0)
13090                 {
13091                   /* ISA extension.  */
13092                   i386_cpu_flags flags;
13093
13094                   flags = cpu_flags_or (cpu_arch_flags,
13095                                         cpu_arch[j].flags);
13096
13097                   if (!cpu_flags_equal (&flags, &cpu_arch_flags))
13098                     {
13099                       if (cpu_sub_arch_name)
13100                         {
13101                           char *name = cpu_sub_arch_name;
13102                           cpu_sub_arch_name = concat (name,
13103                                                       cpu_arch[j].name,
13104                                                       (const char *) NULL);
13105                           free (name);
13106                         }
13107                       else
13108                         cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
13109                       cpu_arch_flags = flags;
13110                       cpu_arch_isa_flags = flags;
13111                     }
13112                   else
13113                     cpu_arch_isa_flags
13114                       = cpu_flags_or (cpu_arch_isa_flags,
13115                                       cpu_arch[j].flags);
13116                   break;
13117                 }
13118             }
13119
13120           if (j >= ARRAY_SIZE (cpu_arch))
13121             {
13122               /* Disable an ISA extension.  */
13123               for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
13124                 if (strcmp (arch, cpu_noarch [j].name) == 0)
13125                   {
13126                     i386_cpu_flags flags;
13127
13128                     flags = cpu_flags_and_not (cpu_arch_flags,
13129                                                cpu_noarch[j].flags);
13130                     if (!cpu_flags_equal (&flags, &cpu_arch_flags))
13131                       {
13132                         if (cpu_sub_arch_name)
13133                           {
13134                             char *name = cpu_sub_arch_name;
13135                             cpu_sub_arch_name = concat (arch,
13136                                                         (const char *) NULL);
13137                             free (name);
13138                           }
13139                         else
13140                           cpu_sub_arch_name = xstrdup (arch);
13141                         cpu_arch_flags = flags;
13142                         cpu_arch_isa_flags = flags;
13143                       }
13144                     break;
13145                   }
13146
13147               if (j >= ARRAY_SIZE (cpu_noarch))
13148                 j = ARRAY_SIZE (cpu_arch);
13149             }
13150
13151           if (j >= ARRAY_SIZE (cpu_arch))
13152             as_fatal (_("invalid -march= option: `%s'"), arg);
13153
13154           arch = next;
13155         }
13156       while (next != NULL);
13157       free (saved);
13158       break;
13159
13160     case OPTION_MTUNE:
13161       if (*arg == '.')
13162         as_fatal (_("invalid -mtune= option: `%s'"), arg);
13163       for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13164         {
13165           if (strcmp (arg, cpu_arch [j].name) == 0)
13166             {
13167               cpu_arch_tune_set = 1;
13168               cpu_arch_tune = cpu_arch [j].type;
13169               cpu_arch_tune_flags = cpu_arch[j].flags;
13170               break;
13171             }
13172         }
13173       if (j >= ARRAY_SIZE (cpu_arch))
13174         as_fatal (_("invalid -mtune= option: `%s'"), arg);
13175       break;
13176
13177     case OPTION_MMNEMONIC:
13178       if (strcasecmp (arg, "att") == 0)
13179         intel_mnemonic = 0;
13180       else if (strcasecmp (arg, "intel") == 0)
13181         intel_mnemonic = 1;
13182       else
13183         as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
13184       break;
13185
13186     case OPTION_MSYNTAX:
13187       if (strcasecmp (arg, "att") == 0)
13188         intel_syntax = 0;
13189       else if (strcasecmp (arg, "intel") == 0)
13190         intel_syntax = 1;
13191       else
13192         as_fatal (_("invalid -msyntax= option: `%s'"), arg);
13193       break;
13194
13195     case OPTION_MINDEX_REG:
13196       allow_index_reg = 1;
13197       break;
13198
13199     case OPTION_MNAKED_REG:
13200       allow_naked_reg = 1;
13201       break;
13202
13203     case OPTION_MSSE2AVX:
13204       sse2avx = 1;
13205       break;
13206
13207     case OPTION_MSSE_CHECK:
13208       if (strcasecmp (arg, "error") == 0)
13209         sse_check = check_error;
13210       else if (strcasecmp (arg, "warning") == 0)
13211         sse_check = check_warning;
13212       else if (strcasecmp (arg, "none") == 0)
13213         sse_check = check_none;
13214       else
13215         as_fatal (_("invalid -msse-check= option: `%s'"), arg);
13216       break;
13217
13218     case OPTION_MOPERAND_CHECK:
13219       if (strcasecmp (arg, "error") == 0)
13220         operand_check = check_error;
13221       else if (strcasecmp (arg, "warning") == 0)
13222         operand_check = check_warning;
13223       else if (strcasecmp (arg, "none") == 0)
13224         operand_check = check_none;
13225       else
13226         as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
13227       break;
13228
13229     case OPTION_MAVXSCALAR:
13230       if (strcasecmp (arg, "128") == 0)
13231         avxscalar = vex128;
13232       else if (strcasecmp (arg, "256") == 0)
13233         avxscalar = vex256;
13234       else
13235         as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
13236       break;
13237
13238     case OPTION_MVEXWIG:
13239       if (strcmp (arg, "0") == 0)
13240         vexwig = vexw0;
13241       else if (strcmp (arg, "1") == 0)
13242         vexwig = vexw1;
13243       else
13244         as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
13245       break;
13246
13247     case OPTION_MADD_BND_PREFIX:
13248       add_bnd_prefix = 1;
13249       break;
13250
13251     case OPTION_MEVEXLIG:
13252       if (strcmp (arg, "128") == 0)
13253         evexlig = evexl128;
13254       else if (strcmp (arg, "256") == 0)
13255         evexlig = evexl256;
13256       else  if (strcmp (arg, "512") == 0)
13257         evexlig = evexl512;
13258       else
13259         as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
13260       break;
13261
13262     case OPTION_MEVEXRCIG:
13263       if (strcmp (arg, "rne") == 0)
13264         evexrcig = rne;
13265       else if (strcmp (arg, "rd") == 0)
13266         evexrcig = rd;
13267       else if (strcmp (arg, "ru") == 0)
13268         evexrcig = ru;
13269       else if (strcmp (arg, "rz") == 0)
13270         evexrcig = rz;
13271       else
13272         as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
13273       break;
13274
13275     case OPTION_MEVEXWIG:
13276       if (strcmp (arg, "0") == 0)
13277         evexwig = evexw0;
13278       else if (strcmp (arg, "1") == 0)
13279         evexwig = evexw1;
13280       else
13281         as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
13282       break;
13283
13284 # if defined (TE_PE) || defined (TE_PEP)
13285     case OPTION_MBIG_OBJ:
13286       use_big_obj = 1;
13287       break;
13288 #endif
13289
13290     case OPTION_MOMIT_LOCK_PREFIX:
13291       if (strcasecmp (arg, "yes") == 0)
13292         omit_lock_prefix = 1;
13293       else if (strcasecmp (arg, "no") == 0)
13294         omit_lock_prefix = 0;
13295       else
13296         as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
13297       break;
13298
13299     case OPTION_MFENCE_AS_LOCK_ADD:
13300       if (strcasecmp (arg, "yes") == 0)
13301         avoid_fence = 1;
13302       else if (strcasecmp (arg, "no") == 0)
13303         avoid_fence = 0;
13304       else
13305         as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
13306       break;
13307
13308     case OPTION_MLFENCE_AFTER_LOAD:
13309       if (strcasecmp (arg, "yes") == 0)
13310         lfence_after_load = 1;
13311       else if (strcasecmp (arg, "no") == 0)
13312         lfence_after_load = 0;
13313       else
13314         as_fatal (_("invalid -mlfence-after-load= option: `%s'"), arg);
13315       break;
13316
13317     case OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH:
13318       if (strcasecmp (arg, "all") == 0)
13319         {
13320           lfence_before_indirect_branch = lfence_branch_all;
13321           if (lfence_before_ret == lfence_before_ret_none)
13322             lfence_before_ret = lfence_before_ret_shl;
13323         }
13324       else if (strcasecmp (arg, "memory") == 0)
13325         lfence_before_indirect_branch = lfence_branch_memory;
13326       else if (strcasecmp (arg, "register") == 0)
13327         lfence_before_indirect_branch = lfence_branch_register;
13328       else if (strcasecmp (arg, "none") == 0)
13329         lfence_before_indirect_branch = lfence_branch_none;
13330       else
13331         as_fatal (_("invalid -mlfence-before-indirect-branch= option: `%s'"),
13332                   arg);
13333       break;
13334
13335     case OPTION_MLFENCE_BEFORE_RET:
13336       if (strcasecmp (arg, "or") == 0)
13337         lfence_before_ret = lfence_before_ret_or;
13338       else if (strcasecmp (arg, "not") == 0)
13339         lfence_before_ret = lfence_before_ret_not;
13340       else if (strcasecmp (arg, "shl") == 0 || strcasecmp (arg, "yes") == 0)
13341         lfence_before_ret = lfence_before_ret_shl;
13342       else if (strcasecmp (arg, "none") == 0)
13343         lfence_before_ret = lfence_before_ret_none;
13344       else
13345         as_fatal (_("invalid -mlfence-before-ret= option: `%s'"),
13346                   arg);
13347       break;
13348
13349     case OPTION_MRELAX_RELOCATIONS:
13350       if (strcasecmp (arg, "yes") == 0)
13351         generate_relax_relocations = 1;
13352       else if (strcasecmp (arg, "no") == 0)
13353         generate_relax_relocations = 0;
13354       else
13355         as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
13356       break;
13357
13358     case OPTION_MALIGN_BRANCH_BOUNDARY:
13359       {
13360         char *end;
13361         long int align = strtoul (arg, &end, 0);
13362         if (*end == '\0')
13363           {
13364             if (align == 0)
13365               {
13366                 align_branch_power = 0;
13367                 break;
13368               }
13369             else if (align >= 16)
13370               {
13371                 int align_power;
13372                 for (align_power = 0;
13373                      (align & 1) == 0;
13374                      align >>= 1, align_power++)
13375                   continue;
13376                 /* Limit alignment power to 31.  */
13377                 if (align == 1 && align_power < 32)
13378                   {
13379                     align_branch_power = align_power;
13380                     break;
13381                   }
13382               }
13383           }
13384         as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
13385       }
13386       break;
13387
13388     case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
13389       {
13390         char *end;
13391         int align = strtoul (arg, &end, 0);
13392         /* Some processors only support 5 prefixes.  */
13393         if (*end == '\0' && align >= 0 && align < 6)
13394           {
13395             align_branch_prefix_size = align;
13396             break;
13397           }
13398         as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
13399                   arg);
13400       }
13401       break;
13402
13403     case OPTION_MALIGN_BRANCH:
13404       align_branch = 0;
13405       saved = xstrdup (arg);
13406       type = saved;
13407       do
13408         {
13409           next = strchr (type, '+');
13410           if (next)
13411             *next++ = '\0';
13412           if (strcasecmp (type, "jcc") == 0)
13413             align_branch |= align_branch_jcc_bit;
13414           else if (strcasecmp (type, "fused") == 0)
13415             align_branch |= align_branch_fused_bit;
13416           else if (strcasecmp (type, "jmp") == 0)
13417             align_branch |= align_branch_jmp_bit;
13418           else if (strcasecmp (type, "call") == 0)
13419             align_branch |= align_branch_call_bit;
13420           else if (strcasecmp (type, "ret") == 0)
13421             align_branch |= align_branch_ret_bit;
13422           else if (strcasecmp (type, "indirect") == 0)
13423             align_branch |= align_branch_indirect_bit;
13424           else
13425             as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
13426           type = next;
13427         }
13428       while (next != NULL);
13429       free (saved);
13430       break;
13431
13432     case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
13433       align_branch_power = 5;
13434       align_branch_prefix_size = 5;
13435       align_branch = (align_branch_jcc_bit
13436                       | align_branch_fused_bit
13437                       | align_branch_jmp_bit);
13438       break;
13439
13440     case OPTION_MAMD64:
13441       isa64 = amd64;
13442       break;
13443
13444     case OPTION_MINTEL64:
13445       isa64 = intel64;
13446       break;
13447
13448     case 'O':
13449       if (arg == NULL)
13450         {
13451           optimize = 1;
13452           /* Turn off -Os.  */
13453           optimize_for_space = 0;
13454         }
13455       else if (*arg == 's')
13456         {
13457           optimize_for_space = 1;
13458           /* Turn on all encoding optimizations.  */
13459           optimize = INT_MAX;
13460         }
13461       else
13462         {
13463           optimize = atoi (arg);
13464           /* Turn off -Os.  */
13465           optimize_for_space = 0;
13466         }
13467       break;
13468
13469     default:
13470       return 0;
13471     }
13472   return 1;
13473 }
13474
13475 #define MESSAGE_TEMPLATE \
13476 "                                                                                "
13477
13478 static char *
13479 output_message (FILE *stream, char *p, char *message, char *start,
13480                 int *left_p, const char *name, int len)
13481 {
13482   int size = sizeof (MESSAGE_TEMPLATE);
13483   int left = *left_p;
13484
13485   /* Reserve 2 spaces for ", " or ",\0" */
13486   left -= len + 2;
13487
13488   /* Check if there is any room.  */
13489   if (left >= 0)
13490     {
13491       if (p != start)
13492         {
13493           *p++ = ',';
13494           *p++ = ' ';
13495         }
13496       p = mempcpy (p, name, len);
13497     }
13498   else
13499     {
13500       /* Output the current message now and start a new one.  */
13501       *p++ = ',';
13502       *p = '\0';
13503       fprintf (stream, "%s\n", message);
13504       p = start;
13505       left = size - (start - message) - len - 2;
13506
13507       gas_assert (left >= 0);
13508
13509       p = mempcpy (p, name, len);
13510     }
13511
13512   *left_p = left;
13513   return p;
13514 }
13515
13516 static void
13517 show_arch (FILE *stream, int ext, int check)
13518 {
13519   static char message[] = MESSAGE_TEMPLATE;
13520   char *start = message + 27;
13521   char *p;
13522   int size = sizeof (MESSAGE_TEMPLATE);
13523   int left;
13524   const char *name;
13525   int len;
13526   unsigned int j;
13527
13528   p = start;
13529   left = size - (start - message);
13530   for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13531     {
13532       /* Should it be skipped?  */
13533       if (cpu_arch [j].skip)
13534         continue;
13535
13536       name = cpu_arch [j].name;
13537       len = cpu_arch [j].len;
13538       if (*name == '.')
13539         {
13540           /* It is an extension.  Skip if we aren't asked to show it.  */
13541           if (ext)
13542             {
13543               name++;
13544               len--;
13545             }
13546           else
13547             continue;
13548         }
13549       else if (ext)
13550         {
13551           /* It is an processor.  Skip if we show only extension.  */
13552           continue;
13553         }
13554       else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
13555         {
13556           /* It is an impossible processor - skip.  */
13557           continue;
13558         }
13559
13560       p = output_message (stream, p, message, start, &left, name, len);
13561     }
13562
13563   /* Display disabled extensions.  */
13564   if (ext)
13565     for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
13566       {
13567         name = cpu_noarch [j].name;
13568         len = cpu_noarch [j].len;
13569         p = output_message (stream, p, message, start, &left, name,
13570                             len);
13571       }
13572
13573   *p = '\0';
13574   fprintf (stream, "%s\n", message);
13575 }
13576
13577 void
13578 md_show_usage (FILE *stream)
13579 {
13580 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13581   fprintf (stream, _("\
13582   -Qy, -Qn                ignored\n\
13583   -V                      print assembler version number\n\
13584   -k                      ignored\n"));
13585 #endif
13586   fprintf (stream, _("\
13587   -n                      Do not optimize code alignment\n\
13588   -q                      quieten some warnings\n"));
13589 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13590   fprintf (stream, _("\
13591   -s                      ignored\n"));
13592 #endif
13593 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13594                       || defined (TE_PE) || defined (TE_PEP))
13595   fprintf (stream, _("\
13596   --32/--64/--x32         generate 32bit/64bit/x32 code\n"));
13597 #endif
13598 #ifdef SVR4_COMMENT_CHARS
13599   fprintf (stream, _("\
13600   --divide                do not treat `/' as a comment character\n"));
13601 #else
13602   fprintf (stream, _("\
13603   --divide                ignored\n"));
13604 #endif
13605   fprintf (stream, _("\
13606   -march=CPU[,+EXTENSION...]\n\
13607                           generate code for CPU and EXTENSION, CPU is one of:\n"));
13608   show_arch (stream, 0, 1);
13609   fprintf (stream, _("\
13610                           EXTENSION is combination of:\n"));
13611   show_arch (stream, 1, 0);
13612   fprintf (stream, _("\
13613   -mtune=CPU              optimize for CPU, CPU is one of:\n"));
13614   show_arch (stream, 0, 0);
13615   fprintf (stream, _("\
13616   -msse2avx               encode SSE instructions with VEX prefix\n"));
13617   fprintf (stream, _("\
13618   -msse-check=[none|error|warning] (default: warning)\n\
13619                           check SSE instructions\n"));
13620   fprintf (stream, _("\
13621   -moperand-check=[none|error|warning] (default: warning)\n\
13622                           check operand combinations for validity\n"));
13623   fprintf (stream, _("\
13624   -mavxscalar=[128|256] (default: 128)\n\
13625                           encode scalar AVX instructions with specific vector\n\
13626                            length\n"));
13627   fprintf (stream, _("\
13628   -mvexwig=[0|1] (default: 0)\n\
13629                           encode VEX instructions with specific VEX.W value\n\
13630                            for VEX.W bit ignored instructions\n"));
13631   fprintf (stream, _("\
13632   -mevexlig=[128|256|512] (default: 128)\n\
13633                           encode scalar EVEX instructions with specific vector\n\
13634                            length\n"));
13635   fprintf (stream, _("\
13636   -mevexwig=[0|1] (default: 0)\n\
13637                           encode EVEX instructions with specific EVEX.W value\n\
13638                            for EVEX.W bit ignored instructions\n"));
13639   fprintf (stream, _("\
13640   -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
13641                           encode EVEX instructions with specific EVEX.RC value\n\
13642                            for SAE-only ignored instructions\n"));
13643   fprintf (stream, _("\
13644   -mmnemonic=[att|intel] "));
13645   if (SYSV386_COMPAT)
13646     fprintf (stream, _("(default: att)\n"));
13647   else
13648     fprintf (stream, _("(default: intel)\n"));
13649   fprintf (stream, _("\
13650                           use AT&T/Intel mnemonic\n"));
13651   fprintf (stream, _("\
13652   -msyntax=[att|intel] (default: att)\n\
13653                           use AT&T/Intel syntax\n"));
13654   fprintf (stream, _("\
13655   -mindex-reg             support pseudo index registers\n"));
13656   fprintf (stream, _("\
13657   -mnaked-reg             don't require `%%' prefix for registers\n"));
13658   fprintf (stream, _("\
13659   -madd-bnd-prefix        add BND prefix for all valid branches\n"));
13660 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13661   fprintf (stream, _("\
13662   -mshared                disable branch optimization for shared code\n"));
13663   fprintf (stream, _("\
13664   -mx86-used-note=[no|yes] "));
13665   if (DEFAULT_X86_USED_NOTE)
13666     fprintf (stream, _("(default: yes)\n"));
13667   else
13668     fprintf (stream, _("(default: no)\n"));
13669   fprintf (stream, _("\
13670                           generate x86 used ISA and feature properties\n"));
13671 #endif
13672 #if defined (TE_PE) || defined (TE_PEP)
13673   fprintf (stream, _("\
13674   -mbig-obj               generate big object files\n"));
13675 #endif
13676   fprintf (stream, _("\
13677   -momit-lock-prefix=[no|yes] (default: no)\n\
13678                           strip all lock prefixes\n"));
13679   fprintf (stream, _("\
13680   -mfence-as-lock-add=[no|yes] (default: no)\n\
13681                           encode lfence, mfence and sfence as\n\
13682                            lock addl $0x0, (%%{re}sp)\n"));
13683   fprintf (stream, _("\
13684   -mrelax-relocations=[no|yes] "));
13685   if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
13686     fprintf (stream, _("(default: yes)\n"));
13687   else
13688     fprintf (stream, _("(default: no)\n"));
13689   fprintf (stream, _("\
13690                           generate relax relocations\n"));
13691   fprintf (stream, _("\
13692   -malign-branch-boundary=NUM (default: 0)\n\
13693                           align branches within NUM byte boundary\n"));
13694   fprintf (stream, _("\
13695   -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
13696                           TYPE is combination of jcc, fused, jmp, call, ret,\n\
13697                            indirect\n\
13698                           specify types of branches to align\n"));
13699   fprintf (stream, _("\
13700   -malign-branch-prefix-size=NUM (default: 5)\n\
13701                           align branches with NUM prefixes per instruction\n"));
13702   fprintf (stream, _("\
13703   -mbranches-within-32B-boundaries\n\
13704                           align branches within 32 byte boundary\n"));
13705   fprintf (stream, _("\
13706   -mlfence-after-load=[no|yes] (default: no)\n\
13707                           generate lfence after load\n"));
13708   fprintf (stream, _("\
13709   -mlfence-before-indirect-branch=[none|all|register|memory] (default: none)\n\
13710                           generate lfence before indirect near branch\n"));
13711   fprintf (stream, _("\
13712   -mlfence-before-ret=[none|or|not|shl|yes] (default: none)\n\
13713                           generate lfence before ret\n"));
13714   fprintf (stream, _("\
13715   -mamd64                 accept only AMD64 ISA [default]\n"));
13716   fprintf (stream, _("\
13717   -mintel64               accept only Intel64 ISA\n"));
13718 }
13719
13720 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
13721      || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13722      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
13723
13724 /* Pick the target format to use.  */
13725
13726 const char *
13727 i386_target_format (void)
13728 {
13729   if (!strncmp (default_arch, "x86_64", 6))
13730     {
13731       update_code_flag (CODE_64BIT, 1);
13732       if (default_arch[6] == '\0')
13733         x86_elf_abi = X86_64_ABI;
13734       else
13735         x86_elf_abi = X86_64_X32_ABI;
13736     }
13737   else if (!strcmp (default_arch, "i386"))
13738     update_code_flag (CODE_32BIT, 1);
13739   else if (!strcmp (default_arch, "iamcu"))
13740     {
13741       update_code_flag (CODE_32BIT, 1);
13742       if (cpu_arch_isa == PROCESSOR_UNKNOWN)
13743         {
13744           static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
13745           cpu_arch_name = "iamcu";
13746           cpu_sub_arch_name = NULL;
13747           cpu_arch_flags = iamcu_flags;
13748           cpu_arch_isa = PROCESSOR_IAMCU;
13749           cpu_arch_isa_flags = iamcu_flags;
13750           if (!cpu_arch_tune_set)
13751             {
13752               cpu_arch_tune = cpu_arch_isa;
13753               cpu_arch_tune_flags = cpu_arch_isa_flags;
13754             }
13755         }
13756       else if (cpu_arch_isa != PROCESSOR_IAMCU)
13757         as_fatal (_("Intel MCU doesn't support `%s' architecture"),
13758                   cpu_arch_name);
13759     }
13760   else
13761     as_fatal (_("unknown architecture"));
13762
13763   if (cpu_flags_all_zero (&cpu_arch_isa_flags))
13764     cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13765   if (cpu_flags_all_zero (&cpu_arch_tune_flags))
13766     cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13767
13768   switch (OUTPUT_FLAVOR)
13769     {
13770 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
13771     case bfd_target_aout_flavour:
13772       return AOUT_TARGET_FORMAT;
13773 #endif
13774 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
13775 # if defined (TE_PE) || defined (TE_PEP)
13776     case bfd_target_coff_flavour:
13777       if (flag_code == CODE_64BIT)
13778         return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
13779       else
13780         return use_big_obj ? "pe-bigobj-i386" : "pe-i386";
13781 # elif defined (TE_GO32)
13782     case bfd_target_coff_flavour:
13783       return "coff-go32";
13784 # else
13785     case bfd_target_coff_flavour:
13786       return "coff-i386";
13787 # endif
13788 #endif
13789 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
13790     case bfd_target_elf_flavour:
13791       {
13792         const char *format;
13793
13794         switch (x86_elf_abi)
13795           {
13796           default:
13797             format = ELF_TARGET_FORMAT;
13798 #ifndef TE_SOLARIS
13799             tls_get_addr = "___tls_get_addr";
13800 #endif
13801             break;
13802           case X86_64_ABI:
13803             use_rela_relocations = 1;
13804             object_64bit = 1;
13805 #ifndef TE_SOLARIS
13806             tls_get_addr = "__tls_get_addr";
13807 #endif
13808             format = ELF_TARGET_FORMAT64;
13809             break;
13810           case X86_64_X32_ABI:
13811             use_rela_relocations = 1;
13812             object_64bit = 1;
13813 #ifndef TE_SOLARIS
13814             tls_get_addr = "__tls_get_addr";
13815 #endif
13816             disallow_64bit_reloc = 1;
13817             format = ELF_TARGET_FORMAT32;
13818             break;
13819           }
13820         if (cpu_arch_isa == PROCESSOR_L1OM)
13821           {
13822             if (x86_elf_abi != X86_64_ABI)
13823               as_fatal (_("Intel L1OM is 64bit only"));
13824             return ELF_TARGET_L1OM_FORMAT;
13825           }
13826         else if (cpu_arch_isa == PROCESSOR_K1OM)
13827           {
13828             if (x86_elf_abi != X86_64_ABI)
13829               as_fatal (_("Intel K1OM is 64bit only"));
13830             return ELF_TARGET_K1OM_FORMAT;
13831           }
13832         else if (cpu_arch_isa == PROCESSOR_IAMCU)
13833           {
13834             if (x86_elf_abi != I386_ABI)
13835               as_fatal (_("Intel MCU is 32bit only"));
13836             return ELF_TARGET_IAMCU_FORMAT;
13837           }
13838         else
13839           return format;
13840       }
13841 #endif
13842 #if defined (OBJ_MACH_O)
13843     case bfd_target_mach_o_flavour:
13844       if (flag_code == CODE_64BIT)
13845         {
13846           use_rela_relocations = 1;
13847           object_64bit = 1;
13848           return "mach-o-x86-64";
13849         }
13850       else
13851         return "mach-o-i386";
13852 #endif
13853     default:
13854       abort ();
13855       return NULL;
13856     }
13857 }
13858
13859 #endif /* OBJ_MAYBE_ more than one  */
13860 \f
13861 symbolS *
13862 md_undefined_symbol (char *name)
13863 {
13864   if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
13865       && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
13866       && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
13867       && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
13868     {
13869       if (!GOT_symbol)
13870         {
13871           if (symbol_find (name))
13872             as_bad (_("GOT already in symbol table"));
13873           GOT_symbol = symbol_new (name, undefined_section,
13874                                    &zero_address_frag, 0);
13875         };
13876       return GOT_symbol;
13877     }
13878   return 0;
13879 }
13880
13881 /* Round up a section size to the appropriate boundary.  */
13882
13883 valueT
13884 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
13885 {
13886 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
13887   if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
13888     {
13889       /* For a.out, force the section size to be aligned.  If we don't do
13890          this, BFD will align it for us, but it will not write out the
13891          final bytes of the section.  This may be a bug in BFD, but it is
13892          easier to fix it here since that is how the other a.out targets
13893          work.  */
13894       int align;
13895
13896       align = bfd_section_alignment (segment);
13897       size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
13898     }
13899 #endif
13900
13901   return size;
13902 }
13903
13904 /* On the i386, PC-relative offsets are relative to the start of the
13905    next instruction.  That is, the address of the offset, plus its
13906    size, since the offset is always the last part of the insn.  */
13907
13908 long
13909 md_pcrel_from (fixS *fixP)
13910 {
13911   return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
13912 }
13913
13914 #ifndef I386COFF
13915
13916 static void
13917 s_bss (int ignore ATTRIBUTE_UNUSED)
13918 {
13919   int temp;
13920
13921 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13922   if (IS_ELF)
13923     obj_elf_section_change_hook ();
13924 #endif
13925   temp = get_absolute_expression ();
13926   subseg_set (bss_section, (subsegT) temp);
13927   demand_empty_rest_of_line ();
13928 }
13929
13930 #endif
13931
13932 /* Remember constant directive.  */
13933
13934 void
13935 i386_cons_align (int ignore ATTRIBUTE_UNUSED)
13936 {
13937   if (last_insn.kind != last_insn_directive
13938       && (bfd_section_flags (now_seg) & SEC_CODE))
13939     {
13940       last_insn.seg = now_seg;
13941       last_insn.kind = last_insn_directive;
13942       last_insn.name = "constant directive";
13943       last_insn.file = as_where (&last_insn.line);
13944       if (lfence_before_ret != lfence_before_ret_none)
13945         {
13946           if (lfence_before_indirect_branch != lfence_branch_none)
13947             as_warn (_("constant directive skips -mlfence-before-ret "
13948                        "and -mlfence-before-indirect-branch"));
13949           else
13950             as_warn (_("constant directive skips -mlfence-before-ret"));
13951         }
13952       else if (lfence_before_indirect_branch != lfence_branch_none)
13953         as_warn (_("constant directive skips -mlfence-before-indirect-branch"));
13954     }
13955 }
13956
13957 void
13958 i386_validate_fix (fixS *fixp)
13959 {
13960   if (fixp->fx_subsy)
13961     {
13962       if (fixp->fx_subsy == GOT_symbol)
13963         {
13964           if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
13965             {
13966               if (!object_64bit)
13967                 abort ();
13968 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13969               if (fixp->fx_tcbit2)
13970                 fixp->fx_r_type = (fixp->fx_tcbit
13971                                    ? BFD_RELOC_X86_64_REX_GOTPCRELX
13972                                    : BFD_RELOC_X86_64_GOTPCRELX);
13973               else
13974 #endif
13975                 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
13976             }
13977           else
13978             {
13979               if (!object_64bit)
13980                 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
13981               else
13982                 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
13983             }
13984           fixp->fx_subsy = 0;
13985         }
13986     }
13987 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13988   else
13989     {
13990       /* NB: Commit 292676c1 resolved PLT32 reloc aganst local symbol
13991          to section.  Since PLT32 relocation must be against symbols,
13992          turn such PLT32 relocation into PC32 relocation.  */
13993       if (fixp->fx_addsy
13994           && (fixp->fx_r_type == BFD_RELOC_386_PLT32
13995               || fixp->fx_r_type == BFD_RELOC_X86_64_PLT32)
13996           && symbol_section_p (fixp->fx_addsy))
13997         fixp->fx_r_type = BFD_RELOC_32_PCREL;
13998       if (!object_64bit)
13999         {
14000           if (fixp->fx_r_type == BFD_RELOC_386_GOT32
14001               && fixp->fx_tcbit2)
14002             fixp->fx_r_type = BFD_RELOC_386_GOT32X;
14003         }
14004     }
14005 #endif
14006 }
14007
14008 arelent *
14009 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
14010 {
14011   arelent *rel;
14012   bfd_reloc_code_real_type code;
14013
14014   switch (fixp->fx_r_type)
14015     {
14016 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14017     case BFD_RELOC_SIZE32:
14018     case BFD_RELOC_SIZE64:
14019       if (S_IS_DEFINED (fixp->fx_addsy)
14020           && !S_IS_EXTERNAL (fixp->fx_addsy))
14021         {
14022           /* Resolve size relocation against local symbol to size of
14023              the symbol plus addend.  */
14024           valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
14025           if (fixp->fx_r_type == BFD_RELOC_SIZE32
14026               && !fits_in_unsigned_long (value))
14027             as_bad_where (fixp->fx_file, fixp->fx_line,
14028                           _("symbol size computation overflow"));
14029           fixp->fx_addsy = NULL;
14030           fixp->fx_subsy = NULL;
14031           md_apply_fix (fixp, (valueT *) &value, NULL);
14032           return NULL;
14033         }
14034 #endif
14035       /* Fall through.  */
14036
14037     case BFD_RELOC_X86_64_PLT32:
14038     case BFD_RELOC_X86_64_GOT32:
14039     case BFD_RELOC_X86_64_GOTPCREL:
14040     case BFD_RELOC_X86_64_GOTPCRELX:
14041     case BFD_RELOC_X86_64_REX_GOTPCRELX:
14042     case BFD_RELOC_386_PLT32:
14043     case BFD_RELOC_386_GOT32:
14044     case BFD_RELOC_386_GOT32X:
14045     case BFD_RELOC_386_GOTOFF:
14046     case BFD_RELOC_386_GOTPC:
14047     case BFD_RELOC_386_TLS_GD:
14048     case BFD_RELOC_386_TLS_LDM:
14049     case BFD_RELOC_386_TLS_LDO_32:
14050     case BFD_RELOC_386_TLS_IE_32:
14051     case BFD_RELOC_386_TLS_IE:
14052     case BFD_RELOC_386_TLS_GOTIE:
14053     case BFD_RELOC_386_TLS_LE_32:
14054     case BFD_RELOC_386_TLS_LE:
14055     case BFD_RELOC_386_TLS_GOTDESC:
14056     case BFD_RELOC_386_TLS_DESC_CALL:
14057     case BFD_RELOC_X86_64_TLSGD:
14058     case BFD_RELOC_X86_64_TLSLD:
14059     case BFD_RELOC_X86_64_DTPOFF32:
14060     case BFD_RELOC_X86_64_DTPOFF64:
14061     case BFD_RELOC_X86_64_GOTTPOFF:
14062     case BFD_RELOC_X86_64_TPOFF32:
14063     case BFD_RELOC_X86_64_TPOFF64:
14064     case BFD_RELOC_X86_64_GOTOFF64:
14065     case BFD_RELOC_X86_64_GOTPC32:
14066     case BFD_RELOC_X86_64_GOT64:
14067     case BFD_RELOC_X86_64_GOTPCREL64:
14068     case BFD_RELOC_X86_64_GOTPC64:
14069     case BFD_RELOC_X86_64_GOTPLT64:
14070     case BFD_RELOC_X86_64_PLTOFF64:
14071     case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
14072     case BFD_RELOC_X86_64_TLSDESC_CALL:
14073     case BFD_RELOC_RVA:
14074     case BFD_RELOC_VTABLE_ENTRY:
14075     case BFD_RELOC_VTABLE_INHERIT:
14076 #ifdef TE_PE
14077     case BFD_RELOC_32_SECREL:
14078 #endif
14079       code = fixp->fx_r_type;
14080       break;
14081     case BFD_RELOC_X86_64_32S:
14082       if (!fixp->fx_pcrel)
14083         {
14084           /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32.  */
14085           code = fixp->fx_r_type;
14086           break;
14087         }
14088       /* Fall through.  */
14089     default:
14090       if (fixp->fx_pcrel)
14091         {
14092           switch (fixp->fx_size)
14093             {
14094             default:
14095               as_bad_where (fixp->fx_file, fixp->fx_line,
14096                             _("can not do %d byte pc-relative relocation"),
14097                             fixp->fx_size);
14098               code = BFD_RELOC_32_PCREL;
14099               break;
14100             case 1: code = BFD_RELOC_8_PCREL;  break;
14101             case 2: code = BFD_RELOC_16_PCREL; break;
14102             case 4: code = BFD_RELOC_32_PCREL; break;
14103 #ifdef BFD64
14104             case 8: code = BFD_RELOC_64_PCREL; break;
14105 #endif
14106             }
14107         }
14108       else
14109         {
14110           switch (fixp->fx_size)
14111             {
14112             default:
14113               as_bad_where (fixp->fx_file, fixp->fx_line,
14114                             _("can not do %d byte relocation"),
14115                             fixp->fx_size);
14116               code = BFD_RELOC_32;
14117               break;
14118             case 1: code = BFD_RELOC_8;  break;
14119             case 2: code = BFD_RELOC_16; break;
14120             case 4: code = BFD_RELOC_32; break;
14121 #ifdef BFD64
14122             case 8: code = BFD_RELOC_64; break;
14123 #endif
14124             }
14125         }
14126       break;
14127     }
14128
14129   if ((code == BFD_RELOC_32
14130        || code == BFD_RELOC_32_PCREL
14131        || code == BFD_RELOC_X86_64_32S)
14132       && GOT_symbol
14133       && fixp->fx_addsy == GOT_symbol)
14134     {
14135       if (!object_64bit)
14136         code = BFD_RELOC_386_GOTPC;
14137       else
14138         code = BFD_RELOC_X86_64_GOTPC32;
14139     }
14140   if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
14141       && GOT_symbol
14142       && fixp->fx_addsy == GOT_symbol)
14143     {
14144       code = BFD_RELOC_X86_64_GOTPC64;
14145     }
14146
14147   rel = XNEW (arelent);
14148   rel->sym_ptr_ptr = XNEW (asymbol *);
14149   *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
14150
14151   rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
14152
14153   if (!use_rela_relocations)
14154     {
14155       /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
14156          vtable entry to be used in the relocation's section offset.  */
14157       if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
14158         rel->address = fixp->fx_offset;
14159 #if defined (OBJ_COFF) && defined (TE_PE)
14160       else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
14161         rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
14162       else
14163 #endif
14164       rel->addend = 0;
14165     }
14166   /* Use the rela in 64bit mode.  */
14167   else
14168     {
14169       if (disallow_64bit_reloc)
14170         switch (code)
14171           {
14172           case BFD_RELOC_X86_64_DTPOFF64:
14173           case BFD_RELOC_X86_64_TPOFF64:
14174           case BFD_RELOC_64_PCREL:
14175           case BFD_RELOC_X86_64_GOTOFF64:
14176           case BFD_RELOC_X86_64_GOT64:
14177           case BFD_RELOC_X86_64_GOTPCREL64:
14178           case BFD_RELOC_X86_64_GOTPC64:
14179           case BFD_RELOC_X86_64_GOTPLT64:
14180           case BFD_RELOC_X86_64_PLTOFF64:
14181             as_bad_where (fixp->fx_file, fixp->fx_line,
14182                           _("cannot represent relocation type %s in x32 mode"),
14183                           bfd_get_reloc_code_name (code));
14184             break;
14185           default:
14186             break;
14187           }
14188
14189       if (!fixp->fx_pcrel)
14190         rel->addend = fixp->fx_offset;
14191       else
14192         switch (code)
14193           {
14194           case BFD_RELOC_X86_64_PLT32:
14195           case BFD_RELOC_X86_64_GOT32:
14196           case BFD_RELOC_X86_64_GOTPCREL:
14197           case BFD_RELOC_X86_64_GOTPCRELX:
14198           case BFD_RELOC_X86_64_REX_GOTPCRELX:
14199           case BFD_RELOC_X86_64_TLSGD:
14200           case BFD_RELOC_X86_64_TLSLD:
14201           case BFD_RELOC_X86_64_GOTTPOFF:
14202           case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
14203           case BFD_RELOC_X86_64_TLSDESC_CALL:
14204             rel->addend = fixp->fx_offset - fixp->fx_size;
14205             break;
14206           default:
14207             rel->addend = (section->vma
14208                            - fixp->fx_size
14209                            + fixp->fx_addnumber
14210                            + md_pcrel_from (fixp));
14211             break;
14212           }
14213     }
14214
14215   rel->howto = bfd_reloc_type_lookup (stdoutput, code);
14216   if (rel->howto == NULL)
14217     {
14218       as_bad_where (fixp->fx_file, fixp->fx_line,
14219                     _("cannot represent relocation type %s"),
14220                     bfd_get_reloc_code_name (code));
14221       /* Set howto to a garbage value so that we can keep going.  */
14222       rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
14223       gas_assert (rel->howto != NULL);
14224     }
14225
14226   return rel;
14227 }
14228
14229 #include "tc-i386-intel.c"
14230
14231 void
14232 tc_x86_parse_to_dw2regnum (expressionS *exp)
14233 {
14234   int saved_naked_reg;
14235   char saved_register_dot;
14236
14237   saved_naked_reg = allow_naked_reg;
14238   allow_naked_reg = 1;
14239   saved_register_dot = register_chars['.'];
14240   register_chars['.'] = '.';
14241   allow_pseudo_reg = 1;
14242   expression_and_evaluate (exp);
14243   allow_pseudo_reg = 0;
14244   register_chars['.'] = saved_register_dot;
14245   allow_naked_reg = saved_naked_reg;
14246
14247   if (exp->X_op == O_register && exp->X_add_number >= 0)
14248     {
14249       if ((addressT) exp->X_add_number < i386_regtab_size)
14250         {
14251           exp->X_op = O_constant;
14252           exp->X_add_number = i386_regtab[exp->X_add_number]
14253                               .dw2_regnum[flag_code >> 1];
14254         }
14255       else
14256         exp->X_op = O_illegal;
14257     }
14258 }
14259
14260 void
14261 tc_x86_frame_initial_instructions (void)
14262 {
14263   static unsigned int sp_regno[2];
14264
14265   if (!sp_regno[flag_code >> 1])
14266     {
14267       char *saved_input = input_line_pointer;
14268       char sp[][4] = {"esp", "rsp"};
14269       expressionS exp;
14270
14271       input_line_pointer = sp[flag_code >> 1];
14272       tc_x86_parse_to_dw2regnum (&exp);
14273       gas_assert (exp.X_op == O_constant);
14274       sp_regno[flag_code >> 1] = exp.X_add_number;
14275       input_line_pointer = saved_input;
14276     }
14277
14278   cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
14279   cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
14280 }
14281
14282 int
14283 x86_dwarf2_addr_size (void)
14284 {
14285 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
14286   if (x86_elf_abi == X86_64_X32_ABI)
14287     return 4;
14288 #endif
14289   return bfd_arch_bits_per_address (stdoutput) / 8;
14290 }
14291
14292 int
14293 i386_elf_section_type (const char *str, size_t len)
14294 {
14295   if (flag_code == CODE_64BIT
14296       && len == sizeof ("unwind") - 1
14297       && strncmp (str, "unwind", 6) == 0)
14298     return SHT_X86_64_UNWIND;
14299
14300   return -1;
14301 }
14302
14303 #ifdef TE_SOLARIS
14304 void
14305 i386_solaris_fix_up_eh_frame (segT sec)
14306 {
14307   if (flag_code == CODE_64BIT)
14308     elf_section_type (sec) = SHT_X86_64_UNWIND;
14309 }
14310 #endif
14311
14312 #ifdef TE_PE
14313 void
14314 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
14315 {
14316   expressionS exp;
14317
14318   exp.X_op = O_secrel;
14319   exp.X_add_symbol = symbol;
14320   exp.X_add_number = 0;
14321   emit_expr (&exp, size);
14322 }
14323 #endif
14324
14325 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14326 /* For ELF on x86-64, add support for SHF_X86_64_LARGE.  */
14327
14328 bfd_vma
14329 x86_64_section_letter (int letter, const char **ptr_msg)
14330 {
14331   if (flag_code == CODE_64BIT)
14332     {
14333       if (letter == 'l')
14334         return SHF_X86_64_LARGE;
14335
14336       *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
14337     }
14338   else
14339     *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
14340   return -1;
14341 }
14342
14343 bfd_vma
14344 x86_64_section_word (char *str, size_t len)
14345 {
14346   if (len == 5 && flag_code == CODE_64BIT && startswith (str, "large"))
14347     return SHF_X86_64_LARGE;
14348
14349   return -1;
14350 }
14351
14352 static void
14353 handle_large_common (int small ATTRIBUTE_UNUSED)
14354 {
14355   if (flag_code != CODE_64BIT)
14356     {
14357       s_comm_internal (0, elf_common_parse);
14358       as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
14359     }
14360   else
14361     {
14362       static segT lbss_section;
14363       asection *saved_com_section_ptr = elf_com_section_ptr;
14364       asection *saved_bss_section = bss_section;
14365
14366       if (lbss_section == NULL)
14367         {
14368           flagword applicable;
14369           segT seg = now_seg;
14370           subsegT subseg = now_subseg;
14371
14372           /* The .lbss section is for local .largecomm symbols.  */
14373           lbss_section = subseg_new (".lbss", 0);
14374           applicable = bfd_applicable_section_flags (stdoutput);
14375           bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
14376           seg_info (lbss_section)->bss = 1;
14377
14378           subseg_set (seg, subseg);
14379         }
14380
14381       elf_com_section_ptr = &_bfd_elf_large_com_section;
14382       bss_section = lbss_section;
14383
14384       s_comm_internal (0, elf_common_parse);
14385
14386       elf_com_section_ptr = saved_com_section_ptr;
14387       bss_section = saved_bss_section;
14388     }
14389 }
14390 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */