gas/config/tc-i386.c

   1 /* tc-i386.c -- Assemble code for the Intel 80386
   2    Copyright (C) 1989-2020 Free Software Foundation, Inc.
   3
   4    This file is part of GAS, the GNU Assembler.
   5
   6    GAS is free software; you can redistribute it and/or modify
   7    it under the terms of the GNU General Public License as published by
   8    the Free Software Foundation; either version 3, or (at your option)
   9    any later version.
  10
  11    GAS is distributed in the hope that it will be useful,
  12    but WITHOUT ANY WARRANTY; without even the implied warranty of
  13    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  14    GNU General Public License for more details.
  15
  16    You should have received a copy of the GNU General Public License
  17    along with GAS; see the file COPYING.  If not, write to the Free
  18    Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
  19    02110-1301, USA.  */
  20
  21 /* Intel 80386 machine specific gas.
  22    Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
  23    x86_64 support by Jan Hubicka (jh@suse.cz)
  24    VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
  25    Bugs & suggestions are completely welcome.  This is free software.
  26    Please help us make it better.  */
  27
  28 #include "as.h"
  29 #include "safe-ctype.h"
  30 #include "subsegs.h"
  31 #include "dwarf2dbg.h"
  32 #include "dw2gencfi.h"
  33 #include "elf/x86-64.h"
  34 #include "opcodes/i386-init.h"
  35
  36 #ifdef HAVE_LIMITS_H
  37 #include <limits.h>
  38 #else
  39 #ifdef HAVE_SYS_PARAM_H
  40 #include <sys/param.h>
  41 #endif
  42 #ifndef INT_MAX
  43 #define INT_MAX (int) (((unsigned) (-1)) >> 1)
  44 #endif
  45 #endif
  46
  47 #ifndef INFER_ADDR_PREFIX
  48 #define INFER_ADDR_PREFIX 1
  49 #endif
  50
  51 #ifndef DEFAULT_ARCH
  52 #define DEFAULT_ARCH "i386"
  53 #endif
  54
  55 #ifndef INLINE
  56 #if __GNUC__ >= 2
  57 #define INLINE __inline__
  58 #else
  59 #define INLINE
  60 #endif
  61 #endif
  62
  63 /* Prefixes will be emitted in the order defined below.
  64    WAIT_PREFIX must be the first prefix since FWAIT is really is an
  65    instruction, and so must come before any prefixes.
  66    The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
  67    REP_PREFIX/HLE_PREFIX, LOCK_PREFIX.  */
  68 #define WAIT_PREFIX     0
  69 #define SEG_PREFIX      1
  70 #define ADDR_PREFIX     2
  71 #define DATA_PREFIX     3
  72 #define REP_PREFIX      4
  73 #define HLE_PREFIX      REP_PREFIX
  74 #define BND_PREFIX      REP_PREFIX
  75 #define LOCK_PREFIX     5
  76 #define REX_PREFIX      6       /* must come last.  */
  77 #define MAX_PREFIXES    7       /* max prefixes per opcode */
  78
  79 /* we define the syntax here (modulo base,index,scale syntax) */
  80 #define REGISTER_PREFIX '%'
  81 #define IMMEDIATE_PREFIX '$'
  82 #define ABSOLUTE_PREFIX '*'
  83
  84 /* these are the instruction mnemonic suffixes in AT&T syntax or
  85    memory operand size in Intel syntax.  */
  86 #define WORD_MNEM_SUFFIX  'w'
  87 #define BYTE_MNEM_SUFFIX  'b'
  88 #define SHORT_MNEM_SUFFIX 's'
  89 #define LONG_MNEM_SUFFIX  'l'
  90 #define QWORD_MNEM_SUFFIX  'q'
  91 /* Intel Syntax.  Use a non-ascii letter since since it never appears
  92    in instructions.  */
  93 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
  94
  95 #define END_OF_INSN '\0'
  96
  97 /* This matches the C -> StaticRounding alias in the opcode table.  */
  98 #define commutative staticrounding
  99
 100 /*
 101   'templates' is for grouping together 'template' structures for opcodes
 102   of the same name.  This is only used for storing the insns in the grand
 103   ole hash table of insns.
 104   The templates themselves start at START and range up to (but not including)
 105   END.
 106   */
 107 typedef struct
 108 {
 109   const insn_template *start;
 110   const insn_template *end;
 111 }
 112 templates;
 113
 114 /* 386 operand encoding bytes:  see 386 book for details of this.  */
 115 typedef struct
 116 {
 117   unsigned int regmem;  /* codes register or memory operand */
 118   unsigned int reg;     /* codes register operand (or extended opcode) */
 119   unsigned int mode;    /* how to interpret regmem & reg */
 120 }
 121 modrm_byte;
 122
 123 /* x86-64 extension prefix.  */
 124 typedef int rex_byte;
 125
 126 /* 386 opcode byte to code indirect addressing.  */
 127 typedef struct
 128 {
 129   unsigned base;
 130   unsigned index;
 131   unsigned scale;
 132 }
 133 sib_byte;
 134
 135 /* x86 arch names, types and features */
 136 typedef struct
 137 {
 138   const char *name;             /* arch name */
 139   unsigned int len;             /* arch string length */
 140   enum processor_type type;     /* arch type */
 141   i386_cpu_flags flags;         /* cpu feature flags */
 142   unsigned int skip;            /* show_arch should skip this. */
 143 }
 144 arch_entry;
 145
 146 /* Used to turn off indicated flags.  */
 147 typedef struct
 148 {
 149   const char *name;             /* arch name */
 150   unsigned int len;             /* arch string length */
 151   i386_cpu_flags flags;         /* cpu feature flags */
 152 }
 153 noarch_entry;
 154
 155 static void update_code_flag (int, int);
 156 static void set_code_flag (int);
 157 static void set_16bit_gcc_code_flag (int);
 158 static void set_intel_syntax (int);
 159 static void set_intel_mnemonic (int);
 160 static void set_allow_index_reg (int);
 161 static void set_check (int);
 162 static void set_cpu_arch (int);
 163 #ifdef TE_PE
 164 static void pe_directive_secrel (int);
 165 #endif
 166 static void signed_cons (int);
 167 static char *output_invalid (int c);
 168 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
 169                                     const char *);
 170 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
 171                                        const char *);
 172 static int i386_att_operand (char *);
 173 static int i386_intel_operand (char *, int);
 174 static int i386_intel_simplify (expressionS *);
 175 static int i386_intel_parse_name (const char *, expressionS *);
 176 static const reg_entry *parse_register (char *, char **);
 177 static char *parse_insn (char *, char *);
 178 static char *parse_operands (char *, const char *);
 179 static void swap_operands (void);
 180 static void swap_2_operands (int, int);
 181 static enum flag_code i386_addressing_mode (void);
 182 static void optimize_imm (void);
 183 static void optimize_disp (void);
 184 static const insn_template *match_template (char);
 185 static int check_string (void);
 186 static int process_suffix (void);
 187 static int check_byte_reg (void);
 188 static int check_long_reg (void);
 189 static int check_qword_reg (void);
 190 static int check_word_reg (void);
 191 static int finalize_imm (void);
 192 static int process_operands (void);
 193 static const seg_entry *build_modrm_byte (void);
 194 static void output_insn (void);
 195 static void output_imm (fragS *, offsetT);
 196 static void output_disp (fragS *, offsetT);
 197 #ifndef I386COFF
 198 static void s_bss (int);
 199 #endif
 200 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
 201 static void handle_large_common (int small ATTRIBUTE_UNUSED);
 202
 203 /* GNU_PROPERTY_X86_ISA_1_USED.  */
 204 static unsigned int x86_isa_1_used;
 205 /* GNU_PROPERTY_X86_FEATURE_2_USED.  */
 206 static unsigned int x86_feature_2_used;
 207 /* Generate x86 used ISA and feature properties.  */
 208 static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
 209 #endif
 210
 211 static const char *default_arch = DEFAULT_ARCH;
 212
 213 /* This struct describes rounding control and SAE in the instruction.  */
 214 struct RC_Operation
 215 {
 216   enum rc_type
 217     {
 218       rne = 0,
 219       rd,
 220       ru,
 221       rz,
 222       saeonly
 223     } type;
 224   int operand;
 225 };
 226
 227 static struct RC_Operation rc_op;
 228
 229 /* The struct describes masking, applied to OPERAND in the instruction.
 230    MASK is a pointer to the corresponding mask register.  ZEROING tells
 231    whether merging or zeroing mask is used.  */
 232 struct Mask_Operation
 233 {
 234   const reg_entry *mask;
 235   unsigned int zeroing;
 236   /* The operand where this operation is associated.  */
 237   int operand;
 238 };
 239
 240 static struct Mask_Operation mask_op;
 241
 242 /* The struct describes broadcasting, applied to OPERAND.  FACTOR is
 243    broadcast factor.  */
 244 struct Broadcast_Operation
 245 {
 246   /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}.  */
 247   int type;
 248
 249   /* Index of broadcasted operand.  */
 250   int operand;
 251
 252   /* Number of bytes to broadcast.  */
 253   int bytes;
 254 };
 255
 256 static struct Broadcast_Operation broadcast_op;
 257
 258 /* VEX prefix.  */
 259 typedef struct
 260 {
 261   /* VEX prefix is either 2 byte or 3 byte.  EVEX is 4 byte.  */
 262   unsigned char bytes[4];
 263   unsigned int length;
 264   /* Destination or source register specifier.  */
 265   const reg_entry *register_specifier;
 266 } vex_prefix;
 267
 268 /* 'md_assemble ()' gathers together information and puts it into a
 269    i386_insn.  */
 270
 271 union i386_op
 272   {
 273     expressionS *disps;
 274     expressionS *imms;
 275     const reg_entry *regs;
 276   };
 277
 278 enum i386_error
 279   {
 280     operand_size_mismatch,
 281     operand_type_mismatch,
 282     register_type_mismatch,
 283     number_of_operands_mismatch,
 284     invalid_instruction_suffix,
 285     bad_imm4,
 286     unsupported_with_intel_mnemonic,
 287     unsupported_syntax,
 288     unsupported,
 289     invalid_vsib_address,
 290     invalid_vector_register_set,
 291     unsupported_vector_index_register,
 292     unsupported_broadcast,
 293     broadcast_needed,
 294     unsupported_masking,
 295     mask_not_on_destination,
 296     no_default_mask,
 297     unsupported_rc_sae,
 298     rc_sae_operand_not_last_imm,
 299     invalid_register_operand,
 300   };
 301
 302 struct _i386_insn
 303   {
 304     /* TM holds the template for the insn were currently assembling.  */
 305     insn_template tm;
 306
 307     /* SUFFIX holds the instruction size suffix for byte, word, dword
 308        or qword, if given.  */
 309     char suffix;
 310
 311     /* OPERANDS gives the number of given operands.  */
 312     unsigned int operands;
 313
 314     /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
 315        of given register, displacement, memory operands and immediate
 316        operands.  */
 317     unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
 318
 319     /* TYPES [i] is the type (see above #defines) which tells us how to
 320        use OP[i] for the corresponding operand.  */
 321     i386_operand_type types[MAX_OPERANDS];
 322
 323     /* Displacement expression, immediate expression, or register for each
 324        operand.  */
 325     union i386_op op[MAX_OPERANDS];
 326
 327     /* Flags for operands.  */
 328     unsigned int flags[MAX_OPERANDS];
 329 #define Operand_PCrel 1
 330 #define Operand_Mem   2
 331
 332     /* Relocation type for operand */
 333     enum bfd_reloc_code_real reloc[MAX_OPERANDS];
 334
 335     /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
 336        the base index byte below.  */
 337     const reg_entry *base_reg;
 338     const reg_entry *index_reg;
 339     unsigned int log2_scale_factor;
 340
 341     /* SEG gives the seg_entries of this insn.  They are zero unless
 342        explicit segment overrides are given.  */
 343     const seg_entry *seg[2];
 344
 345     /* Copied first memory operand string, for re-checking.  */
 346     char *memop1_string;
 347
 348     /* PREFIX holds all the given prefix opcodes (usually null).
 349        PREFIXES is the number of prefix opcodes.  */
 350     unsigned int prefixes;
 351     unsigned char prefix[MAX_PREFIXES];
 352
 353     /* Register is in low 3 bits of opcode.  */
 354     bfd_boolean short_form;
 355
 356     /* The operand to a branch insn indicates an absolute branch.  */
 357     bfd_boolean jumpabsolute;
 358
 359     /* Has MMX register operands.  */
 360     bfd_boolean has_regmmx;
 361
 362     /* Has XMM register operands.  */
 363     bfd_boolean has_regxmm;
 364
 365     /* Has YMM register operands.  */
 366     bfd_boolean has_regymm;
 367
 368     /* Has ZMM register operands.  */
 369     bfd_boolean has_regzmm;
 370
 371     /* Has GOTPC or TLS relocation.  */
 372     bfd_boolean has_gotpc_tls_reloc;
 373
 374     /* RM and SIB are the modrm byte and the sib byte where the
 375        addressing modes of this insn are encoded.  */
 376     modrm_byte rm;
 377     rex_byte rex;
 378     rex_byte vrex;
 379     sib_byte sib;
 380     vex_prefix vex;
 381
 382     /* Masking attributes.  */
 383     struct Mask_Operation *mask;
 384
 385     /* Rounding control and SAE attributes.  */
 386     struct RC_Operation *rounding;
 387
 388     /* Broadcasting attributes.  */
 389     struct Broadcast_Operation *broadcast;
 390
 391     /* Compressed disp8*N attribute.  */
 392     unsigned int memshift;
 393
 394     /* Prefer load or store in encoding.  */
 395     enum
 396       {
 397         dir_encoding_default = 0,
 398         dir_encoding_load,
 399         dir_encoding_store,
 400         dir_encoding_swap
 401       } dir_encoding;
 402
 403     /* Prefer 8bit or 32bit displacement in encoding.  */
 404     enum
 405       {
 406         disp_encoding_default = 0,
 407         disp_encoding_8bit,
 408         disp_encoding_32bit
 409       } disp_encoding;
 410
 411     /* Prefer the REX byte in encoding.  */
 412     bfd_boolean rex_encoding;
 413
 414     /* Disable instruction size optimization.  */
 415     bfd_boolean no_optimize;
 416
 417     /* How to encode vector instructions.  */
 418     enum
 419       {
 420         vex_encoding_default = 0,
 421         vex_encoding_vex,
 422         vex_encoding_vex3,
 423         vex_encoding_evex
 424       } vec_encoding;
 425
 426     /* REP prefix.  */
 427     const char *rep_prefix;
 428
 429     /* HLE prefix.  */
 430     const char *hle_prefix;
 431
 432     /* Have BND prefix.  */
 433     const char *bnd_prefix;
 434
 435     /* Have NOTRACK prefix.  */
 436     const char *notrack_prefix;
 437
 438     /* Error message.  */
 439     enum i386_error error;
 440   };
 441
 442 typedef struct _i386_insn i386_insn;
 443
 444 /* Link RC type with corresponding string, that'll be looked for in
 445    asm.  */
 446 struct RC_name
 447 {
 448   enum rc_type type;
 449   const char *name;
 450   unsigned int len;
 451 };
 452
 453 static const struct RC_name RC_NamesTable[] =
 454 {
 455   {  rne, STRING_COMMA_LEN ("rn-sae") },
 456   {  rd,  STRING_COMMA_LEN ("rd-sae") },
 457   {  ru,  STRING_COMMA_LEN ("ru-sae") },
 458   {  rz,  STRING_COMMA_LEN ("rz-sae") },
 459   {  saeonly,  STRING_COMMA_LEN ("sae") },
 460 };
 461
 462 /* List of chars besides those in app.c:symbol_chars that can start an
 463    operand.  Used to prevent the scrubber eating vital white-space.  */
 464 const char extra_symbol_chars[] = "*%-([{}"
 465 #ifdef LEX_AT
 466         "@"
 467 #endif
 468 #ifdef LEX_QM
 469         "?"
 470 #endif
 471         ;
 472
 473 #if (defined (TE_I386AIX)                               \
 474      || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
 475          && !defined (TE_GNU)                           \
 476          && !defined (TE_LINUX)                         \
 477          && !defined (TE_NACL)                          \
 478          && !defined (TE_FreeBSD)                       \
 479          && !defined (TE_DragonFly)                     \
 480          && !defined (TE_NetBSD)))
 481 /* This array holds the chars that always start a comment.  If the
 482    pre-processor is disabled, these aren't very useful.  The option
 483    --divide will remove '/' from this list.  */
 484 const char *i386_comment_chars = "#/";
 485 #define SVR4_COMMENT_CHARS 1
 486 #define PREFIX_SEPARATOR '\\'
 487
 488 #else
 489 const char *i386_comment_chars = "#";
 490 #define PREFIX_SEPARATOR '/'
 491 #endif
 492
 493 /* This array holds the chars that only start a comment at the beginning of
 494    a line.  If the line seems to have the form '# 123 filename'
 495    .line and .file directives will appear in the pre-processed output.
 496    Note that input_file.c hand checks for '#' at the beginning of the
 497    first line of the input file.  This is because the compiler outputs
 498    #NO_APP at the beginning of its output.
 499    Also note that comments started like this one will always work if
 500    '/' isn't otherwise defined.  */
 501 const char line_comment_chars[] = "#/";
 502
 503 const char line_separator_chars[] = ";";
 504
 505 /* Chars that can be used to separate mant from exp in floating point
 506    nums.  */
 507 const char EXP_CHARS[] = "eE";
 508
 509 /* Chars that mean this number is a floating point constant
 510    As in 0f12.456
 511    or    0d1.2345e12.  */
 512 const char FLT_CHARS[] = "fFdDxX";
 513
 514 /* Tables for lexical analysis.  */
 515 static char mnemonic_chars[256];
 516 static char register_chars[256];
 517 static char operand_chars[256];
 518 static char identifier_chars[256];
 519 static char digit_chars[256];
 520
 521 /* Lexical macros.  */
 522 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
 523 #define is_operand_char(x) (operand_chars[(unsigned char) x])
 524 #define is_register_char(x) (register_chars[(unsigned char) x])
 525 #define is_space_char(x) ((x) == ' ')
 526 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
 527 #define is_digit_char(x) (digit_chars[(unsigned char) x])
 528
 529 /* All non-digit non-letter characters that may occur in an operand.  */
 530 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
 531
 532 /* md_assemble() always leaves the strings it's passed unaltered.  To
 533    effect this we maintain a stack of saved characters that we've smashed
 534    with '\0's (indicating end of strings for various sub-fields of the
 535    assembler instruction).  */
 536 static char save_stack[32];
 537 static char *save_stack_p;
 538 #define END_STRING_AND_SAVE(s) \
 539         do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
 540 #define RESTORE_END_STRING(s) \
 541         do { *(s) = *--save_stack_p; } while (0)
 542
 543 /* The instruction we're assembling.  */
 544 static i386_insn i;
 545
 546 /* Possible templates for current insn.  */
 547 static const templates *current_templates;
 548
 549 /* Per instruction expressionS buffers: max displacements & immediates.  */
 550 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
 551 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
 552
 553 /* Current operand we are working on.  */
 554 static int this_operand = -1;
 555
 556 /* We support four different modes.  FLAG_CODE variable is used to distinguish
 557    these.  */
 558
 559 enum flag_code {
 560         CODE_32BIT,
 561         CODE_16BIT,
 562         CODE_64BIT };
 563
 564 static enum flag_code flag_code;
 565 static unsigned int object_64bit;
 566 static unsigned int disallow_64bit_reloc;
 567 static int use_rela_relocations = 0;
 568 /* __tls_get_addr/___tls_get_addr symbol for TLS.  */
 569 static const char *tls_get_addr;
 570
 571 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
 572      || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
 573      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
 574
 575 /* The ELF ABI to use.  */
 576 enum x86_elf_abi
 577 {
 578   I386_ABI,
 579   X86_64_ABI,
 580   X86_64_X32_ABI
 581 };
 582
 583 static enum x86_elf_abi x86_elf_abi = I386_ABI;
 584 #endif
 585
 586 #if defined (TE_PE) || defined (TE_PEP)
 587 /* Use big object file format.  */
 588 static int use_big_obj = 0;
 589 #endif
 590
 591 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
 592 /* 1 if generating code for a shared library.  */
 593 static int shared = 0;
 594 #endif
 595
 596 /* 1 for intel syntax,
 597    0 if att syntax.  */
 598 static int intel_syntax = 0;
 599
 600 static enum x86_64_isa
 601 {
 602   amd64 = 1,    /* AMD64 ISA.  */
 603   intel64       /* Intel64 ISA.  */
 604 } isa64;
 605
 606 /* 1 for intel mnemonic,
 607    0 if att mnemonic.  */
 608 static int intel_mnemonic = !SYSV386_COMPAT;
 609
 610 /* 1 if pseudo registers are permitted.  */
 611 static int allow_pseudo_reg = 0;
 612
 613 /* 1 if register prefix % not required.  */
 614 static int allow_naked_reg = 0;
 615
 616 /* 1 if the assembler should add BND prefix for all control-transferring
 617    instructions supporting it, even if this prefix wasn't specified
 618    explicitly.  */
 619 static int add_bnd_prefix = 0;
 620
 621 /* 1 if pseudo index register, eiz/riz, is allowed .  */
 622 static int allow_index_reg = 0;
 623
 624 /* 1 if the assembler should ignore LOCK prefix, even if it was
 625    specified explicitly.  */
 626 static int omit_lock_prefix = 0;
 627
 628 /* 1 if the assembler should encode lfence, mfence, and sfence as
 629    "lock addl $0, (%{re}sp)".  */
 630 static int avoid_fence = 0;
 631
 632 /* Type of the previous instruction.  */
 633 static struct
 634   {
 635     segT seg;
 636     const char *file;
 637     const char *name;
 638     unsigned int line;
 639     enum last_insn_kind
 640       {
 641         last_insn_other = 0,
 642         last_insn_directive,
 643         last_insn_prefix
 644       } kind;
 645   } last_insn;
 646
 647 /* 1 if the assembler should generate relax relocations.  */
 648
 649 static int generate_relax_relocations
 650   = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
 651
 652 static enum check_kind
 653   {
 654     check_none = 0,
 655     check_warning,
 656     check_error
 657   }
 658 sse_check, operand_check = check_warning;
 659
 660 /* Non-zero if branches should be aligned within power of 2 boundary.  */
 661 static int align_branch_power = 0;
 662
 663 /* Types of branches to align.  */
 664 enum align_branch_kind
 665   {
 666     align_branch_none = 0,
 667     align_branch_jcc = 1,
 668     align_branch_fused = 2,
 669     align_branch_jmp = 3,
 670     align_branch_call = 4,
 671     align_branch_indirect = 5,
 672     align_branch_ret = 6
 673   };
 674
 675 /* Type bits of branches to align.  */
 676 enum align_branch_bit
 677   {
 678     align_branch_jcc_bit = 1 << align_branch_jcc,
 679     align_branch_fused_bit = 1 << align_branch_fused,
 680     align_branch_jmp_bit = 1 << align_branch_jmp,
 681     align_branch_call_bit = 1 << align_branch_call,
 682     align_branch_indirect_bit = 1 << align_branch_indirect,
 683     align_branch_ret_bit = 1 << align_branch_ret
 684   };
 685
 686 static unsigned int align_branch = (align_branch_jcc_bit
 687                                     | align_branch_fused_bit
 688                                     | align_branch_jmp_bit);
 689
 690 /* The maximum padding size for fused jcc.  CMP like instruction can
 691    be 9 bytes and jcc can be 6 bytes.  Leave room just in case for
 692    prefixes.   */
 693 #define MAX_FUSED_JCC_PADDING_SIZE 20
 694
 695 /* The maximum number of prefixes added for an instruction.  */
 696 static unsigned int align_branch_prefix_size = 5;
 697
 698 /* Optimization:
 699    1. Clear the REX_W bit with register operand if possible.
 700    2. Above plus use 128bit vector instruction to clear the full vector
 701       register.
 702  */
 703 static int optimize = 0;
 704
 705 /* Optimization:
 706    1. Clear the REX_W bit with register operand if possible.
 707    2. Above plus use 128bit vector instruction to clear the full vector
 708       register.
 709    3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
 710       "testb $imm7,%r8".
 711  */
 712 static int optimize_for_space = 0;
 713
 714 /* Register prefix used for error message.  */
 715 static const char *register_prefix = "%";
 716
 717 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
 718    leave, push, and pop instructions so that gcc has the same stack
 719    frame as in 32 bit mode.  */
 720 static char stackop_size = '\0';
 721
 722 /* Non-zero to optimize code alignment.  */
 723 int optimize_align_code = 1;
 724
 725 /* Non-zero to quieten some warnings.  */
 726 static int quiet_warnings = 0;
 727
 728 /* CPU name.  */
 729 static const char *cpu_arch_name = NULL;
 730 static char *cpu_sub_arch_name = NULL;
 731
 732 /* CPU feature flags.  */
 733 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
 734
 735 /* If we have selected a cpu we are generating instructions for.  */
 736 static int cpu_arch_tune_set = 0;
 737
 738 /* Cpu we are generating instructions for.  */
 739 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
 740
 741 /* CPU feature flags of cpu we are generating instructions for.  */
 742 static i386_cpu_flags cpu_arch_tune_flags;
 743
 744 /* CPU instruction set architecture used.  */
 745 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
 746
 747 /* CPU feature flags of instruction set architecture used.  */
 748 i386_cpu_flags cpu_arch_isa_flags;
 749
 750 /* If set, conditional jumps are not automatically promoted to handle
 751    larger than a byte offset.  */
 752 static unsigned int no_cond_jump_promotion = 0;
 753
 754 /* Encode SSE instructions with VEX prefix.  */
 755 static unsigned int sse2avx;
 756
 757 /* Encode scalar AVX instructions with specific vector length.  */
 758 static enum
 759   {
 760     vex128 = 0,
 761     vex256
 762   } avxscalar;
 763
 764 /* Encode VEX WIG instructions with specific vex.w.  */
 765 static enum
 766   {
 767     vexw0 = 0,
 768     vexw1
 769   } vexwig;
 770
 771 /* Encode scalar EVEX LIG instructions with specific vector length.  */
 772 static enum
 773   {
 774     evexl128 = 0,
 775     evexl256,
 776     evexl512
 777   } evexlig;
 778
 779 /* Encode EVEX WIG instructions with specific evex.w.  */
 780 static enum
 781   {
 782     evexw0 = 0,
 783     evexw1
 784   } evexwig;
 785
 786 /* Value to encode in EVEX RC bits, for SAE-only instructions.  */
 787 static enum rc_type evexrcig = rne;
 788
 789 /* Pre-defined "_GLOBAL_OFFSET_TABLE_".  */
 790 static symbolS *GOT_symbol;
 791
 792 /* The dwarf2 return column, adjusted for 32 or 64 bit.  */
 793 unsigned int x86_dwarf2_return_column;
 794
 795 /* The dwarf2 data alignment, adjusted for 32 or 64 bit.  */
 796 int x86_cie_data_alignment;
 797
 798 /* Interface to relax_segment.
 799    There are 3 major relax states for 386 jump insns because the
 800    different types of jumps add different sizes to frags when we're
 801    figuring out what sort of jump to choose to reach a given label.
 802
 803    BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
 804    branches which are handled by md_estimate_size_before_relax() and
 805    i386_generic_table_relax_frag().  */
 806
 807 /* Types.  */
 808 #define UNCOND_JUMP 0
 809 #define COND_JUMP 1
 810 #define COND_JUMP86 2
 811 #define BRANCH_PADDING 3
 812 #define BRANCH_PREFIX 4
 813 #define FUSED_JCC_PADDING 5
 814
 815 /* Sizes.  */
 816 #define CODE16  1
 817 #define SMALL   0
 818 #define SMALL16 (SMALL | CODE16)
 819 #define BIG     2
 820 #define BIG16   (BIG | CODE16)
 821
 822 #ifndef INLINE
 823 #ifdef __GNUC__
 824 #define INLINE __inline__
 825 #else
 826 #define INLINE
 827 #endif
 828 #endif
 829
 830 #define ENCODE_RELAX_STATE(type, size) \
 831   ((relax_substateT) (((type) << 2) | (size)))
 832 #define TYPE_FROM_RELAX_STATE(s) \
 833   ((s) >> 2)
 834 #define DISP_SIZE_FROM_RELAX_STATE(s) \
 835     ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
 836
 837 /* This table is used by relax_frag to promote short jumps to long
 838    ones where necessary.  SMALL (short) jumps may be promoted to BIG
 839    (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long).  We
 840    don't allow a short jump in a 32 bit code segment to be promoted to
 841    a 16 bit offset jump because it's slower (requires data size
 842    prefix), and doesn't work, unless the destination is in the bottom
 843    64k of the code segment (The top 16 bits of eip are zeroed).  */
 844
 845 const relax_typeS md_relax_table[] =
 846 {
 847   /* The fields are:
 848      1) most positive reach of this state,
 849      2) most negative reach of this state,
 850      3) how many bytes this mode will have in the variable part of the frag
 851      4) which index into the table to try if we can't fit into this one.  */
 852
 853   /* UNCOND_JUMP states.  */
 854   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
 855   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
 856   /* dword jmp adds 4 bytes to frag:
 857      0 extra opcode bytes, 4 displacement bytes.  */
 858   {0, 0, 4, 0},
 859   /* word jmp adds 2 byte2 to frag:
 860      0 extra opcode bytes, 2 displacement bytes.  */
 861   {0, 0, 2, 0},
 862
 863   /* COND_JUMP states.  */
 864   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
 865   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
 866   /* dword conditionals adds 5 bytes to frag:
 867      1 extra opcode byte, 4 displacement bytes.  */
 868   {0, 0, 5, 0},
 869   /* word conditionals add 3 bytes to frag:
 870      1 extra opcode byte, 2 displacement bytes.  */
 871   {0, 0, 3, 0},
 872
 873   /* COND_JUMP86 states.  */
 874   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
 875   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
 876   /* dword conditionals adds 5 bytes to frag:
 877      1 extra opcode byte, 4 displacement bytes.  */
 878   {0, 0, 5, 0},
 879   /* word conditionals add 4 bytes to frag:
 880      1 displacement byte and a 3 byte long branch insn.  */
 881   {0, 0, 4, 0}
 882 };
 883
 884 static const arch_entry cpu_arch[] =
 885 {
 886   /* Do not replace the first two entries - i386_target_format()
 887      relies on them being there in this order.  */
 888   { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
 889     CPU_GENERIC32_FLAGS, 0 },
 890   { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
 891     CPU_GENERIC64_FLAGS, 0 },
 892   { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
 893     CPU_NONE_FLAGS, 0 },
 894   { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
 895     CPU_I186_FLAGS, 0 },
 896   { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
 897     CPU_I286_FLAGS, 0 },
 898   { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
 899     CPU_I386_FLAGS, 0 },
 900   { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
 901     CPU_I486_FLAGS, 0 },
 902   { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
 903     CPU_I586_FLAGS, 0 },
 904   { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
 905     CPU_I686_FLAGS, 0 },
 906   { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
 907     CPU_I586_FLAGS, 0 },
 908   { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
 909     CPU_PENTIUMPRO_FLAGS, 0 },
 910   { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
 911     CPU_P2_FLAGS, 0 },
 912   { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
 913     CPU_P3_FLAGS, 0 },
 914   { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
 915     CPU_P4_FLAGS, 0 },
 916   { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
 917     CPU_CORE_FLAGS, 0 },
 918   { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
 919     CPU_NOCONA_FLAGS, 0 },
 920   { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
 921     CPU_CORE_FLAGS, 1 },
 922   { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
 923     CPU_CORE_FLAGS, 0 },
 924   { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
 925     CPU_CORE2_FLAGS, 1 },
 926   { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
 927     CPU_CORE2_FLAGS, 0 },
 928   { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
 929     CPU_COREI7_FLAGS, 0 },
 930   { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
 931     CPU_L1OM_FLAGS, 0 },
 932   { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
 933     CPU_K1OM_FLAGS, 0 },
 934   { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
 935     CPU_IAMCU_FLAGS, 0 },
 936   { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
 937     CPU_K6_FLAGS, 0 },
 938   { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
 939     CPU_K6_2_FLAGS, 0 },
 940   { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
 941     CPU_ATHLON_FLAGS, 0 },
 942   { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
 943     CPU_K8_FLAGS, 1 },
 944   { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
 945     CPU_K8_FLAGS, 0 },
 946   { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
 947     CPU_K8_FLAGS, 0 },
 948   { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
 949     CPU_AMDFAM10_FLAGS, 0 },
 950   { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
 951     CPU_BDVER1_FLAGS, 0 },
 952   { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
 953     CPU_BDVER2_FLAGS, 0 },
 954   { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
 955     CPU_BDVER3_FLAGS, 0 },
 956   { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
 957     CPU_BDVER4_FLAGS, 0 },
 958   { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
 959     CPU_ZNVER1_FLAGS, 0 },
 960   { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
 961     CPU_ZNVER2_FLAGS, 0 },
 962   { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
 963     CPU_BTVER1_FLAGS, 0 },
 964   { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
 965     CPU_BTVER2_FLAGS, 0 },
 966   { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
 967     CPU_8087_FLAGS, 0 },
 968   { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
 969     CPU_287_FLAGS, 0 },
 970   { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
 971     CPU_387_FLAGS, 0 },
 972   { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
 973     CPU_687_FLAGS, 0 },
 974   { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
 975     CPU_CMOV_FLAGS, 0 },
 976   { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
 977     CPU_FXSR_FLAGS, 0 },
 978   { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
 979     CPU_MMX_FLAGS, 0 },
 980   { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
 981     CPU_SSE_FLAGS, 0 },
 982   { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
 983     CPU_SSE2_FLAGS, 0 },
 984   { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
 985     CPU_SSE3_FLAGS, 0 },
 986   { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
 987     CPU_SSSE3_FLAGS, 0 },
 988   { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
 989     CPU_SSE4_1_FLAGS, 0 },
 990   { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
 991     CPU_SSE4_2_FLAGS, 0 },
 992   { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
 993     CPU_SSE4_2_FLAGS, 0 },
 994   { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
 995     CPU_AVX_FLAGS, 0 },
 996   { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
 997     CPU_AVX2_FLAGS, 0 },
 998   { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
 999     CPU_AVX512F_FLAGS, 0 },
1000   { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
1001     CPU_AVX512CD_FLAGS, 0 },
1002   { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
1003     CPU_AVX512ER_FLAGS, 0 },
1004   { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
1005     CPU_AVX512PF_FLAGS, 0 },
1006   { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
1007     CPU_AVX512DQ_FLAGS, 0 },
1008   { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
1009     CPU_AVX512BW_FLAGS, 0 },
1010   { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
1011     CPU_AVX512VL_FLAGS, 0 },
1012   { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
1013     CPU_VMX_FLAGS, 0 },
1014   { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
1015     CPU_VMFUNC_FLAGS, 0 },
1016   { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
1017     CPU_SMX_FLAGS, 0 },
1018   { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
1019     CPU_XSAVE_FLAGS, 0 },
1020   { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
1021     CPU_XSAVEOPT_FLAGS, 0 },
1022   { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
1023     CPU_XSAVEC_FLAGS, 0 },
1024   { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
1025     CPU_XSAVES_FLAGS, 0 },
1026   { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
1027     CPU_AES_FLAGS, 0 },
1028   { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
1029     CPU_PCLMUL_FLAGS, 0 },
1030   { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
1031     CPU_PCLMUL_FLAGS, 1 },
1032   { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
1033     CPU_FSGSBASE_FLAGS, 0 },
1034   { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
1035     CPU_RDRND_FLAGS, 0 },
1036   { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
1037     CPU_F16C_FLAGS, 0 },
1038   { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
1039     CPU_BMI2_FLAGS, 0 },
1040   { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
1041     CPU_FMA_FLAGS, 0 },
1042   { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
1043     CPU_FMA4_FLAGS, 0 },
1044   { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
1045     CPU_XOP_FLAGS, 0 },
1046   { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
1047     CPU_LWP_FLAGS, 0 },
1048   { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
1049     CPU_MOVBE_FLAGS, 0 },
1050   { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
1051     CPU_CX16_FLAGS, 0 },
1052   { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
1053     CPU_EPT_FLAGS, 0 },
1054   { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
1055     CPU_LZCNT_FLAGS, 0 },
1056   { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
1057     CPU_HLE_FLAGS, 0 },
1058   { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
1059     CPU_RTM_FLAGS, 0 },
1060   { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
1061     CPU_INVPCID_FLAGS, 0 },
1062   { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
1063     CPU_CLFLUSH_FLAGS, 0 },
1064   { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
1065     CPU_NOP_FLAGS, 0 },
1066   { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
1067     CPU_SYSCALL_FLAGS, 0 },
1068   { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
1069     CPU_RDTSCP_FLAGS, 0 },
1070   { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
1071     CPU_3DNOW_FLAGS, 0 },
1072   { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
1073     CPU_3DNOWA_FLAGS, 0 },
1074   { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
1075     CPU_PADLOCK_FLAGS, 0 },
1076   { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
1077     CPU_SVME_FLAGS, 1 },
1078   { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
1079     CPU_SVME_FLAGS, 0 },
1080   { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1081     CPU_SSE4A_FLAGS, 0 },
1082   { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
1083     CPU_ABM_FLAGS, 0 },
1084   { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
1085     CPU_BMI_FLAGS, 0 },
1086   { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
1087     CPU_TBM_FLAGS, 0 },
1088   { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
1089     CPU_ADX_FLAGS, 0 },
1090   { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
1091     CPU_RDSEED_FLAGS, 0 },
1092   { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
1093     CPU_PRFCHW_FLAGS, 0 },
1094   { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
1095     CPU_SMAP_FLAGS, 0 },
1096   { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
1097     CPU_MPX_FLAGS, 0 },
1098   { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
1099     CPU_SHA_FLAGS, 0 },
1100   { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
1101     CPU_CLFLUSHOPT_FLAGS, 0 },
1102   { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
1103     CPU_PREFETCHWT1_FLAGS, 0 },
1104   { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
1105     CPU_SE1_FLAGS, 0 },
1106   { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
1107     CPU_CLWB_FLAGS, 0 },
1108   { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
1109     CPU_AVX512IFMA_FLAGS, 0 },
1110   { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
1111     CPU_AVX512VBMI_FLAGS, 0 },
1112   { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1113     CPU_AVX512_4FMAPS_FLAGS, 0 },
1114   { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1115     CPU_AVX512_4VNNIW_FLAGS, 0 },
1116   { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1117     CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
1118   { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1119     CPU_AVX512_VBMI2_FLAGS, 0 },
1120   { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1121     CPU_AVX512_VNNI_FLAGS, 0 },
1122   { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1123     CPU_AVX512_BITALG_FLAGS, 0 },
1124   { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
1125     CPU_CLZERO_FLAGS, 0 },
1126   { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
1127     CPU_MWAITX_FLAGS, 0 },
1128   { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
1129     CPU_OSPKE_FLAGS, 0 },
1130   { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
1131     CPU_RDPID_FLAGS, 0 },
1132   { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1133     CPU_PTWRITE_FLAGS, 0 },
1134   { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1135     CPU_IBT_FLAGS, 0 },
1136   { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1137     CPU_SHSTK_FLAGS, 0 },
1138   { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1139     CPU_GFNI_FLAGS, 0 },
1140   { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1141     CPU_VAES_FLAGS, 0 },
1142   { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1143     CPU_VPCLMULQDQ_FLAGS, 0 },
1144   { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1145     CPU_WBNOINVD_FLAGS, 0 },
1146   { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1147     CPU_PCONFIG_FLAGS, 0 },
1148   { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1149     CPU_WAITPKG_FLAGS, 0 },
1150   { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1151     CPU_CLDEMOTE_FLAGS, 0 },
1152   { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1153     CPU_MOVDIRI_FLAGS, 0 },
1154   { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1155     CPU_MOVDIR64B_FLAGS, 0 },
1156   { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1157     CPU_AVX512_BF16_FLAGS, 0 },
1158   { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
1159     CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
1160   { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
1161     CPU_ENQCMD_FLAGS, 0 },
1162   { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
1163     CPU_RDPRU_FLAGS, 0 },
1164   { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
1165     CPU_MCOMMIT_FLAGS, 0 },
1166 };
1167
1168 static const noarch_entry cpu_noarch[] =
1169 {
1170   { STRING_COMMA_LEN ("no87"),  CPU_ANY_X87_FLAGS },
1171   { STRING_COMMA_LEN ("no287"),  CPU_ANY_287_FLAGS },
1172   { STRING_COMMA_LEN ("no387"),  CPU_ANY_387_FLAGS },
1173   { STRING_COMMA_LEN ("no687"),  CPU_ANY_687_FLAGS },
1174   { STRING_COMMA_LEN ("nocmov"),  CPU_ANY_CMOV_FLAGS },
1175   { STRING_COMMA_LEN ("nofxsr"),  CPU_ANY_FXSR_FLAGS },
1176   { STRING_COMMA_LEN ("nommx"),  CPU_ANY_MMX_FLAGS },
1177   { STRING_COMMA_LEN ("nosse"),  CPU_ANY_SSE_FLAGS },
1178   { STRING_COMMA_LEN ("nosse2"),  CPU_ANY_SSE2_FLAGS },
1179   { STRING_COMMA_LEN ("nosse3"),  CPU_ANY_SSE3_FLAGS },
1180   { STRING_COMMA_LEN ("nossse3"),  CPU_ANY_SSSE3_FLAGS },
1181   { STRING_COMMA_LEN ("nosse4.1"),  CPU_ANY_SSE4_1_FLAGS },
1182   { STRING_COMMA_LEN ("nosse4.2"),  CPU_ANY_SSE4_2_FLAGS },
1183   { STRING_COMMA_LEN ("nosse4"),  CPU_ANY_SSE4_FLAGS },
1184   { STRING_COMMA_LEN ("noavx"),  CPU_ANY_AVX_FLAGS },
1185   { STRING_COMMA_LEN ("noavx2"),  CPU_ANY_AVX2_FLAGS },
1186   { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1187   { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1188   { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1189   { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1190   { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1191   { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1192   { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1193   { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1194   { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
1195   { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
1196   { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
1197   { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
1198   { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
1199   { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
1200   { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
1201   { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1202   { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
1203   { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1204   { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
1205   { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
1206   { STRING_COMMA_LEN ("noavx512_vp2intersect"), CPU_ANY_SHSTK_FLAGS },
1207   { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
1208 };
1209
1210 #ifdef I386COFF
1211 /* Like s_lcomm_internal in gas/read.c but the alignment string
1212    is allowed to be optional.  */
1213
1214 static symbolS *
1215 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1216 {
1217   addressT align = 0;
1218
1219   SKIP_WHITESPACE ();
1220
1221   if (needs_align
1222       && *input_line_pointer == ',')
1223     {
1224       align = parse_align (needs_align - 1);
1225
1226       if (align == (addressT) -1)
1227         return NULL;
1228     }
1229   else
1230     {
1231       if (size >= 8)
1232         align = 3;
1233       else if (size >= 4)
1234         align = 2;
1235       else if (size >= 2)
1236         align = 1;
1237       else
1238         align = 0;
1239     }
1240
1241   bss_alloc (symbolP, size, align);
1242   return symbolP;
1243 }
1244
1245 static void
1246 pe_lcomm (int needs_align)
1247 {
1248   s_comm_internal (needs_align * 2, pe_lcomm_internal);
1249 }
1250 #endif
1251
1252 const pseudo_typeS md_pseudo_table[] =
1253 {
1254 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1255   {"align", s_align_bytes, 0},
1256 #else
1257   {"align", s_align_ptwo, 0},
1258 #endif
1259   {"arch", set_cpu_arch, 0},
1260 #ifndef I386COFF
1261   {"bss", s_bss, 0},
1262 #else
1263   {"lcomm", pe_lcomm, 1},
1264 #endif
1265   {"ffloat", float_cons, 'f'},
1266   {"dfloat", float_cons, 'd'},
1267   {"tfloat", float_cons, 'x'},
1268   {"value", cons, 2},
1269   {"slong", signed_cons, 4},
1270   {"noopt", s_ignore, 0},
1271   {"optim", s_ignore, 0},
1272   {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1273   {"code16", set_code_flag, CODE_16BIT},
1274   {"code32", set_code_flag, CODE_32BIT},
1275 #ifdef BFD64
1276   {"code64", set_code_flag, CODE_64BIT},
1277 #endif
1278   {"intel_syntax", set_intel_syntax, 1},
1279   {"att_syntax", set_intel_syntax, 0},
1280   {"intel_mnemonic", set_intel_mnemonic, 1},
1281   {"att_mnemonic", set_intel_mnemonic, 0},
1282   {"allow_index_reg", set_allow_index_reg, 1},
1283   {"disallow_index_reg", set_allow_index_reg, 0},
1284   {"sse_check", set_check, 0},
1285   {"operand_check", set_check, 1},
1286 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1287   {"largecomm", handle_large_common, 0},
1288 #else
1289   {"file", dwarf2_directive_file, 0},
1290   {"loc", dwarf2_directive_loc, 0},
1291   {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1292 #endif
1293 #ifdef TE_PE
1294   {"secrel32", pe_directive_secrel, 0},
1295 #endif
1296   {0, 0, 0}
1297 };
1298
1299 /* For interface with expression ().  */
1300 extern char *input_line_pointer;
1301
1302 /* Hash table for instruction mnemonic lookup.  */
1303 static struct hash_control *op_hash;
1304
1305 /* Hash table for register lookup.  */
1306 static struct hash_control *reg_hash;
1307 \f
1308   /* Various efficient no-op patterns for aligning code labels.
1309      Note: Don't try to assemble the instructions in the comments.
1310      0L and 0w are not legal.  */
1311 static const unsigned char f32_1[] =
1312   {0x90};                               /* nop                  */
1313 static const unsigned char f32_2[] =
1314   {0x66,0x90};                          /* xchg %ax,%ax         */
1315 static const unsigned char f32_3[] =
1316   {0x8d,0x76,0x00};                     /* leal 0(%esi),%esi    */
1317 static const unsigned char f32_4[] =
1318   {0x8d,0x74,0x26,0x00};                /* leal 0(%esi,1),%esi  */
1319 static const unsigned char f32_6[] =
1320   {0x8d,0xb6,0x00,0x00,0x00,0x00};      /* leal 0L(%esi),%esi   */
1321 static const unsigned char f32_7[] =
1322   {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1323 static const unsigned char f16_3[] =
1324   {0x8d,0x74,0x00};                     /* lea 0(%si),%si       */
1325 static const unsigned char f16_4[] =
1326   {0x8d,0xb4,0x00,0x00};                /* lea 0W(%si),%si      */
1327 static const unsigned char jump_disp8[] =
1328   {0xeb};                               /* jmp disp8           */
1329 static const unsigned char jump32_disp32[] =
1330   {0xe9};                               /* jmp disp32          */
1331 static const unsigned char jump16_disp32[] =
1332   {0x66,0xe9};                          /* jmp disp32          */
1333 /* 32-bit NOPs patterns.  */
1334 static const unsigned char *const f32_patt[] = {
1335   f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
1336 };
1337 /* 16-bit NOPs patterns.  */
1338 static const unsigned char *const f16_patt[] = {
1339   f32_1, f32_2, f16_3, f16_4
1340 };
1341 /* nopl (%[re]ax) */
1342 static const unsigned char alt_3[] =
1343   {0x0f,0x1f,0x00};
1344 /* nopl 0(%[re]ax) */
1345 static const unsigned char alt_4[] =
1346   {0x0f,0x1f,0x40,0x00};
1347 /* nopl 0(%[re]ax,%[re]ax,1) */
1348 static const unsigned char alt_5[] =
1349   {0x0f,0x1f,0x44,0x00,0x00};
1350 /* nopw 0(%[re]ax,%[re]ax,1) */
1351 static const unsigned char alt_6[] =
1352   {0x66,0x0f,0x1f,0x44,0x00,0x00};
1353 /* nopl 0L(%[re]ax) */
1354 static const unsigned char alt_7[] =
1355   {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1356 /* nopl 0L(%[re]ax,%[re]ax,1) */
1357 static const unsigned char alt_8[] =
1358   {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1359 /* nopw 0L(%[re]ax,%[re]ax,1) */
1360 static const unsigned char alt_9[] =
1361   {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1362 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1363 static const unsigned char alt_10[] =
1364   {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1365 /* data16 nopw %cs:0L(%eax,%eax,1) */
1366 static const unsigned char alt_11[] =
1367   {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1368 /* 32-bit and 64-bit NOPs patterns.  */
1369 static const unsigned char *const alt_patt[] = {
1370   f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1371   alt_9, alt_10, alt_11
1372 };
1373
1374 /* Genenerate COUNT bytes of NOPs to WHERE from PATT with the maximum
1375    size of a single NOP instruction MAX_SINGLE_NOP_SIZE.  */
1376
1377 static void
1378 i386_output_nops (char *where, const unsigned char *const *patt,
1379                   int count, int max_single_nop_size)
1380
1381 {
1382   /* Place the longer NOP first.  */
1383   int last;
1384   int offset;
1385   const unsigned char *nops;
1386
1387   if (max_single_nop_size < 1)
1388     {
1389       as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1390                 max_single_nop_size);
1391       return;
1392     }
1393
1394   nops = patt[max_single_nop_size - 1];
1395
1396   /* Use the smaller one if the requsted one isn't available.  */
1397   if (nops == NULL)
1398     {
1399       max_single_nop_size--;
1400       nops = patt[max_single_nop_size - 1];
1401     }
1402
1403   last = count % max_single_nop_size;
1404
1405   count -= last;
1406   for (offset = 0; offset < count; offset += max_single_nop_size)
1407     memcpy (where + offset, nops, max_single_nop_size);
1408
1409   if (last)
1410     {
1411       nops = patt[last - 1];
1412       if (nops == NULL)
1413         {
1414           /* Use the smaller one plus one-byte NOP if the needed one
1415              isn't available.  */
1416           last--;
1417           nops = patt[last - 1];
1418           memcpy (where + offset, nops, last);
1419           where[offset + last] = *patt[0];
1420         }
1421       else
1422         memcpy (where + offset, nops, last);
1423     }
1424 }
1425
1426 static INLINE int
1427 fits_in_imm7 (offsetT num)
1428 {
1429   return (num & 0x7f) == num;
1430 }
1431
1432 static INLINE int
1433 fits_in_imm31 (offsetT num)
1434 {
1435   return (num & 0x7fffffff) == num;
1436 }
1437
1438 /* Genenerate COUNT bytes of NOPs to WHERE with the maximum size of a
1439    single NOP instruction LIMIT.  */
1440
1441 void
1442 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1443 {
1444   const unsigned char *const *patt = NULL;
1445   int max_single_nop_size;
1446   /* Maximum number of NOPs before switching to jump over NOPs.  */
1447   int max_number_of_nops;
1448
1449   switch (fragP->fr_type)
1450     {
1451     case rs_fill_nop:
1452     case rs_align_code:
1453       break;
1454     case rs_machine_dependent:
1455       /* Allow NOP padding for jumps and calls.  */
1456       if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
1457           || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
1458         break;
1459       /* Fall through.  */
1460     default:
1461       return;
1462     }
1463
1464   /* We need to decide which NOP sequence to use for 32bit and
1465      64bit. When -mtune= is used:
1466
1467      1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1468      PROCESSOR_GENERIC32, f32_patt will be used.
1469      2. For the rest, alt_patt will be used.
1470
1471      When -mtune= isn't used, alt_patt will be used if
1472      cpu_arch_isa_flags has CpuNop.  Otherwise, f32_patt will
1473      be used.
1474
1475      When -march= or .arch is used, we can't use anything beyond
1476      cpu_arch_isa_flags.   */
1477
1478   if (flag_code == CODE_16BIT)
1479     {
1480       patt = f16_patt;
1481       max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1482       /* Limit number of NOPs to 2 in 16-bit mode.  */
1483       max_number_of_nops = 2;
1484     }
1485   else
1486     {
1487       if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1488         {
1489           /* PROCESSOR_UNKNOWN means that all ISAs may be used.  */
1490           switch (cpu_arch_tune)
1491             {
1492             case PROCESSOR_UNKNOWN:
1493               /* We use cpu_arch_isa_flags to check if we SHOULD
1494                  optimize with nops.  */
1495               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1496                 patt = alt_patt;
1497               else
1498                 patt = f32_patt;
1499               break;
1500             case PROCESSOR_PENTIUM4:
1501             case PROCESSOR_NOCONA:
1502             case PROCESSOR_CORE:
1503             case PROCESSOR_CORE2:
1504             case PROCESSOR_COREI7:
1505             case PROCESSOR_L1OM:
1506             case PROCESSOR_K1OM:
1507             case PROCESSOR_GENERIC64:
1508             case PROCESSOR_K6:
1509             case PROCESSOR_ATHLON:
1510             case PROCESSOR_K8:
1511             case PROCESSOR_AMDFAM10:
1512             case PROCESSOR_BD:
1513             case PROCESSOR_ZNVER:
1514             case PROCESSOR_BT:
1515               patt = alt_patt;
1516               break;
1517             case PROCESSOR_I386:
1518             case PROCESSOR_I486:
1519             case PROCESSOR_PENTIUM:
1520             case PROCESSOR_PENTIUMPRO:
1521             case PROCESSOR_IAMCU:
1522             case PROCESSOR_GENERIC32:
1523               patt = f32_patt;
1524               break;
1525             }
1526         }
1527       else
1528         {
1529           switch (fragP->tc_frag_data.tune)
1530             {
1531             case PROCESSOR_UNKNOWN:
1532               /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1533                  PROCESSOR_UNKNOWN.  */
1534               abort ();
1535               break;
1536
1537             case PROCESSOR_I386:
1538             case PROCESSOR_I486:
1539             case PROCESSOR_PENTIUM:
1540             case PROCESSOR_IAMCU:
1541             case PROCESSOR_K6:
1542             case PROCESSOR_ATHLON:
1543             case PROCESSOR_K8:
1544             case PROCESSOR_AMDFAM10:
1545             case PROCESSOR_BD:
1546             case PROCESSOR_ZNVER:
1547             case PROCESSOR_BT:
1548             case PROCESSOR_GENERIC32:
1549               /* We use cpu_arch_isa_flags to check if we CAN optimize
1550                  with nops.  */
1551               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1552                 patt = alt_patt;
1553               else
1554                 patt = f32_patt;
1555               break;
1556             case PROCESSOR_PENTIUMPRO:
1557             case PROCESSOR_PENTIUM4:
1558             case PROCESSOR_NOCONA:
1559             case PROCESSOR_CORE:
1560             case PROCESSOR_CORE2:
1561             case PROCESSOR_COREI7:
1562             case PROCESSOR_L1OM:
1563             case PROCESSOR_K1OM:
1564               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1565                 patt = alt_patt;
1566               else
1567                 patt = f32_patt;
1568               break;
1569             case PROCESSOR_GENERIC64:
1570               patt = alt_patt;
1571               break;
1572             }
1573         }
1574
1575       if (patt == f32_patt)
1576         {
1577           max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1578           /* Limit number of NOPs to 2 for older processors.  */
1579           max_number_of_nops = 2;
1580         }
1581       else
1582         {
1583           max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1584           /* Limit number of NOPs to 7 for newer processors.  */
1585           max_number_of_nops = 7;
1586         }
1587     }
1588
1589   if (limit == 0)
1590     limit = max_single_nop_size;
1591
1592   if (fragP->fr_type == rs_fill_nop)
1593     {
1594       /* Output NOPs for .nop directive.  */
1595       if (limit > max_single_nop_size)
1596         {
1597           as_bad_where (fragP->fr_file, fragP->fr_line,
1598                         _("invalid single nop size: %d "
1599                           "(expect within [0, %d])"),
1600                         limit, max_single_nop_size);
1601           return;
1602         }
1603     }
1604   else if (fragP->fr_type != rs_machine_dependent)
1605     fragP->fr_var = count;
1606
1607   if ((count / max_single_nop_size) > max_number_of_nops)
1608     {
1609       /* Generate jump over NOPs.  */
1610       offsetT disp = count - 2;
1611       if (fits_in_imm7 (disp))
1612         {
1613           /* Use "jmp disp8" if possible.  */
1614           count = disp;
1615           where[0] = jump_disp8[0];
1616           where[1] = count;
1617           where += 2;
1618         }
1619       else
1620         {
1621           unsigned int size_of_jump;
1622
1623           if (flag_code == CODE_16BIT)
1624             {
1625               where[0] = jump16_disp32[0];
1626               where[1] = jump16_disp32[1];
1627               size_of_jump = 2;
1628             }
1629           else
1630             {
1631               where[0] = jump32_disp32[0];
1632               size_of_jump = 1;
1633             }
1634
1635           count -= size_of_jump + 4;
1636           if (!fits_in_imm31 (count))
1637             {
1638               as_bad_where (fragP->fr_file, fragP->fr_line,
1639                             _("jump over nop padding out of range"));
1640               return;
1641             }
1642
1643           md_number_to_chars (where + size_of_jump, count, 4);
1644           where += size_of_jump + 4;
1645         }
1646     }
1647
1648   /* Generate multiple NOPs.  */
1649   i386_output_nops (where, patt, count, limit);
1650 }
1651
1652 static INLINE int
1653 operand_type_all_zero (const union i386_operand_type *x)
1654 {
1655   switch (ARRAY_SIZE(x->array))
1656     {
1657     case 3:
1658       if (x->array[2])
1659         return 0;
1660       /* Fall through.  */
1661     case 2:
1662       if (x->array[1])
1663         return 0;
1664       /* Fall through.  */
1665     case 1:
1666       return !x->array[0];
1667     default:
1668       abort ();
1669     }
1670 }
1671
1672 static INLINE void
1673 operand_type_set (union i386_operand_type *x, unsigned int v)
1674 {
1675   switch (ARRAY_SIZE(x->array))
1676     {
1677     case 3:
1678       x->array[2] = v;
1679       /* Fall through.  */
1680     case 2:
1681       x->array[1] = v;
1682       /* Fall through.  */
1683     case 1:
1684       x->array[0] = v;
1685       /* Fall through.  */
1686       break;
1687     default:
1688       abort ();
1689     }
1690
1691   x->bitfield.class = ClassNone;
1692   x->bitfield.instance = InstanceNone;
1693 }
1694
1695 static INLINE int
1696 operand_type_equal (const union i386_operand_type *x,
1697                     const union i386_operand_type *y)
1698 {
1699   switch (ARRAY_SIZE(x->array))
1700     {
1701     case 3:
1702       if (x->array[2] != y->array[2])
1703         return 0;
1704       /* Fall through.  */
1705     case 2:
1706       if (x->array[1] != y->array[1])
1707         return 0;
1708       /* Fall through.  */
1709     case 1:
1710       return x->array[0] == y->array[0];
1711       break;
1712     default:
1713       abort ();
1714     }
1715 }
1716
1717 static INLINE int
1718 cpu_flags_all_zero (const union i386_cpu_flags *x)
1719 {
1720   switch (ARRAY_SIZE(x->array))
1721     {
1722     case 4:
1723       if (x->array[3])
1724         return 0;
1725       /* Fall through.  */
1726     case 3:
1727       if (x->array[2])
1728         return 0;
1729       /* Fall through.  */
1730     case 2:
1731       if (x->array[1])
1732         return 0;
1733       /* Fall through.  */
1734     case 1:
1735       return !x->array[0];
1736     default:
1737       abort ();
1738     }
1739 }
1740
1741 static INLINE int
1742 cpu_flags_equal (const union i386_cpu_flags *x,
1743                  const union i386_cpu_flags *y)
1744 {
1745   switch (ARRAY_SIZE(x->array))
1746     {
1747     case 4:
1748       if (x->array[3] != y->array[3])
1749         return 0;
1750       /* Fall through.  */
1751     case 3:
1752       if (x->array[2] != y->array[2])
1753         return 0;
1754       /* Fall through.  */
1755     case 2:
1756       if (x->array[1] != y->array[1])
1757         return 0;
1758       /* Fall through.  */
1759     case 1:
1760       return x->array[0] == y->array[0];
1761       break;
1762     default:
1763       abort ();
1764     }
1765 }
1766
1767 static INLINE int
1768 cpu_flags_check_cpu64 (i386_cpu_flags f)
1769 {
1770   return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1771            || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1772 }
1773
1774 static INLINE i386_cpu_flags
1775 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1776 {
1777   switch (ARRAY_SIZE (x.array))
1778     {
1779     case 4:
1780       x.array [3] &= y.array [3];
1781       /* Fall through.  */
1782     case 3:
1783       x.array [2] &= y.array [2];
1784       /* Fall through.  */
1785     case 2:
1786       x.array [1] &= y.array [1];
1787       /* Fall through.  */
1788     case 1:
1789       x.array [0] &= y.array [0];
1790       break;
1791     default:
1792       abort ();
1793     }
1794   return x;
1795 }
1796
1797 static INLINE i386_cpu_flags
1798 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1799 {
1800   switch (ARRAY_SIZE (x.array))
1801     {
1802     case 4:
1803       x.array [3] |= y.array [3];
1804       /* Fall through.  */
1805     case 3:
1806       x.array [2] |= y.array [2];
1807       /* Fall through.  */
1808     case 2:
1809       x.array [1] |= y.array [1];
1810       /* Fall through.  */
1811     case 1:
1812       x.array [0] |= y.array [0];
1813       break;
1814     default:
1815       abort ();
1816     }
1817   return x;
1818 }
1819
1820 static INLINE i386_cpu_flags
1821 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1822 {
1823   switch (ARRAY_SIZE (x.array))
1824     {
1825     case 4:
1826       x.array [3] &= ~y.array [3];
1827       /* Fall through.  */
1828     case 3:
1829       x.array [2] &= ~y.array [2];
1830       /* Fall through.  */
1831     case 2:
1832       x.array [1] &= ~y.array [1];
1833       /* Fall through.  */
1834     case 1:
1835       x.array [0] &= ~y.array [0];
1836       break;
1837     default:
1838       abort ();
1839     }
1840   return x;
1841 }
1842
1843 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
1844
1845 #define CPU_FLAGS_ARCH_MATCH            0x1
1846 #define CPU_FLAGS_64BIT_MATCH           0x2
1847
1848 #define CPU_FLAGS_PERFECT_MATCH \
1849   (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1850
1851 /* Return CPU flags match bits. */
1852
1853 static int
1854 cpu_flags_match (const insn_template *t)
1855 {
1856   i386_cpu_flags x = t->cpu_flags;
1857   int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1858
1859   x.bitfield.cpu64 = 0;
1860   x.bitfield.cpuno64 = 0;
1861
1862   if (cpu_flags_all_zero (&x))
1863     {
1864       /* This instruction is available on all archs.  */
1865       match |= CPU_FLAGS_ARCH_MATCH;
1866     }
1867   else
1868     {
1869       /* This instruction is available only on some archs.  */
1870       i386_cpu_flags cpu = cpu_arch_flags;
1871
1872       /* AVX512VL is no standalone feature - match it and then strip it.  */
1873       if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1874         return match;
1875       x.bitfield.cpuavx512vl = 0;
1876
1877       cpu = cpu_flags_and (x, cpu);
1878       if (!cpu_flags_all_zero (&cpu))
1879         {
1880           if (x.bitfield.cpuavx)
1881             {
1882               /* We need to check a few extra flags with AVX.  */
1883               if (cpu.bitfield.cpuavx
1884                   && (!t->opcode_modifier.sse2avx || sse2avx)
1885                   && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1886                   && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1887                   && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1888                 match |= CPU_FLAGS_ARCH_MATCH;
1889             }
1890           else if (x.bitfield.cpuavx512f)
1891             {
1892               /* We need to check a few extra flags with AVX512F.  */
1893               if (cpu.bitfield.cpuavx512f
1894                   && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1895                   && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1896                   && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1897                 match |= CPU_FLAGS_ARCH_MATCH;
1898             }
1899           else
1900             match |= CPU_FLAGS_ARCH_MATCH;
1901         }
1902     }
1903   return match;
1904 }
1905
1906 static INLINE i386_operand_type
1907 operand_type_and (i386_operand_type x, i386_operand_type y)
1908 {
1909   if (x.bitfield.class != y.bitfield.class)
1910     x.bitfield.class = ClassNone;
1911   if (x.bitfield.instance != y.bitfield.instance)
1912     x.bitfield.instance = InstanceNone;
1913
1914   switch (ARRAY_SIZE (x.array))
1915     {
1916     case 3:
1917       x.array [2] &= y.array [2];
1918       /* Fall through.  */
1919     case 2:
1920       x.array [1] &= y.array [1];
1921       /* Fall through.  */
1922     case 1:
1923       x.array [0] &= y.array [0];
1924       break;
1925     default:
1926       abort ();
1927     }
1928   return x;
1929 }
1930
1931 static INLINE i386_operand_type
1932 operand_type_and_not (i386_operand_type x, i386_operand_type y)
1933 {
1934   gas_assert (y.bitfield.class == ClassNone);
1935   gas_assert (y.bitfield.instance == InstanceNone);
1936
1937   switch (ARRAY_SIZE (x.array))
1938     {
1939     case 3:
1940       x.array [2] &= ~y.array [2];
1941       /* Fall through.  */
1942     case 2:
1943       x.array [1] &= ~y.array [1];
1944       /* Fall through.  */
1945     case 1:
1946       x.array [0] &= ~y.array [0];
1947       break;
1948     default:
1949       abort ();
1950     }
1951   return x;
1952 }
1953
1954 static INLINE i386_operand_type
1955 operand_type_or (i386_operand_type x, i386_operand_type y)
1956 {
1957   gas_assert (x.bitfield.class == ClassNone ||
1958               y.bitfield.class == ClassNone ||
1959               x.bitfield.class == y.bitfield.class);
1960   gas_assert (x.bitfield.instance == InstanceNone ||
1961               y.bitfield.instance == InstanceNone ||
1962               x.bitfield.instance == y.bitfield.instance);
1963
1964   switch (ARRAY_SIZE (x.array))
1965     {
1966     case 3:
1967       x.array [2] |= y.array [2];
1968       /* Fall through.  */
1969     case 2:
1970       x.array [1] |= y.array [1];
1971       /* Fall through.  */
1972     case 1:
1973       x.array [0] |= y.array [0];
1974       break;
1975     default:
1976       abort ();
1977     }
1978   return x;
1979 }
1980
1981 static INLINE i386_operand_type
1982 operand_type_xor (i386_operand_type x, i386_operand_type y)
1983 {
1984   gas_assert (y.bitfield.class == ClassNone);
1985   gas_assert (y.bitfield.instance == InstanceNone);
1986
1987   switch (ARRAY_SIZE (x.array))
1988     {
1989     case 3:
1990       x.array [2] ^= y.array [2];
1991       /* Fall through.  */
1992     case 2:
1993       x.array [1] ^= y.array [1];
1994       /* Fall through.  */
1995     case 1:
1996       x.array [0] ^= y.array [0];
1997       break;
1998     default:
1999       abort ();
2000     }
2001   return x;
2002 }
2003
2004 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
2005 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
2006 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
2007 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
2008 static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
2009 static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
2010 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
2011 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
2012 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
2013 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
2014 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
2015 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
2016 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
2017 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
2018 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
2019 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
2020 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
2021
2022 enum operand_type
2023 {
2024   reg,
2025   imm,
2026   disp,
2027   anymem
2028 };
2029
2030 static INLINE int
2031 operand_type_check (i386_operand_type t, enum operand_type c)
2032 {
2033   switch (c)
2034     {
2035     case reg:
2036       return t.bitfield.class == Reg;
2037
2038     case imm:
2039       return (t.bitfield.imm8
2040               || t.bitfield.imm8s
2041               || t.bitfield.imm16
2042               || t.bitfield.imm32
2043               || t.bitfield.imm32s
2044               || t.bitfield.imm64);
2045
2046     case disp:
2047       return (t.bitfield.disp8
2048               || t.bitfield.disp16
2049               || t.bitfield.disp32
2050               || t.bitfield.disp32s
2051               || t.bitfield.disp64);
2052
2053     case anymem:
2054       return (t.bitfield.disp8
2055               || t.bitfield.disp16
2056               || t.bitfield.disp32
2057               || t.bitfield.disp32s
2058               || t.bitfield.disp64
2059               || t.bitfield.baseindex);
2060
2061     default:
2062       abort ();
2063     }
2064
2065   return 0;
2066 }
2067
2068 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2069    between operand GIVEN and opeand WANTED for instruction template T.  */
2070
2071 static INLINE int
2072 match_operand_size (const insn_template *t, unsigned int wanted,
2073                     unsigned int given)
2074 {
2075   return !((i.types[given].bitfield.byte
2076             && !t->operand_types[wanted].bitfield.byte)
2077            || (i.types[given].bitfield.word
2078                && !t->operand_types[wanted].bitfield.word)
2079            || (i.types[given].bitfield.dword
2080                && !t->operand_types[wanted].bitfield.dword)
2081            || (i.types[given].bitfield.qword
2082                && !t->operand_types[wanted].bitfield.qword)
2083            || (i.types[given].bitfield.tbyte
2084                && !t->operand_types[wanted].bitfield.tbyte));
2085 }
2086
2087 /* Return 1 if there is no conflict in SIMD register between operand
2088    GIVEN and opeand WANTED for instruction template T.  */
2089
2090 static INLINE int
2091 match_simd_size (const insn_template *t, unsigned int wanted,
2092                  unsigned int given)
2093 {
2094   return !((i.types[given].bitfield.xmmword
2095             && !t->operand_types[wanted].bitfield.xmmword)
2096            || (i.types[given].bitfield.ymmword
2097                && !t->operand_types[wanted].bitfield.ymmword)
2098            || (i.types[given].bitfield.zmmword
2099                && !t->operand_types[wanted].bitfield.zmmword));
2100 }
2101
2102 /* Return 1 if there is no conflict in any size between operand GIVEN
2103    and opeand WANTED for instruction template T.  */
2104
2105 static INLINE int
2106 match_mem_size (const insn_template *t, unsigned int wanted,
2107                 unsigned int given)
2108 {
2109   return (match_operand_size (t, wanted, given)
2110           && !((i.types[given].bitfield.unspecified
2111                 && !i.broadcast
2112                 && !t->operand_types[wanted].bitfield.unspecified)
2113                || (i.types[given].bitfield.fword
2114                    && !t->operand_types[wanted].bitfield.fword)
2115                /* For scalar opcode templates to allow register and memory
2116                   operands at the same time, some special casing is needed
2117                   here.  Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2118                   down-conversion vpmov*.  */
2119                || ((t->operand_types[wanted].bitfield.class == RegSIMD
2120                     && !t->opcode_modifier.broadcast
2121                     && (t->operand_types[wanted].bitfield.byte
2122                         || t->operand_types[wanted].bitfield.word
2123                         || t->operand_types[wanted].bitfield.dword
2124                         || t->operand_types[wanted].bitfield.qword))
2125                    ? (i.types[given].bitfield.xmmword
2126                       || i.types[given].bitfield.ymmword
2127                       || i.types[given].bitfield.zmmword)
2128                    : !match_simd_size(t, wanted, given))));
2129 }
2130
2131 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2132    operands for instruction template T, and it has MATCH_REVERSE set if there
2133    is no size conflict on any operands for the template with operands reversed
2134    (and the template allows for reversing in the first place).  */
2135
2136 #define MATCH_STRAIGHT 1
2137 #define MATCH_REVERSE  2
2138
2139 static INLINE unsigned int
2140 operand_size_match (const insn_template *t)
2141 {
2142   unsigned int j, match = MATCH_STRAIGHT;
2143
2144   /* Don't check non-absolute jump instructions.  */
2145   if (t->opcode_modifier.jump
2146       && t->opcode_modifier.jump != JUMP_ABSOLUTE)
2147     return match;
2148
2149   /* Check memory and accumulator operand size.  */
2150   for (j = 0; j < i.operands; j++)
2151     {
2152       if (i.types[j].bitfield.class != Reg
2153           && i.types[j].bitfield.class != RegSIMD
2154           && t->opcode_modifier.anysize)
2155         continue;
2156
2157       if (t->operand_types[j].bitfield.class == Reg
2158           && !match_operand_size (t, j, j))
2159         {
2160           match = 0;
2161           break;
2162         }
2163
2164       if (t->operand_types[j].bitfield.class == RegSIMD
2165           && !match_simd_size (t, j, j))
2166         {
2167           match = 0;
2168           break;
2169         }
2170
2171       if (t->operand_types[j].bitfield.instance == Accum
2172           && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2173         {
2174           match = 0;
2175           break;
2176         }
2177
2178       if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2179         {
2180           match = 0;
2181           break;
2182         }
2183     }
2184
2185   if (!t->opcode_modifier.d)
2186     {
2187 mismatch:
2188       if (!match)
2189         i.error = operand_size_mismatch;
2190       return match;
2191     }
2192
2193   /* Check reverse.  */
2194   gas_assert (i.operands >= 2 && i.operands <= 3);
2195
2196   for (j = 0; j < i.operands; j++)
2197     {
2198       unsigned int given = i.operands - j - 1;
2199
2200       if (t->operand_types[j].bitfield.class == Reg
2201           && !match_operand_size (t, j, given))
2202         goto mismatch;
2203
2204       if (t->operand_types[j].bitfield.class == RegSIMD
2205           && !match_simd_size (t, j, given))
2206         goto mismatch;
2207
2208       if (t->operand_types[j].bitfield.instance == Accum
2209           && (!match_operand_size (t, j, given)
2210               || !match_simd_size (t, j, given)))
2211         goto mismatch;
2212
2213       if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2214         goto mismatch;
2215     }
2216
2217   return match | MATCH_REVERSE;
2218 }
2219
2220 static INLINE int
2221 operand_type_match (i386_operand_type overlap,
2222                     i386_operand_type given)
2223 {
2224   i386_operand_type temp = overlap;
2225
2226   temp.bitfield.unspecified = 0;
2227   temp.bitfield.byte = 0;
2228   temp.bitfield.word = 0;
2229   temp.bitfield.dword = 0;
2230   temp.bitfield.fword = 0;
2231   temp.bitfield.qword = 0;
2232   temp.bitfield.tbyte = 0;
2233   temp.bitfield.xmmword = 0;
2234   temp.bitfield.ymmword = 0;
2235   temp.bitfield.zmmword = 0;
2236   if (operand_type_all_zero (&temp))
2237     goto mismatch;
2238
2239   if (given.bitfield.baseindex == overlap.bitfield.baseindex)
2240     return 1;
2241
2242 mismatch:
2243   i.error = operand_type_mismatch;
2244   return 0;
2245 }
2246
2247 /* If given types g0 and g1 are registers they must be of the same type
2248    unless the expected operand type register overlap is null.
2249    Some Intel syntax memory operand size checking also happens here.  */
2250
2251 static INLINE int
2252 operand_type_register_match (i386_operand_type g0,
2253                              i386_operand_type t0,
2254                              i386_operand_type g1,
2255                              i386_operand_type t1)
2256 {
2257   if (g0.bitfield.class != Reg
2258       && g0.bitfield.class != RegSIMD
2259       && (!operand_type_check (g0, anymem)
2260           || g0.bitfield.unspecified
2261           || (t0.bitfield.class != Reg
2262               && t0.bitfield.class != RegSIMD)))
2263     return 1;
2264
2265   if (g1.bitfield.class != Reg
2266       && g1.bitfield.class != RegSIMD
2267       && (!operand_type_check (g1, anymem)
2268           || g1.bitfield.unspecified
2269           || (t1.bitfield.class != Reg
2270               && t1.bitfield.class != RegSIMD)))
2271     return 1;
2272
2273   if (g0.bitfield.byte == g1.bitfield.byte
2274       && g0.bitfield.word == g1.bitfield.word
2275       && g0.bitfield.dword == g1.bitfield.dword
2276       && g0.bitfield.qword == g1.bitfield.qword
2277       && g0.bitfield.xmmword == g1.bitfield.xmmword
2278       && g0.bitfield.ymmword == g1.bitfield.ymmword
2279       && g0.bitfield.zmmword == g1.bitfield.zmmword)
2280     return 1;
2281
2282   if (!(t0.bitfield.byte & t1.bitfield.byte)
2283       && !(t0.bitfield.word & t1.bitfield.word)
2284       && !(t0.bitfield.dword & t1.bitfield.dword)
2285       && !(t0.bitfield.qword & t1.bitfield.qword)
2286       && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2287       && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2288       && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2289     return 1;
2290
2291   i.error = register_type_mismatch;
2292
2293   return 0;
2294 }
2295
2296 static INLINE unsigned int
2297 register_number (const reg_entry *r)
2298 {
2299   unsigned int nr = r->reg_num;
2300
2301   if (r->reg_flags & RegRex)
2302     nr += 8;
2303
2304   if (r->reg_flags & RegVRex)
2305     nr += 16;
2306
2307   return nr;
2308 }
2309
2310 static INLINE unsigned int
2311 mode_from_disp_size (i386_operand_type t)
2312 {
2313   if (t.bitfield.disp8)
2314     return 1;
2315   else if (t.bitfield.disp16
2316            || t.bitfield.disp32
2317            || t.bitfield.disp32s)
2318     return 2;
2319   else
2320     return 0;
2321 }
2322
2323 static INLINE int
2324 fits_in_signed_byte (addressT num)
2325 {
2326   return num + 0x80 <= 0xff;
2327 }
2328
2329 static INLINE int
2330 fits_in_unsigned_byte (addressT num)
2331 {
2332   return num <= 0xff;
2333 }
2334
2335 static INLINE int
2336 fits_in_unsigned_word (addressT num)
2337 {
2338   return num <= 0xffff;
2339 }
2340
2341 static INLINE int
2342 fits_in_signed_word (addressT num)
2343 {
2344   return num + 0x8000 <= 0xffff;
2345 }
2346
2347 static INLINE int
2348 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2349 {
2350 #ifndef BFD64
2351   return 1;
2352 #else
2353   return num + 0x80000000 <= 0xffffffff;
2354 #endif
2355 }                               /* fits_in_signed_long() */
2356
2357 static INLINE int
2358 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2359 {
2360 #ifndef BFD64
2361   return 1;
2362 #else
2363   return num <= 0xffffffff;
2364 #endif
2365 }                               /* fits_in_unsigned_long() */
2366
2367 static INLINE int
2368 fits_in_disp8 (offsetT num)
2369 {
2370   int shift = i.memshift;
2371   unsigned int mask;
2372
2373   if (shift == -1)
2374     abort ();
2375
2376   mask = (1 << shift) - 1;
2377
2378   /* Return 0 if NUM isn't properly aligned.  */
2379   if ((num & mask))
2380     return 0;
2381
2382   /* Check if NUM will fit in 8bit after shift.  */
2383   return fits_in_signed_byte (num >> shift);
2384 }
2385
2386 static INLINE int
2387 fits_in_imm4 (offsetT num)
2388 {
2389   return (num & 0xf) == num;
2390 }
2391
2392 static i386_operand_type
2393 smallest_imm_type (offsetT num)
2394 {
2395   i386_operand_type t;
2396
2397   operand_type_set (&t, 0);
2398   t.bitfield.imm64 = 1;
2399
2400   if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2401     {
2402       /* This code is disabled on the 486 because all the Imm1 forms
2403          in the opcode table are slower on the i486.  They're the
2404          versions with the implicitly specified single-position
2405          displacement, which has another syntax if you really want to
2406          use that form.  */
2407       t.bitfield.imm1 = 1;
2408       t.bitfield.imm8 = 1;
2409       t.bitfield.imm8s = 1;
2410       t.bitfield.imm16 = 1;
2411       t.bitfield.imm32 = 1;
2412       t.bitfield.imm32s = 1;
2413     }
2414   else if (fits_in_signed_byte (num))
2415     {
2416       t.bitfield.imm8 = 1;
2417       t.bitfield.imm8s = 1;
2418       t.bitfield.imm16 = 1;
2419       t.bitfield.imm32 = 1;
2420       t.bitfield.imm32s = 1;
2421     }
2422   else if (fits_in_unsigned_byte (num))
2423     {
2424       t.bitfield.imm8 = 1;
2425       t.bitfield.imm16 = 1;
2426       t.bitfield.imm32 = 1;
2427       t.bitfield.imm32s = 1;
2428     }
2429   else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2430     {
2431       t.bitfield.imm16 = 1;
2432       t.bitfield.imm32 = 1;
2433       t.bitfield.imm32s = 1;
2434     }
2435   else if (fits_in_signed_long (num))
2436     {
2437       t.bitfield.imm32 = 1;
2438       t.bitfield.imm32s = 1;
2439     }
2440   else if (fits_in_unsigned_long (num))
2441     t.bitfield.imm32 = 1;
2442
2443   return t;
2444 }
2445
2446 static offsetT
2447 offset_in_range (offsetT val, int size)
2448 {
2449   addressT mask;
2450
2451   switch (size)
2452     {
2453     case 1: mask = ((addressT) 1 <<  8) - 1; break;
2454     case 2: mask = ((addressT) 1 << 16) - 1; break;
2455     case 4: mask = ((addressT) 2 << 31) - 1; break;
2456 #ifdef BFD64
2457     case 8: mask = ((addressT) 2 << 63) - 1; break;
2458 #endif
2459     default: abort ();
2460     }
2461
2462 #ifdef BFD64
2463   /* If BFD64, sign extend val for 32bit address mode.  */
2464   if (flag_code != CODE_64BIT
2465       || i.prefix[ADDR_PREFIX])
2466     if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2467       val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2468 #endif
2469
2470   if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2471     {
2472       char buf1[40], buf2[40];
2473
2474       sprint_value (buf1, val);
2475       sprint_value (buf2, val & mask);
2476       as_warn (_("%s shortened to %s"), buf1, buf2);
2477     }
2478   return val & mask;
2479 }
2480
2481 enum PREFIX_GROUP
2482 {
2483   PREFIX_EXIST = 0,
2484   PREFIX_LOCK,
2485   PREFIX_REP,
2486   PREFIX_DS,
2487   PREFIX_OTHER
2488 };
2489
2490 /* Returns
2491    a. PREFIX_EXIST if attempting to add a prefix where one from the
2492    same class already exists.
2493    b. PREFIX_LOCK if lock prefix is added.
2494    c. PREFIX_REP if rep/repne prefix is added.
2495    d. PREFIX_DS if ds prefix is added.
2496    e. PREFIX_OTHER if other prefix is added.
2497  */
2498
2499 static enum PREFIX_GROUP
2500 add_prefix (unsigned int prefix)
2501 {
2502   enum PREFIX_GROUP ret = PREFIX_OTHER;
2503   unsigned int q;
2504
2505   if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2506       && flag_code == CODE_64BIT)
2507     {
2508       if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2509           || (i.prefix[REX_PREFIX] & prefix & REX_R)
2510           || (i.prefix[REX_PREFIX] & prefix & REX_X)
2511           || (i.prefix[REX_PREFIX] & prefix & REX_B))
2512         ret = PREFIX_EXIST;
2513       q = REX_PREFIX;
2514     }
2515   else
2516     {
2517       switch (prefix)
2518         {
2519         default:
2520           abort ();
2521
2522         case DS_PREFIX_OPCODE:
2523           ret = PREFIX_DS;
2524           /* Fall through.  */
2525         case CS_PREFIX_OPCODE:
2526         case ES_PREFIX_OPCODE:
2527         case FS_PREFIX_OPCODE:
2528         case GS_PREFIX_OPCODE:
2529         case SS_PREFIX_OPCODE:
2530           q = SEG_PREFIX;
2531           break;
2532
2533         case REPNE_PREFIX_OPCODE:
2534         case REPE_PREFIX_OPCODE:
2535           q = REP_PREFIX;
2536           ret = PREFIX_REP;
2537           break;
2538
2539         case LOCK_PREFIX_OPCODE:
2540           q = LOCK_PREFIX;
2541           ret = PREFIX_LOCK;
2542           break;
2543
2544         case FWAIT_OPCODE:
2545           q = WAIT_PREFIX;
2546           break;
2547
2548         case ADDR_PREFIX_OPCODE:
2549           q = ADDR_PREFIX;
2550           break;
2551
2552         case DATA_PREFIX_OPCODE:
2553           q = DATA_PREFIX;
2554           break;
2555         }
2556       if (i.prefix[q] != 0)
2557         ret = PREFIX_EXIST;
2558     }
2559
2560   if (ret)
2561     {
2562       if (!i.prefix[q])
2563         ++i.prefixes;
2564       i.prefix[q] |= prefix;
2565     }
2566   else
2567     as_bad (_("same type of prefix used twice"));
2568
2569   return ret;
2570 }
2571
2572 static void
2573 update_code_flag (int value, int check)
2574 {
2575   PRINTF_LIKE ((*as_error));
2576
2577   flag_code = (enum flag_code) value;
2578   if (flag_code == CODE_64BIT)
2579     {
2580       cpu_arch_flags.bitfield.cpu64 = 1;
2581       cpu_arch_flags.bitfield.cpuno64 = 0;
2582     }
2583   else
2584     {
2585       cpu_arch_flags.bitfield.cpu64 = 0;
2586       cpu_arch_flags.bitfield.cpuno64 = 1;
2587     }
2588   if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
2589     {
2590       if (check)
2591         as_error = as_fatal;
2592       else
2593         as_error = as_bad;
2594       (*as_error) (_("64bit mode not supported on `%s'."),
2595                    cpu_arch_name ? cpu_arch_name : default_arch);
2596     }
2597   if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2598     {
2599       if (check)
2600         as_error = as_fatal;
2601       else
2602         as_error = as_bad;
2603       (*as_error) (_("32bit mode not supported on `%s'."),
2604                    cpu_arch_name ? cpu_arch_name : default_arch);
2605     }
2606   stackop_size = '\0';
2607 }
2608
2609 static void
2610 set_code_flag (int value)
2611 {
2612   update_code_flag (value, 0);
2613 }
2614
2615 static void
2616 set_16bit_gcc_code_flag (int new_code_flag)
2617 {
2618   flag_code = (enum flag_code) new_code_flag;
2619   if (flag_code != CODE_16BIT)
2620     abort ();
2621   cpu_arch_flags.bitfield.cpu64 = 0;
2622   cpu_arch_flags.bitfield.cpuno64 = 1;
2623   stackop_size = LONG_MNEM_SUFFIX;
2624 }
2625
2626 static void
2627 set_intel_syntax (int syntax_flag)
2628 {
2629   /* Find out if register prefixing is specified.  */
2630   int ask_naked_reg = 0;
2631
2632   SKIP_WHITESPACE ();
2633   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2634     {
2635       char *string;
2636       int e = get_symbol_name (&string);
2637
2638       if (strcmp (string, "prefix") == 0)
2639         ask_naked_reg = 1;
2640       else if (strcmp (string, "noprefix") == 0)
2641         ask_naked_reg = -1;
2642       else
2643         as_bad (_("bad argument to syntax directive."));
2644       (void) restore_line_pointer (e);
2645     }
2646   demand_empty_rest_of_line ();
2647
2648   intel_syntax = syntax_flag;
2649
2650   if (ask_naked_reg == 0)
2651     allow_naked_reg = (intel_syntax
2652                        && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2653   else
2654     allow_naked_reg = (ask_naked_reg < 0);
2655
2656   expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2657
2658   identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2659   identifier_chars['$'] = intel_syntax ? '$' : 0;
2660   register_prefix = allow_naked_reg ? "" : "%";
2661 }
2662
2663 static void
2664 set_intel_mnemonic (int mnemonic_flag)
2665 {
2666   intel_mnemonic = mnemonic_flag;
2667 }
2668
2669 static void
2670 set_allow_index_reg (int flag)
2671 {
2672   allow_index_reg = flag;
2673 }
2674
2675 static void
2676 set_check (int what)
2677 {
2678   enum check_kind *kind;
2679   const char *str;
2680
2681   if (what)
2682     {
2683       kind = &operand_check;
2684       str = "operand";
2685     }
2686   else
2687     {
2688       kind = &sse_check;
2689       str = "sse";
2690     }
2691
2692   SKIP_WHITESPACE ();
2693
2694   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2695     {
2696       char *string;
2697       int e = get_symbol_name (&string);
2698
2699       if (strcmp (string, "none") == 0)
2700         *kind = check_none;
2701       else if (strcmp (string, "warning") == 0)
2702         *kind = check_warning;
2703       else if (strcmp (string, "error") == 0)
2704         *kind = check_error;
2705       else
2706         as_bad (_("bad argument to %s_check directive."), str);
2707       (void) restore_line_pointer (e);
2708     }
2709   else
2710     as_bad (_("missing argument for %s_check directive"), str);
2711
2712   demand_empty_rest_of_line ();
2713 }
2714
2715 static void
2716 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2717                            i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2718 {
2719 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2720   static const char *arch;
2721
2722   /* Intel LIOM is only supported on ELF.  */
2723   if (!IS_ELF)
2724     return;
2725
2726   if (!arch)
2727     {
2728       /* Use cpu_arch_name if it is set in md_parse_option.  Otherwise
2729          use default_arch.  */
2730       arch = cpu_arch_name;
2731       if (!arch)
2732         arch = default_arch;
2733     }
2734
2735   /* If we are targeting Intel MCU, we must enable it.  */
2736   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2737       || new_flag.bitfield.cpuiamcu)
2738     return;
2739
2740   /* If we are targeting Intel L1OM, we must enable it.  */
2741   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2742       || new_flag.bitfield.cpul1om)
2743     return;
2744
2745   /* If we are targeting Intel K1OM, we must enable it.  */
2746   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2747       || new_flag.bitfield.cpuk1om)
2748     return;
2749
2750   as_bad (_("`%s' is not supported on `%s'"), name, arch);
2751 #endif
2752 }
2753
2754 static void
2755 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2756 {
2757   SKIP_WHITESPACE ();
2758
2759   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2760     {
2761       char *string;
2762       int e = get_symbol_name (&string);
2763       unsigned int j;
2764       i386_cpu_flags flags;
2765
2766       for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2767         {
2768           if (strcmp (string, cpu_arch[j].name) == 0)
2769             {
2770               check_cpu_arch_compatible (string, cpu_arch[j].flags);
2771
2772               if (*string != '.')
2773                 {
2774                   cpu_arch_name = cpu_arch[j].name;
2775                   cpu_sub_arch_name = NULL;
2776                   cpu_arch_flags = cpu_arch[j].flags;
2777                   if (flag_code == CODE_64BIT)
2778                     {
2779                       cpu_arch_flags.bitfield.cpu64 = 1;
2780                       cpu_arch_flags.bitfield.cpuno64 = 0;
2781                     }
2782                   else
2783                     {
2784                       cpu_arch_flags.bitfield.cpu64 = 0;
2785                       cpu_arch_flags.bitfield.cpuno64 = 1;
2786                     }
2787                   cpu_arch_isa = cpu_arch[j].type;
2788                   cpu_arch_isa_flags = cpu_arch[j].flags;
2789                   if (!cpu_arch_tune_set)
2790                     {
2791                       cpu_arch_tune = cpu_arch_isa;
2792                       cpu_arch_tune_flags = cpu_arch_isa_flags;
2793                     }
2794                   break;
2795                 }
2796
2797               flags = cpu_flags_or (cpu_arch_flags,
2798                                     cpu_arch[j].flags);
2799
2800               if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2801                 {
2802                   if (cpu_sub_arch_name)
2803                     {
2804                       char *name = cpu_sub_arch_name;
2805                       cpu_sub_arch_name = concat (name,
2806                                                   cpu_arch[j].name,
2807                                                   (const char *) NULL);
2808                       free (name);
2809                     }
2810                   else
2811                     cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2812                   cpu_arch_flags = flags;
2813                   cpu_arch_isa_flags = flags;
2814                 }
2815               else
2816                 cpu_arch_isa_flags
2817                   = cpu_flags_or (cpu_arch_isa_flags,
2818                                   cpu_arch[j].flags);
2819               (void) restore_line_pointer (e);
2820               demand_empty_rest_of_line ();
2821               return;
2822             }
2823         }
2824
2825       if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2826         {
2827           /* Disable an ISA extension.  */
2828           for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2829             if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2830               {
2831                 flags = cpu_flags_and_not (cpu_arch_flags,
2832                                            cpu_noarch[j].flags);
2833                 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2834                   {
2835                     if (cpu_sub_arch_name)
2836                       {
2837                         char *name = cpu_sub_arch_name;
2838                         cpu_sub_arch_name = concat (name, string,
2839                                                     (const char *) NULL);
2840                         free (name);
2841                       }
2842                     else
2843                       cpu_sub_arch_name = xstrdup (string);
2844                     cpu_arch_flags = flags;
2845                     cpu_arch_isa_flags = flags;
2846                   }
2847                 (void) restore_line_pointer (e);
2848                 demand_empty_rest_of_line ();
2849                 return;
2850               }
2851
2852           j = ARRAY_SIZE (cpu_arch);
2853         }
2854
2855       if (j >= ARRAY_SIZE (cpu_arch))
2856         as_bad (_("no such architecture: `%s'"), string);
2857
2858       *input_line_pointer = e;
2859     }
2860   else
2861     as_bad (_("missing cpu architecture"));
2862
2863   no_cond_jump_promotion = 0;
2864   if (*input_line_pointer == ','
2865       && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2866     {
2867       char *string;
2868       char e;
2869
2870       ++input_line_pointer;
2871       e = get_symbol_name (&string);
2872
2873       if (strcmp (string, "nojumps") == 0)
2874         no_cond_jump_promotion = 1;
2875       else if (strcmp (string, "jumps") == 0)
2876         ;
2877       else
2878         as_bad (_("no such architecture modifier: `%s'"), string);
2879
2880       (void) restore_line_pointer (e);
2881     }
2882
2883   demand_empty_rest_of_line ();
2884 }
2885
2886 enum bfd_architecture
2887 i386_arch (void)
2888 {
2889   if (cpu_arch_isa == PROCESSOR_L1OM)
2890     {
2891       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2892           || flag_code != CODE_64BIT)
2893         as_fatal (_("Intel L1OM is 64bit ELF only"));
2894       return bfd_arch_l1om;
2895     }
2896   else if (cpu_arch_isa == PROCESSOR_K1OM)
2897     {
2898       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2899           || flag_code != CODE_64BIT)
2900         as_fatal (_("Intel K1OM is 64bit ELF only"));
2901       return bfd_arch_k1om;
2902     }
2903   else if (cpu_arch_isa == PROCESSOR_IAMCU)
2904     {
2905       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2906           || flag_code == CODE_64BIT)
2907         as_fatal (_("Intel MCU is 32bit ELF only"));
2908       return bfd_arch_iamcu;
2909     }
2910   else
2911     return bfd_arch_i386;
2912 }
2913
2914 unsigned long
2915 i386_mach (void)
2916 {
2917   if (!strncmp (default_arch, "x86_64", 6))
2918     {
2919       if (cpu_arch_isa == PROCESSOR_L1OM)
2920         {
2921           if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2922               || default_arch[6] != '\0')
2923             as_fatal (_("Intel L1OM is 64bit ELF only"));
2924           return bfd_mach_l1om;
2925         }
2926       else if (cpu_arch_isa == PROCESSOR_K1OM)
2927         {
2928           if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2929               || default_arch[6] != '\0')
2930             as_fatal (_("Intel K1OM is 64bit ELF only"));
2931           return bfd_mach_k1om;
2932         }
2933       else if (default_arch[6] == '\0')
2934         return bfd_mach_x86_64;
2935       else
2936         return bfd_mach_x64_32;
2937     }
2938   else if (!strcmp (default_arch, "i386")
2939            || !strcmp (default_arch, "iamcu"))
2940     {
2941       if (cpu_arch_isa == PROCESSOR_IAMCU)
2942         {
2943           if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
2944             as_fatal (_("Intel MCU is 32bit ELF only"));
2945           return bfd_mach_i386_iamcu;
2946         }
2947       else
2948         return bfd_mach_i386_i386;
2949     }
2950   else
2951     as_fatal (_("unknown architecture"));
2952 }
2953 \f
2954 void
2955 md_begin (void)
2956 {
2957   const char *hash_err;
2958
2959   /* Support pseudo prefixes like {disp32}.  */
2960   lex_type ['{'] = LEX_BEGIN_NAME;
2961
2962   /* Initialize op_hash hash table.  */
2963   op_hash = hash_new ();
2964
2965   {
2966     const insn_template *optab;
2967     templates *core_optab;
2968
2969     /* Setup for loop.  */
2970     optab = i386_optab;
2971     core_optab = XNEW (templates);
2972     core_optab->start = optab;
2973
2974     while (1)
2975       {
2976         ++optab;
2977         if (optab->name == NULL
2978             || strcmp (optab->name, (optab - 1)->name) != 0)
2979           {
2980             /* different name --> ship out current template list;
2981                add to hash table; & begin anew.  */
2982             core_optab->end = optab;
2983             hash_err = hash_insert (op_hash,
2984                                     (optab - 1)->name,
2985                                     (void *) core_optab);
2986             if (hash_err)
2987               {
2988                 as_fatal (_("can't hash %s: %s"),
2989                           (optab - 1)->name,
2990                           hash_err);
2991               }
2992             if (optab->name == NULL)
2993               break;
2994             core_optab = XNEW (templates);
2995             core_optab->start = optab;
2996           }
2997       }
2998   }
2999
3000   /* Initialize reg_hash hash table.  */
3001   reg_hash = hash_new ();
3002   {
3003     const reg_entry *regtab;
3004     unsigned int regtab_size = i386_regtab_size;
3005
3006     for (regtab = i386_regtab; regtab_size--; regtab++)
3007       {
3008         hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
3009         if (hash_err)
3010           as_fatal (_("can't hash %s: %s"),
3011                     regtab->reg_name,
3012                     hash_err);
3013       }
3014   }
3015
3016   /* Fill in lexical tables:  mnemonic_chars, operand_chars.  */
3017   {
3018     int c;
3019     char *p;
3020
3021     for (c = 0; c < 256; c++)
3022       {
3023         if (ISDIGIT (c))
3024           {
3025             digit_chars[c] = c;
3026             mnemonic_chars[c] = c;
3027             register_chars[c] = c;
3028             operand_chars[c] = c;
3029           }
3030         else if (ISLOWER (c))
3031           {
3032             mnemonic_chars[c] = c;
3033             register_chars[c] = c;
3034             operand_chars[c] = c;
3035           }
3036         else if (ISUPPER (c))
3037           {
3038             mnemonic_chars[c] = TOLOWER (c);
3039             register_chars[c] = mnemonic_chars[c];
3040             operand_chars[c] = c;
3041           }
3042         else if (c == '{' || c == '}')
3043           {
3044             mnemonic_chars[c] = c;
3045             operand_chars[c] = c;
3046           }
3047
3048         if (ISALPHA (c) || ISDIGIT (c))
3049           identifier_chars[c] = c;
3050         else if (c >= 128)
3051           {
3052             identifier_chars[c] = c;
3053             operand_chars[c] = c;
3054           }
3055       }
3056
3057 #ifdef LEX_AT
3058     identifier_chars['@'] = '@';
3059 #endif
3060 #ifdef LEX_QM
3061     identifier_chars['?'] = '?';
3062     operand_chars['?'] = '?';
3063 #endif
3064     digit_chars['-'] = '-';
3065     mnemonic_chars['_'] = '_';
3066     mnemonic_chars['-'] = '-';
3067     mnemonic_chars['.'] = '.';
3068     identifier_chars['_'] = '_';
3069     identifier_chars['.'] = '.';
3070
3071     for (p = operand_special_chars; *p != '\0'; p++)
3072       operand_chars[(unsigned char) *p] = *p;
3073   }
3074
3075   if (flag_code == CODE_64BIT)
3076     {
3077 #if defined (OBJ_COFF) && defined (TE_PE)
3078       x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3079                                   ? 32 : 16);
3080 #else
3081       x86_dwarf2_return_column = 16;
3082 #endif
3083       x86_cie_data_alignment = -8;
3084     }
3085   else
3086     {
3087       x86_dwarf2_return_column = 8;
3088       x86_cie_data_alignment = -4;
3089     }
3090
3091   /* NB: FUSED_JCC_PADDING frag must have sufficient room so that it
3092      can be turned into BRANCH_PREFIX frag.  */
3093   if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3094     abort ();
3095 }
3096
3097 void
3098 i386_print_statistics (FILE *file)
3099 {
3100   hash_print_statistics (file, "i386 opcode", op_hash);
3101   hash_print_statistics (file, "i386 register", reg_hash);
3102 }
3103 \f
3104 #ifdef DEBUG386
3105
3106 /* Debugging routines for md_assemble.  */
3107 static void pte (insn_template *);
3108 static void pt (i386_operand_type);
3109 static void pe (expressionS *);
3110 static void ps (symbolS *);
3111
3112 static void
3113 pi (const char *line, i386_insn *x)
3114 {
3115   unsigned int j;
3116
3117   fprintf (stdout, "%s: template ", line);
3118   pte (&x->tm);
3119   fprintf (stdout, "  address: base %s  index %s  scale %x\n",
3120            x->base_reg ? x->base_reg->reg_name : "none",
3121            x->index_reg ? x->index_reg->reg_name : "none",
3122            x->log2_scale_factor);
3123   fprintf (stdout, "  modrm:  mode %x  reg %x  reg/mem %x\n",
3124            x->rm.mode, x->rm.reg, x->rm.regmem);
3125   fprintf (stdout, "  sib:  base %x  index %x  scale %x\n",
3126            x->sib.base, x->sib.index, x->sib.scale);
3127   fprintf (stdout, "  rex: 64bit %x  extX %x  extY %x  extZ %x\n",
3128            (x->rex & REX_W) != 0,
3129            (x->rex & REX_R) != 0,
3130            (x->rex & REX_X) != 0,
3131            (x->rex & REX_B) != 0);
3132   for (j = 0; j < x->operands; j++)
3133     {
3134       fprintf (stdout, "    #%d:  ", j + 1);
3135       pt (x->types[j]);
3136       fprintf (stdout, "\n");
3137       if (x->types[j].bitfield.class == Reg
3138           || x->types[j].bitfield.class == RegMMX
3139           || x->types[j].bitfield.class == RegSIMD
3140           || x->types[j].bitfield.class == SReg
3141           || x->types[j].bitfield.class == RegCR
3142           || x->types[j].bitfield.class == RegDR
3143           || x->types[j].bitfield.class == RegTR)
3144         fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3145       if (operand_type_check (x->types[j], imm))
3146         pe (x->op[j].imms);
3147       if (operand_type_check (x->types[j], disp))
3148         pe (x->op[j].disps);
3149     }
3150 }
3151
3152 static void
3153 pte (insn_template *t)
3154 {
3155   unsigned int j;
3156   fprintf (stdout, " %d operands ", t->operands);
3157   fprintf (stdout, "opcode %x ", t->base_opcode);
3158   if (t->extension_opcode != None)
3159     fprintf (stdout, "ext %x ", t->extension_opcode);
3160   if (t->opcode_modifier.d)
3161     fprintf (stdout, "D");
3162   if (t->opcode_modifier.w)
3163     fprintf (stdout, "W");
3164   fprintf (stdout, "\n");
3165   for (j = 0; j < t->operands; j++)
3166     {
3167       fprintf (stdout, "    #%d type ", j + 1);
3168       pt (t->operand_types[j]);
3169       fprintf (stdout, "\n");
3170     }
3171 }
3172
3173 static void
3174 pe (expressionS *e)
3175 {
3176   fprintf (stdout, "    operation     %d\n", e->X_op);
3177   fprintf (stdout, "    add_number    %ld (%lx)\n",
3178            (long) e->X_add_number, (long) e->X_add_number);
3179   if (e->X_add_symbol)
3180     {
3181       fprintf (stdout, "    add_symbol    ");
3182       ps (e->X_add_symbol);
3183       fprintf (stdout, "\n");
3184     }
3185   if (e->X_op_symbol)
3186     {
3187       fprintf (stdout, "    op_symbol    ");
3188       ps (e->X_op_symbol);
3189       fprintf (stdout, "\n");
3190     }
3191 }
3192
3193 static void
3194 ps (symbolS *s)
3195 {
3196   fprintf (stdout, "%s type %s%s",
3197            S_GET_NAME (s),
3198            S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3199            segment_name (S_GET_SEGMENT (s)));
3200 }
3201
3202 static struct type_name
3203   {
3204     i386_operand_type mask;
3205     const char *name;
3206   }
3207 const type_names[] =
3208 {
3209   { OPERAND_TYPE_REG8, "r8" },
3210   { OPERAND_TYPE_REG16, "r16" },
3211   { OPERAND_TYPE_REG32, "r32" },
3212   { OPERAND_TYPE_REG64, "r64" },
3213   { OPERAND_TYPE_ACC8, "acc8" },
3214   { OPERAND_TYPE_ACC16, "acc16" },
3215   { OPERAND_TYPE_ACC32, "acc32" },
3216   { OPERAND_TYPE_ACC64, "acc64" },
3217   { OPERAND_TYPE_IMM8, "i8" },
3218   { OPERAND_TYPE_IMM8, "i8s" },
3219   { OPERAND_TYPE_IMM16, "i16" },
3220   { OPERAND_TYPE_IMM32, "i32" },
3221   { OPERAND_TYPE_IMM32S, "i32s" },
3222   { OPERAND_TYPE_IMM64, "i64" },
3223   { OPERAND_TYPE_IMM1, "i1" },
3224   { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3225   { OPERAND_TYPE_DISP8, "d8" },
3226   { OPERAND_TYPE_DISP16, "d16" },
3227   { OPERAND_TYPE_DISP32, "d32" },
3228   { OPERAND_TYPE_DISP32S, "d32s" },
3229   { OPERAND_TYPE_DISP64, "d64" },
3230   { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3231   { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3232   { OPERAND_TYPE_CONTROL, "control reg" },
3233   { OPERAND_TYPE_TEST, "test reg" },
3234   { OPERAND_TYPE_DEBUG, "debug reg" },
3235   { OPERAND_TYPE_FLOATREG, "FReg" },
3236   { OPERAND_TYPE_FLOATACC, "FAcc" },
3237   { OPERAND_TYPE_SREG, "SReg" },
3238   { OPERAND_TYPE_REGMMX, "rMMX" },
3239   { OPERAND_TYPE_REGXMM, "rXMM" },
3240   { OPERAND_TYPE_REGYMM, "rYMM" },
3241   { OPERAND_TYPE_REGZMM, "rZMM" },
3242   { OPERAND_TYPE_REGMASK, "Mask reg" },
3243 };
3244
3245 static void
3246 pt (i386_operand_type t)
3247 {
3248   unsigned int j;
3249   i386_operand_type a;
3250
3251   for (j = 0; j < ARRAY_SIZE (type_names); j++)
3252     {
3253       a = operand_type_and (t, type_names[j].mask);
3254       if (operand_type_equal (&a, &type_names[j].mask))
3255         fprintf (stdout, "%s, ",  type_names[j].name);
3256     }
3257   fflush (stdout);
3258 }
3259
3260 #endif /* DEBUG386 */
3261 \f
3262 static bfd_reloc_code_real_type
3263 reloc (unsigned int size,
3264        int pcrel,
3265        int sign,
3266        bfd_reloc_code_real_type other)
3267 {
3268   if (other != NO_RELOC)
3269     {
3270       reloc_howto_type *rel;
3271
3272       if (size == 8)
3273         switch (other)
3274           {
3275           case BFD_RELOC_X86_64_GOT32:
3276             return BFD_RELOC_X86_64_GOT64;
3277             break;
3278           case BFD_RELOC_X86_64_GOTPLT64:
3279             return BFD_RELOC_X86_64_GOTPLT64;
3280             break;
3281           case BFD_RELOC_X86_64_PLTOFF64:
3282             return BFD_RELOC_X86_64_PLTOFF64;
3283             break;
3284           case BFD_RELOC_X86_64_GOTPC32:
3285             other = BFD_RELOC_X86_64_GOTPC64;
3286             break;
3287           case BFD_RELOC_X86_64_GOTPCREL:
3288             other = BFD_RELOC_X86_64_GOTPCREL64;
3289             break;
3290           case BFD_RELOC_X86_64_TPOFF32:
3291             other = BFD_RELOC_X86_64_TPOFF64;
3292             break;
3293           case BFD_RELOC_X86_64_DTPOFF32:
3294             other = BFD_RELOC_X86_64_DTPOFF64;
3295             break;
3296           default:
3297             break;
3298           }
3299
3300 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3301       if (other == BFD_RELOC_SIZE32)
3302         {
3303           if (size == 8)
3304             other = BFD_RELOC_SIZE64;
3305           if (pcrel)
3306             {
3307               as_bad (_("there are no pc-relative size relocations"));
3308               return NO_RELOC;
3309             }
3310         }
3311 #endif
3312
3313       /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless.  */
3314       if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3315         sign = -1;
3316
3317       rel = bfd_reloc_type_lookup (stdoutput, other);
3318       if (!rel)
3319         as_bad (_("unknown relocation (%u)"), other);
3320       else if (size != bfd_get_reloc_size (rel))
3321         as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3322                 bfd_get_reloc_size (rel),
3323                 size);
3324       else if (pcrel && !rel->pc_relative)
3325         as_bad (_("non-pc-relative relocation for pc-relative field"));
3326       else if ((rel->complain_on_overflow == complain_overflow_signed
3327                 && !sign)
3328                || (rel->complain_on_overflow == complain_overflow_unsigned
3329                    && sign > 0))
3330         as_bad (_("relocated field and relocation type differ in signedness"));
3331       else
3332         return other;
3333       return NO_RELOC;
3334     }
3335
3336   if (pcrel)
3337     {
3338       if (!sign)
3339         as_bad (_("there are no unsigned pc-relative relocations"));
3340       switch (size)
3341         {
3342         case 1: return BFD_RELOC_8_PCREL;
3343         case 2: return BFD_RELOC_16_PCREL;
3344         case 4: return BFD_RELOC_32_PCREL;
3345         case 8: return BFD_RELOC_64_PCREL;
3346         }
3347       as_bad (_("cannot do %u byte pc-relative relocation"), size);
3348     }
3349   else
3350     {
3351       if (sign > 0)
3352         switch (size)
3353           {
3354           case 4: return BFD_RELOC_X86_64_32S;
3355           }
3356       else
3357         switch (size)
3358           {
3359           case 1: return BFD_RELOC_8;
3360           case 2: return BFD_RELOC_16;
3361           case 4: return BFD_RELOC_32;
3362           case 8: return BFD_RELOC_64;
3363           }
3364       as_bad (_("cannot do %s %u byte relocation"),
3365               sign > 0 ? "signed" : "unsigned", size);
3366     }
3367
3368   return NO_RELOC;
3369 }
3370
3371 /* Here we decide which fixups can be adjusted to make them relative to
3372    the beginning of the section instead of the symbol.  Basically we need
3373    to make sure that the dynamic relocations are done correctly, so in
3374    some cases we force the original symbol to be used.  */
3375
3376 int
3377 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3378 {
3379 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3380   if (!IS_ELF)
3381     return 1;
3382
3383   /* Don't adjust pc-relative references to merge sections in 64-bit
3384      mode.  */
3385   if (use_rela_relocations
3386       && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3387       && fixP->fx_pcrel)
3388     return 0;
3389
3390   /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3391      and changed later by validate_fix.  */
3392   if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3393       && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3394     return 0;
3395
3396   /* Adjust_reloc_syms doesn't know about the GOT.  Need to keep symbol
3397      for size relocations.  */
3398   if (fixP->fx_r_type == BFD_RELOC_SIZE32
3399       || fixP->fx_r_type == BFD_RELOC_SIZE64
3400       || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3401       || fixP->fx_r_type == BFD_RELOC_386_GOT32
3402       || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3403       || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3404       || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3405       || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3406       || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3407       || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3408       || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3409       || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3410       || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3411       || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3412       || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3413       || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3414       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3415       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3416       || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3417       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3418       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3419       || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3420       || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3421       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3422       || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3423       || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3424       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3425       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3426       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3427       || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3428       || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3429     return 0;
3430 #endif
3431   return 1;
3432 }
3433
3434 static int
3435 intel_float_operand (const char *mnemonic)
3436 {
3437   /* Note that the value returned is meaningful only for opcodes with (memory)
3438      operands, hence the code here is free to improperly handle opcodes that
3439      have no operands (for better performance and smaller code). */
3440
3441   if (mnemonic[0] != 'f')
3442     return 0; /* non-math */
3443
3444   switch (mnemonic[1])
3445     {
3446     /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3447        the fs segment override prefix not currently handled because no
3448        call path can make opcodes without operands get here */
3449     case 'i':
3450       return 2 /* integer op */;
3451     case 'l':
3452       if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3453         return 3; /* fldcw/fldenv */
3454       break;
3455     case 'n':
3456       if (mnemonic[2] != 'o' /* fnop */)
3457         return 3; /* non-waiting control op */
3458       break;
3459     case 'r':
3460       if (mnemonic[2] == 's')
3461         return 3; /* frstor/frstpm */
3462       break;
3463     case 's':
3464       if (mnemonic[2] == 'a')
3465         return 3; /* fsave */
3466       if (mnemonic[2] == 't')
3467         {
3468           switch (mnemonic[3])
3469             {
3470             case 'c': /* fstcw */
3471             case 'd': /* fstdw */
3472             case 'e': /* fstenv */
3473             case 's': /* fsts[gw] */
3474               return 3;
3475             }
3476         }
3477       break;
3478     case 'x':
3479       if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3480         return 0; /* fxsave/fxrstor are not really math ops */
3481       break;
3482     }
3483
3484   return 1;
3485 }
3486
3487 /* Build the VEX prefix.  */
3488
3489 static void
3490 build_vex_prefix (const insn_template *t)
3491 {
3492   unsigned int register_specifier;
3493   unsigned int implied_prefix;
3494   unsigned int vector_length;
3495   unsigned int w;
3496
3497   /* Check register specifier.  */
3498   if (i.vex.register_specifier)
3499     {
3500       register_specifier =
3501         ~register_number (i.vex.register_specifier) & 0xf;
3502       gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3503     }
3504   else
3505     register_specifier = 0xf;
3506
3507   /* Use 2-byte VEX prefix by swapping destination and source operand
3508      if there are more than 1 register operand.  */
3509   if (i.reg_operands > 1
3510       && i.vec_encoding != vex_encoding_vex3
3511       && i.dir_encoding == dir_encoding_default
3512       && i.operands == i.reg_operands
3513       && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3514       && i.tm.opcode_modifier.vexopcode == VEX0F
3515       && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3516       && i.rex == REX_B)
3517     {
3518       unsigned int xchg = i.operands - 1;
3519       union i386_op temp_op;
3520       i386_operand_type temp_type;
3521
3522       temp_type = i.types[xchg];
3523       i.types[xchg] = i.types[0];
3524       i.types[0] = temp_type;
3525       temp_op = i.op[xchg];
3526       i.op[xchg] = i.op[0];
3527       i.op[0] = temp_op;
3528
3529       gas_assert (i.rm.mode == 3);
3530
3531       i.rex = REX_R;
3532       xchg = i.rm.regmem;
3533       i.rm.regmem = i.rm.reg;
3534       i.rm.reg = xchg;
3535
3536       if (i.tm.opcode_modifier.d)
3537         i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3538                             ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3539       else /* Use the next insn.  */
3540         i.tm = t[1];
3541     }
3542
3543   /* Use 2-byte VEX prefix by swapping commutative source operands if there
3544      are no memory operands and at least 3 register ones.  */
3545   if (i.reg_operands >= 3
3546       && i.vec_encoding != vex_encoding_vex3
3547       && i.reg_operands == i.operands - i.imm_operands
3548       && i.tm.opcode_modifier.vex
3549       && i.tm.opcode_modifier.commutative
3550       && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3551       && i.rex == REX_B
3552       && i.vex.register_specifier
3553       && !(i.vex.register_specifier->reg_flags & RegRex))
3554     {
3555       unsigned int xchg = i.operands - i.reg_operands;
3556       union i386_op temp_op;
3557       i386_operand_type temp_type;
3558
3559       gas_assert (i.tm.opcode_modifier.vexopcode == VEX0F);
3560       gas_assert (!i.tm.opcode_modifier.sae);
3561       gas_assert (operand_type_equal (&i.types[i.operands - 2],
3562                                       &i.types[i.operands - 3]));
3563       gas_assert (i.rm.mode == 3);
3564
3565       temp_type = i.types[xchg];
3566       i.types[xchg] = i.types[xchg + 1];
3567       i.types[xchg + 1] = temp_type;
3568       temp_op = i.op[xchg];
3569       i.op[xchg] = i.op[xchg + 1];
3570       i.op[xchg + 1] = temp_op;
3571
3572       i.rex = 0;
3573       xchg = i.rm.regmem | 8;
3574       i.rm.regmem = ~register_specifier & 0xf;
3575       gas_assert (!(i.rm.regmem & 8));
3576       i.vex.register_specifier += xchg - i.rm.regmem;
3577       register_specifier = ~xchg & 0xf;
3578     }
3579
3580   if (i.tm.opcode_modifier.vex == VEXScalar)
3581     vector_length = avxscalar;
3582   else if (i.tm.opcode_modifier.vex == VEX256)
3583     vector_length = 1;
3584   else
3585     {
3586       unsigned int op;
3587
3588       /* Determine vector length from the last multi-length vector
3589          operand.  */
3590       vector_length = 0;
3591       for (op = t->operands; op--;)
3592         if (t->operand_types[op].bitfield.xmmword
3593             && t->operand_types[op].bitfield.ymmword
3594             && i.types[op].bitfield.ymmword)
3595           {
3596             vector_length = 1;
3597             break;
3598           }
3599     }
3600
3601   switch ((i.tm.base_opcode >> 8) & 0xff)
3602     {
3603     case 0:
3604       implied_prefix = 0;
3605       break;
3606     case DATA_PREFIX_OPCODE:
3607       implied_prefix = 1;
3608       break;
3609     case REPE_PREFIX_OPCODE:
3610       implied_prefix = 2;
3611       break;
3612     case REPNE_PREFIX_OPCODE:
3613       implied_prefix = 3;
3614       break;
3615     default:
3616       abort ();
3617     }
3618
3619   /* Check the REX.W bit and VEXW.  */
3620   if (i.tm.opcode_modifier.vexw == VEXWIG)
3621     w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3622   else if (i.tm.opcode_modifier.vexw)
3623     w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3624   else
3625     w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3626
3627   /* Use 2-byte VEX prefix if possible.  */
3628   if (w == 0
3629       && i.vec_encoding != vex_encoding_vex3
3630       && i.tm.opcode_modifier.vexopcode == VEX0F
3631       && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3632     {
3633       /* 2-byte VEX prefix.  */
3634       unsigned int r;
3635
3636       i.vex.length = 2;
3637       i.vex.bytes[0] = 0xc5;
3638
3639       /* Check the REX.R bit.  */
3640       r = (i.rex & REX_R) ? 0 : 1;
3641       i.vex.bytes[1] = (r << 7
3642                         | register_specifier << 3
3643                         | vector_length << 2
3644                         | implied_prefix);
3645     }
3646   else
3647     {
3648       /* 3-byte VEX prefix.  */
3649       unsigned int m;
3650
3651       i.vex.length = 3;
3652
3653       switch (i.tm.opcode_modifier.vexopcode)
3654         {
3655         case VEX0F:
3656           m = 0x1;
3657           i.vex.bytes[0] = 0xc4;
3658           break;
3659         case VEX0F38:
3660           m = 0x2;
3661           i.vex.bytes[0] = 0xc4;
3662           break;
3663         case VEX0F3A:
3664           m = 0x3;
3665           i.vex.bytes[0] = 0xc4;
3666           break;
3667         case XOP08:
3668           m = 0x8;
3669           i.vex.bytes[0] = 0x8f;
3670           break;
3671         case XOP09:
3672           m = 0x9;
3673           i.vex.bytes[0] = 0x8f;
3674           break;
3675         case XOP0A:
3676           m = 0xa;
3677           i.vex.bytes[0] = 0x8f;
3678           break;
3679         default:
3680           abort ();
3681         }
3682
3683       /* The high 3 bits of the second VEX byte are 1's compliment
3684          of RXB bits from REX.  */
3685       i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3686
3687       i.vex.bytes[2] = (w << 7
3688                         | register_specifier << 3
3689                         | vector_length << 2
3690                         | implied_prefix);
3691     }
3692 }
3693
3694 static INLINE bfd_boolean
3695 is_evex_encoding (const insn_template *t)
3696 {
3697   return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3698          || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3699          || t->opcode_modifier.sae;
3700 }
3701
3702 static INLINE bfd_boolean
3703 is_any_vex_encoding (const insn_template *t)
3704 {
3705   return t->opcode_modifier.vex || t->opcode_modifier.vexopcode
3706          || is_evex_encoding (t);
3707 }
3708
3709 /* Build the EVEX prefix.  */
3710
3711 static void
3712 build_evex_prefix (void)
3713 {
3714   unsigned int register_specifier;
3715   unsigned int implied_prefix;
3716   unsigned int m, w;
3717   rex_byte vrex_used = 0;
3718
3719   /* Check register specifier.  */
3720   if (i.vex.register_specifier)
3721     {
3722       gas_assert ((i.vrex & REX_X) == 0);
3723
3724       register_specifier = i.vex.register_specifier->reg_num;
3725       if ((i.vex.register_specifier->reg_flags & RegRex))
3726         register_specifier += 8;
3727       /* The upper 16 registers are encoded in the fourth byte of the
3728          EVEX prefix.  */
3729       if (!(i.vex.register_specifier->reg_flags & RegVRex))
3730         i.vex.bytes[3] = 0x8;
3731       register_specifier = ~register_specifier & 0xf;
3732     }
3733   else
3734     {
3735       register_specifier = 0xf;
3736
3737       /* Encode upper 16 vector index register in the fourth byte of
3738          the EVEX prefix.  */
3739       if (!(i.vrex & REX_X))
3740         i.vex.bytes[3] = 0x8;
3741       else
3742         vrex_used |= REX_X;
3743     }
3744
3745   switch ((i.tm.base_opcode >> 8) & 0xff)
3746     {
3747     case 0:
3748       implied_prefix = 0;
3749       break;
3750     case DATA_PREFIX_OPCODE:
3751       implied_prefix = 1;
3752       break;
3753     case REPE_PREFIX_OPCODE:
3754       implied_prefix = 2;
3755       break;
3756     case REPNE_PREFIX_OPCODE:
3757       implied_prefix = 3;
3758       break;
3759     default:
3760       abort ();
3761     }
3762
3763   /* 4 byte EVEX prefix.  */
3764   i.vex.length = 4;
3765   i.vex.bytes[0] = 0x62;
3766
3767   /* mmmm bits.  */
3768   switch (i.tm.opcode_modifier.vexopcode)
3769     {
3770     case VEX0F:
3771       m = 1;
3772       break;
3773     case VEX0F38:
3774       m = 2;
3775       break;
3776     case VEX0F3A:
3777       m = 3;
3778       break;
3779     default:
3780       abort ();
3781       break;
3782     }
3783
3784   /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3785      bits from REX.  */
3786   i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3787
3788   /* The fifth bit of the second EVEX byte is 1's compliment of the
3789      REX_R bit in VREX.  */
3790   if (!(i.vrex & REX_R))
3791     i.vex.bytes[1] |= 0x10;
3792   else
3793     vrex_used |= REX_R;
3794
3795   if ((i.reg_operands + i.imm_operands) == i.operands)
3796     {
3797       /* When all operands are registers, the REX_X bit in REX is not
3798          used.  We reuse it to encode the upper 16 registers, which is
3799          indicated by the REX_B bit in VREX.  The REX_X bit is encoded
3800          as 1's compliment.  */
3801       if ((i.vrex & REX_B))
3802         {
3803           vrex_used |= REX_B;
3804           i.vex.bytes[1] &= ~0x40;
3805         }
3806     }
3807
3808   /* EVEX instructions shouldn't need the REX prefix.  */
3809   i.vrex &= ~vrex_used;
3810   gas_assert (i.vrex == 0);
3811
3812   /* Check the REX.W bit and VEXW.  */
3813   if (i.tm.opcode_modifier.vexw == VEXWIG)
3814     w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3815   else if (i.tm.opcode_modifier.vexw)
3816     w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3817   else
3818     w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3819
3820   /* Encode the U bit.  */
3821   implied_prefix |= 0x4;
3822
3823   /* The third byte of the EVEX prefix.  */
3824   i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3825
3826   /* The fourth byte of the EVEX prefix.  */
3827   /* The zeroing-masking bit.  */
3828   if (i.mask && i.mask->zeroing)
3829     i.vex.bytes[3] |= 0x80;
3830
3831   /* Don't always set the broadcast bit if there is no RC.  */
3832   if (!i.rounding)
3833     {
3834       /* Encode the vector length.  */
3835       unsigned int vec_length;
3836
3837       if (!i.tm.opcode_modifier.evex
3838           || i.tm.opcode_modifier.evex == EVEXDYN)
3839         {
3840           unsigned int op;
3841
3842           /* Determine vector length from the last multi-length vector
3843              operand.  */
3844           vec_length = 0;
3845           for (op = i.operands; op--;)
3846             if (i.tm.operand_types[op].bitfield.xmmword
3847                 + i.tm.operand_types[op].bitfield.ymmword
3848                 + i.tm.operand_types[op].bitfield.zmmword > 1)
3849               {
3850                 if (i.types[op].bitfield.zmmword)
3851                   {
3852                     i.tm.opcode_modifier.evex = EVEX512;
3853                     break;
3854                   }
3855                 else if (i.types[op].bitfield.ymmword)
3856                   {
3857                     i.tm.opcode_modifier.evex = EVEX256;
3858                     break;
3859                   }
3860                 else if (i.types[op].bitfield.xmmword)
3861                   {
3862                     i.tm.opcode_modifier.evex = EVEX128;
3863                     break;
3864                   }
3865                 else if (i.broadcast && (int) op == i.broadcast->operand)
3866                   {
3867                     switch (i.broadcast->bytes)
3868                       {
3869                         case 64:
3870                           i.tm.opcode_modifier.evex = EVEX512;
3871                           break;
3872                         case 32:
3873                           i.tm.opcode_modifier.evex = EVEX256;
3874                           break;
3875                         case 16:
3876                           i.tm.opcode_modifier.evex = EVEX128;
3877                           break;
3878                         default:
3879                           abort ();
3880                       }
3881                     break;
3882                   }
3883               }
3884
3885           if (op >= MAX_OPERANDS)
3886             abort ();
3887         }
3888
3889       switch (i.tm.opcode_modifier.evex)
3890         {
3891         case EVEXLIG: /* LL' is ignored */
3892           vec_length = evexlig << 5;
3893           break;
3894         case EVEX128:
3895           vec_length = 0 << 5;
3896           break;
3897         case EVEX256:
3898           vec_length = 1 << 5;
3899           break;
3900         case EVEX512:
3901           vec_length = 2 << 5;
3902           break;
3903         default:
3904           abort ();
3905           break;
3906         }
3907       i.vex.bytes[3] |= vec_length;
3908       /* Encode the broadcast bit.  */
3909       if (i.broadcast)
3910         i.vex.bytes[3] |= 0x10;
3911     }
3912   else
3913     {
3914       if (i.rounding->type != saeonly)
3915         i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3916       else
3917         i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3918     }
3919
3920   if (i.mask && i.mask->mask)
3921     i.vex.bytes[3] |= i.mask->mask->reg_num;
3922 }
3923
3924 static void
3925 process_immext (void)
3926 {
3927   expressionS *exp;
3928
3929   /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3930      which is coded in the same place as an 8-bit immediate field
3931      would be.  Here we fake an 8-bit immediate operand from the
3932      opcode suffix stored in tm.extension_opcode.
3933
3934      AVX instructions also use this encoding, for some of
3935      3 argument instructions.  */
3936
3937   gas_assert (i.imm_operands <= 1
3938               && (i.operands <= 2
3939                   || (is_any_vex_encoding (&i.tm)
3940                       && i.operands <= 4)));
3941
3942   exp = &im_expressions[i.imm_operands++];
3943   i.op[i.operands].imms = exp;
3944   i.types[i.operands] = imm8;
3945   i.operands++;
3946   exp->X_op = O_constant;
3947   exp->X_add_number = i.tm.extension_opcode;
3948   i.tm.extension_opcode = None;
3949 }
3950
3951
3952 static int
3953 check_hle (void)
3954 {
3955   switch (i.tm.opcode_modifier.hleprefixok)
3956     {
3957     default:
3958       abort ();
3959     case HLEPrefixNone:
3960       as_bad (_("invalid instruction `%s' after `%s'"),
3961               i.tm.name, i.hle_prefix);
3962       return 0;
3963     case HLEPrefixLock:
3964       if (i.prefix[LOCK_PREFIX])
3965         return 1;
3966       as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
3967       return 0;
3968     case HLEPrefixAny:
3969       return 1;
3970     case HLEPrefixRelease:
3971       if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
3972         {
3973           as_bad (_("instruction `%s' after `xacquire' not allowed"),
3974                   i.tm.name);
3975           return 0;
3976         }
3977       if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
3978         {
3979           as_bad (_("memory destination needed for instruction `%s'"
3980                     " after `xrelease'"), i.tm.name);
3981           return 0;
3982         }
3983       return 1;
3984     }
3985 }
3986
3987 /* Try the shortest encoding by shortening operand size.  */
3988
3989 static void
3990 optimize_encoding (void)
3991 {
3992   unsigned int j;
3993
3994   if (optimize_for_space
3995       && !is_any_vex_encoding (&i.tm)
3996       && i.reg_operands == 1
3997       && i.imm_operands == 1
3998       && !i.types[1].bitfield.byte
3999       && i.op[0].imms->X_op == O_constant
4000       && fits_in_imm7 (i.op[0].imms->X_add_number)
4001       && (i.tm.base_opcode == 0xa8
4002           || (i.tm.base_opcode == 0xf6
4003               && i.tm.extension_opcode == 0x0)))
4004     {
4005       /* Optimize: -Os:
4006            test $imm7, %r64/%r32/%r16  -> test $imm7, %r8
4007        */
4008       unsigned int base_regnum = i.op[1].regs->reg_num;
4009       if (flag_code == CODE_64BIT || base_regnum < 4)
4010         {
4011           i.types[1].bitfield.byte = 1;
4012           /* Ignore the suffix.  */
4013           i.suffix = 0;
4014           /* Convert to byte registers.  */
4015           if (i.types[1].bitfield.word)
4016             j = 16;
4017           else if (i.types[1].bitfield.dword)
4018             j = 32;
4019           else
4020             j = 48;
4021           if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4022             j += 8;
4023           i.op[1].regs -= j;
4024         }
4025     }
4026   else if (flag_code == CODE_64BIT
4027            && !is_any_vex_encoding (&i.tm)
4028            && ((i.types[1].bitfield.qword
4029                 && i.reg_operands == 1
4030                 && i.imm_operands == 1
4031                 && i.op[0].imms->X_op == O_constant
4032                 && ((i.tm.base_opcode == 0xb8
4033                      && i.tm.extension_opcode == None
4034                      && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4035                     || (fits_in_imm31 (i.op[0].imms->X_add_number)
4036                         && ((i.tm.base_opcode == 0x24
4037                              || i.tm.base_opcode == 0xa8)
4038                             || (i.tm.base_opcode == 0x80
4039                                 && i.tm.extension_opcode == 0x4)
4040                             || ((i.tm.base_opcode == 0xf6
4041                                  || (i.tm.base_opcode | 1) == 0xc7)
4042                                 && i.tm.extension_opcode == 0x0)))
4043                     || (fits_in_imm7 (i.op[0].imms->X_add_number)
4044                         && i.tm.base_opcode == 0x83
4045                         && i.tm.extension_opcode == 0x4)))
4046                || (i.types[0].bitfield.qword
4047                    && ((i.reg_operands == 2
4048                         && i.op[0].regs == i.op[1].regs
4049                         && (i.tm.base_opcode == 0x30
4050                             || i.tm.base_opcode == 0x28))
4051                        || (i.reg_operands == 1
4052                            && i.operands == 1
4053                            && i.tm.base_opcode == 0x30)))))
4054     {
4055       /* Optimize: -O:
4056            andq $imm31, %r64   -> andl $imm31, %r32
4057            andq $imm7, %r64    -> andl $imm7, %r32
4058            testq $imm31, %r64  -> testl $imm31, %r32
4059            xorq %r64, %r64     -> xorl %r32, %r32
4060            subq %r64, %r64     -> subl %r32, %r32
4061            movq $imm31, %r64   -> movl $imm31, %r32
4062            movq $imm32, %r64   -> movl $imm32, %r32
4063         */
4064       i.tm.opcode_modifier.norex64 = 1;
4065       if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
4066         {
4067           /* Handle
4068                movq $imm31, %r64   -> movl $imm31, %r32
4069                movq $imm32, %r64   -> movl $imm32, %r32
4070            */
4071           i.tm.operand_types[0].bitfield.imm32 = 1;
4072           i.tm.operand_types[0].bitfield.imm32s = 0;
4073           i.tm.operand_types[0].bitfield.imm64 = 0;
4074           i.types[0].bitfield.imm32 = 1;
4075           i.types[0].bitfield.imm32s = 0;
4076           i.types[0].bitfield.imm64 = 0;
4077           i.types[1].bitfield.dword = 1;
4078           i.types[1].bitfield.qword = 0;
4079           if ((i.tm.base_opcode | 1) == 0xc7)
4080             {
4081               /* Handle
4082                    movq $imm31, %r64   -> movl $imm31, %r32
4083                */
4084               i.tm.base_opcode = 0xb8;
4085               i.tm.extension_opcode = None;
4086               i.tm.opcode_modifier.w = 0;
4087               i.tm.opcode_modifier.modrm = 0;
4088             }
4089         }
4090     }
4091   else if (optimize > 1
4092            && !optimize_for_space
4093            && !is_any_vex_encoding (&i.tm)
4094            && i.reg_operands == 2
4095            && i.op[0].regs == i.op[1].regs
4096            && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4097                || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4098            && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4099     {
4100       /* Optimize: -O2:
4101            andb %rN, %rN  -> testb %rN, %rN
4102            andw %rN, %rN  -> testw %rN, %rN
4103            andq %rN, %rN  -> testq %rN, %rN
4104            orb %rN, %rN   -> testb %rN, %rN
4105            orw %rN, %rN   -> testw %rN, %rN
4106            orq %rN, %rN   -> testq %rN, %rN
4107
4108            and outside of 64-bit mode
4109
4110            andl %rN, %rN  -> testl %rN, %rN
4111            orl %rN, %rN   -> testl %rN, %rN
4112        */
4113       i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4114     }
4115   else if (i.reg_operands == 3
4116            && i.op[0].regs == i.op[1].regs
4117            && !i.types[2].bitfield.xmmword
4118            && (i.tm.opcode_modifier.vex
4119                || ((!i.mask || i.mask->zeroing)
4120                    && !i.rounding
4121                    && is_evex_encoding (&i.tm)
4122                    && (i.vec_encoding != vex_encoding_evex
4123                        || cpu_arch_isa_flags.bitfield.cpuavx512vl
4124                        || i.tm.cpu_flags.bitfield.cpuavx512vl
4125                        || (i.tm.operand_types[2].bitfield.zmmword
4126                            && i.types[2].bitfield.ymmword))))
4127            && ((i.tm.base_opcode == 0x55
4128                 || i.tm.base_opcode == 0x6655
4129                 || i.tm.base_opcode == 0x66df
4130                 || i.tm.base_opcode == 0x57
4131                 || i.tm.base_opcode == 0x6657
4132                 || i.tm.base_opcode == 0x66ef
4133                 || i.tm.base_opcode == 0x66f8
4134                 || i.tm.base_opcode == 0x66f9
4135                 || i.tm.base_opcode == 0x66fa
4136                 || i.tm.base_opcode == 0x66fb
4137                 || i.tm.base_opcode == 0x42
4138                 || i.tm.base_opcode == 0x6642
4139                 || i.tm.base_opcode == 0x47
4140                 || i.tm.base_opcode == 0x6647)
4141                && i.tm.extension_opcode == None))
4142     {
4143       /* Optimize: -O1:
4144            VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4145            vpsubq and vpsubw:
4146              EVEX VOP %zmmM, %zmmM, %zmmN
4147                -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4148                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4149              EVEX VOP %ymmM, %ymmM, %ymmN
4150                -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4151                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4152              VEX VOP %ymmM, %ymmM, %ymmN
4153                -> VEX VOP %xmmM, %xmmM, %xmmN
4154            VOP, one of vpandn and vpxor:
4155              VEX VOP %ymmM, %ymmM, %ymmN
4156                -> VEX VOP %xmmM, %xmmM, %xmmN
4157            VOP, one of vpandnd and vpandnq:
4158              EVEX VOP %zmmM, %zmmM, %zmmN
4159                -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4160                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4161              EVEX VOP %ymmM, %ymmM, %ymmN
4162                -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4163                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4164            VOP, one of vpxord and vpxorq:
4165              EVEX VOP %zmmM, %zmmM, %zmmN
4166                -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4167                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4168              EVEX VOP %ymmM, %ymmM, %ymmN
4169                -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4170                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4171            VOP, one of kxord and kxorq:
4172              VEX VOP %kM, %kM, %kN
4173                -> VEX kxorw %kM, %kM, %kN
4174            VOP, one of kandnd and kandnq:
4175              VEX VOP %kM, %kM, %kN
4176                -> VEX kandnw %kM, %kM, %kN
4177        */
4178       if (is_evex_encoding (&i.tm))
4179         {
4180           if (i.vec_encoding != vex_encoding_evex)
4181             {
4182               i.tm.opcode_modifier.vex = VEX128;
4183               i.tm.opcode_modifier.vexw = VEXW0;
4184               i.tm.opcode_modifier.evex = 0;
4185             }
4186           else if (optimize > 1)
4187             i.tm.opcode_modifier.evex = EVEX128;
4188           else
4189             return;
4190         }
4191       else if (i.tm.operand_types[0].bitfield.class == RegMask)
4192         {
4193           i.tm.base_opcode &= 0xff;
4194           i.tm.opcode_modifier.vexw = VEXW0;
4195         }
4196       else
4197         i.tm.opcode_modifier.vex = VEX128;
4198
4199       if (i.tm.opcode_modifier.vex)
4200         for (j = 0; j < 3; j++)
4201           {
4202             i.types[j].bitfield.xmmword = 1;
4203             i.types[j].bitfield.ymmword = 0;
4204           }
4205     }
4206   else if (i.vec_encoding != vex_encoding_evex
4207            && !i.types[0].bitfield.zmmword
4208            && !i.types[1].bitfield.zmmword
4209            && !i.mask
4210            && !i.broadcast
4211            && is_evex_encoding (&i.tm)
4212            && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4213                || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
4214                || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f
4215                || (i.tm.base_opcode & ~4) == 0x66db
4216                || (i.tm.base_opcode & ~4) == 0x66eb)
4217            && i.tm.extension_opcode == None)
4218     {
4219       /* Optimize: -O1:
4220            VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4221            vmovdqu32 and vmovdqu64:
4222              EVEX VOP %xmmM, %xmmN
4223                -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4224              EVEX VOP %ymmM, %ymmN
4225                -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4226              EVEX VOP %xmmM, mem
4227                -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4228              EVEX VOP %ymmM, mem
4229                -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4230              EVEX VOP mem, %xmmN
4231                -> VEX mvmovdqa|vmovdquem, %xmmN (N < 16)
4232              EVEX VOP mem, %ymmN
4233                -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4234            VOP, one of vpand, vpandn, vpor, vpxor:
4235              EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4236                -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4237              EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4238                -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4239              EVEX VOP{d,q} mem, %xmmM, %xmmN
4240                -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4241              EVEX VOP{d,q} mem, %ymmM, %ymmN
4242                -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4243        */
4244       for (j = 0; j < i.operands; j++)
4245         if (operand_type_check (i.types[j], disp)
4246             && i.op[j].disps->X_op == O_constant)
4247           {
4248             /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4249                has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4250                bytes, we choose EVEX Disp8 over VEX Disp32.  */
4251             int evex_disp8, vex_disp8;
4252             unsigned int memshift = i.memshift;
4253             offsetT n = i.op[j].disps->X_add_number;
4254
4255             evex_disp8 = fits_in_disp8 (n);
4256             i.memshift = 0;
4257             vex_disp8 = fits_in_disp8 (n);
4258             if (evex_disp8 != vex_disp8)
4259               {
4260                 i.memshift = memshift;
4261                 return;
4262               }
4263
4264             i.types[j].bitfield.disp8 = vex_disp8;
4265             break;
4266           }
4267       if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4268         i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
4269       i.tm.opcode_modifier.vex
4270         = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4271       i.tm.opcode_modifier.vexw = VEXW0;
4272       /* VPAND, VPOR, and VPXOR are commutative.  */
4273       if (i.reg_operands == 3 && i.tm.base_opcode != 0x66df)
4274         i.tm.opcode_modifier.commutative = 1;
4275       i.tm.opcode_modifier.evex = 0;
4276       i.tm.opcode_modifier.masking = 0;
4277       i.tm.opcode_modifier.broadcast = 0;
4278       i.tm.opcode_modifier.disp8memshift = 0;
4279       i.memshift = 0;
4280       if (j < i.operands)
4281         i.types[j].bitfield.disp8
4282           = fits_in_disp8 (i.op[j].disps->X_add_number);
4283     }
4284 }
4285
4286 /* This is the guts of the machine-dependent assembler.  LINE points to a
4287    machine dependent instruction.  This function is supposed to emit
4288    the frags/bytes it assembles to.  */
4289
4290 void
4291 md_assemble (char *line)
4292 {
4293   unsigned int j;
4294   char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4295   const insn_template *t;
4296
4297   /* Initialize globals.  */
4298   memset (&i, '\0', sizeof (i));
4299   for (j = 0; j < MAX_OPERANDS; j++)
4300     i.reloc[j] = NO_RELOC;
4301   memset (disp_expressions, '\0', sizeof (disp_expressions));
4302   memset (im_expressions, '\0', sizeof (im_expressions));
4303   save_stack_p = save_stack;
4304
4305   /* First parse an instruction mnemonic & call i386_operand for the operands.
4306      We assume that the scrubber has arranged it so that line[0] is the valid
4307      start of a (possibly prefixed) mnemonic.  */
4308
4309   line = parse_insn (line, mnemonic);
4310   if (line == NULL)
4311     return;
4312   mnem_suffix = i.suffix;
4313
4314   line = parse_operands (line, mnemonic);
4315   this_operand = -1;
4316   xfree (i.memop1_string);
4317   i.memop1_string = NULL;
4318   if (line == NULL)
4319     return;
4320
4321   /* Now we've parsed the mnemonic into a set of templates, and have the
4322      operands at hand.  */
4323
4324   /* All intel opcodes have reversed operands except for "bound" and
4325      "enter".  We also don't reverse intersegment "jmp" and "call"
4326      instructions with 2 immediate operands so that the immediate segment
4327      precedes the offset, as it does when in AT&T mode. */
4328   if (intel_syntax
4329       && i.operands > 1
4330       && (strcmp (mnemonic, "bound") != 0)
4331       && (strcmp (mnemonic, "invlpga") != 0)
4332       && !(operand_type_check (i.types[0], imm)
4333            && operand_type_check (i.types[1], imm)))
4334     swap_operands ();
4335
4336   /* The order of the immediates should be reversed
4337      for 2 immediates extrq and insertq instructions */
4338   if (i.imm_operands == 2
4339       && (strcmp (mnemonic, "extrq") == 0
4340           || strcmp (mnemonic, "insertq") == 0))
4341       swap_2_operands (0, 1);
4342
4343   if (i.imm_operands)
4344     optimize_imm ();
4345
4346   /* Don't optimize displacement for movabs since it only takes 64bit
4347      displacement.  */
4348   if (i.disp_operands
4349       && i.disp_encoding != disp_encoding_32bit
4350       && (flag_code != CODE_64BIT
4351           || strcmp (mnemonic, "movabs") != 0))
4352     optimize_disp ();
4353
4354   /* Next, we find a template that matches the given insn,
4355      making sure the overlap of the given operands types is consistent
4356      with the template operand types.  */
4357
4358   if (!(t = match_template (mnem_suffix)))
4359     return;
4360
4361   if (sse_check != check_none
4362       && !i.tm.opcode_modifier.noavx
4363       && !i.tm.cpu_flags.bitfield.cpuavx
4364       && !i.tm.cpu_flags.bitfield.cpuavx512f
4365       && (i.tm.cpu_flags.bitfield.cpusse
4366           || i.tm.cpu_flags.bitfield.cpusse2
4367           || i.tm.cpu_flags.bitfield.cpusse3
4368           || i.tm.cpu_flags.bitfield.cpussse3
4369           || i.tm.cpu_flags.bitfield.cpusse4_1
4370           || i.tm.cpu_flags.bitfield.cpusse4_2
4371           || i.tm.cpu_flags.bitfield.cpusse4a
4372           || i.tm.cpu_flags.bitfield.cpupclmul
4373           || i.tm.cpu_flags.bitfield.cpuaes
4374           || i.tm.cpu_flags.bitfield.cpusha
4375           || i.tm.cpu_flags.bitfield.cpugfni))
4376     {
4377       (sse_check == check_warning
4378        ? as_warn
4379        : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4380     }
4381
4382   /* Zap movzx and movsx suffix.  The suffix has been set from
4383      "word ptr" or "byte ptr" on the source operand in Intel syntax
4384      or extracted from mnemonic in AT&T syntax.  But we'll use
4385      the destination register to choose the suffix for encoding.  */
4386   if ((i.tm.base_opcode & ~9) == 0x0fb6)
4387     {
4388       /* In Intel syntax, there must be a suffix.  In AT&T syntax, if
4389          there is no suffix, the default will be byte extension.  */
4390       if (i.reg_operands != 2
4391           && !i.suffix
4392           && intel_syntax)
4393         as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
4394
4395       i.suffix = 0;
4396     }
4397
4398   if (i.tm.opcode_modifier.fwait)
4399     if (!add_prefix (FWAIT_OPCODE))
4400       return;
4401
4402   /* Check if REP prefix is OK.  */
4403   if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
4404     {
4405       as_bad (_("invalid instruction `%s' after `%s'"),
4406                 i.tm.name, i.rep_prefix);
4407       return;
4408     }
4409
4410   /* Check for lock without a lockable instruction.  Destination operand
4411      must be memory unless it is xchg (0x86).  */
4412   if (i.prefix[LOCK_PREFIX]
4413       && (!i.tm.opcode_modifier.islockable
4414           || i.mem_operands == 0
4415           || (i.tm.base_opcode != 0x86
4416               && !(i.flags[i.operands - 1] & Operand_Mem))))
4417     {
4418       as_bad (_("expecting lockable instruction after `lock'"));
4419       return;
4420     }
4421
4422   /* Check for data size prefix on VEX/XOP/EVEX encoded insns.  */
4423   if (i.prefix[DATA_PREFIX] && is_any_vex_encoding (&i.tm))
4424     {
4425       as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4426       return;
4427     }
4428
4429   /* Check if HLE prefix is OK.  */
4430   if (i.hle_prefix && !check_hle ())
4431     return;
4432
4433   /* Check BND prefix.  */
4434   if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4435     as_bad (_("expecting valid branch instruction after `bnd'"));
4436
4437   /* Check NOTRACK prefix.  */
4438   if (i.notrack_prefix && !i.tm.opcode_modifier.notrackprefixok)
4439     as_bad (_("expecting indirect branch instruction after `notrack'"));
4440
4441   if (i.tm.cpu_flags.bitfield.cpumpx)
4442     {
4443       if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4444         as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4445       else if (flag_code != CODE_16BIT
4446                ? i.prefix[ADDR_PREFIX]
4447                : i.mem_operands && !i.prefix[ADDR_PREFIX])
4448         as_bad (_("16-bit address isn't allowed in MPX instructions"));
4449     }
4450
4451   /* Insert BND prefix.  */
4452   if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4453     {
4454       if (!i.prefix[BND_PREFIX])
4455         add_prefix (BND_PREFIX_OPCODE);
4456       else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4457         {
4458           as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4459           i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4460         }
4461     }
4462
4463   /* Check string instruction segment overrides.  */
4464   if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
4465     {
4466       gas_assert (i.mem_operands);
4467       if (!check_string ())
4468         return;
4469       i.disp_operands = 0;
4470     }
4471
4472   if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4473     optimize_encoding ();
4474
4475   if (!process_suffix ())
4476     return;
4477
4478   /* Update operand types.  */
4479   for (j = 0; j < i.operands; j++)
4480     i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4481
4482   /* Make still unresolved immediate matches conform to size of immediate
4483      given in i.suffix.  */
4484   if (!finalize_imm ())
4485     return;
4486
4487   if (i.types[0].bitfield.imm1)
4488     i.imm_operands = 0; /* kludge for shift insns.  */
4489
4490   /* We only need to check those implicit registers for instructions
4491      with 3 operands or less.  */
4492   if (i.operands <= 3)
4493     for (j = 0; j < i.operands; j++)
4494       if (i.types[j].bitfield.instance != InstanceNone
4495           && !i.types[j].bitfield.xmmword)
4496         i.reg_operands--;
4497
4498   /* ImmExt should be processed after SSE2AVX.  */
4499   if (!i.tm.opcode_modifier.sse2avx
4500       && i.tm.opcode_modifier.immext)
4501     process_immext ();
4502
4503   /* For insns with operands there are more diddles to do to the opcode.  */
4504   if (i.operands)
4505     {
4506       if (!process_operands ())
4507         return;
4508     }
4509   else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4510     {
4511       /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc.  */
4512       as_warn (_("translating to `%sp'"), i.tm.name);
4513     }
4514
4515   if (is_any_vex_encoding (&i.tm))
4516     {
4517       if (!cpu_arch_flags.bitfield.cpui286)
4518         {
4519           as_bad (_("instruction `%s' isn't supported outside of protected mode."),
4520                   i.tm.name);
4521           return;
4522         }
4523
4524       if (i.tm.opcode_modifier.vex)
4525         build_vex_prefix (t);
4526       else
4527         build_evex_prefix ();
4528     }
4529
4530   /* Handle conversion of 'int $3' --> special int3 insn.  XOP or FMA4
4531      instructions may define INT_OPCODE as well, so avoid this corner
4532      case for those instructions that use MODRM.  */
4533   if (i.tm.base_opcode == INT_OPCODE
4534       && !i.tm.opcode_modifier.modrm
4535       && i.op[0].imms->X_add_number == 3)
4536     {
4537       i.tm.base_opcode = INT3_OPCODE;
4538       i.imm_operands = 0;
4539     }
4540
4541   if ((i.tm.opcode_modifier.jump == JUMP
4542        || i.tm.opcode_modifier.jump == JUMP_BYTE
4543        || i.tm.opcode_modifier.jump == JUMP_DWORD)
4544       && i.op[0].disps->X_op == O_constant)
4545     {
4546       /* Convert "jmp constant" (and "call constant") to a jump (call) to
4547          the absolute address given by the constant.  Since ix86 jumps and
4548          calls are pc relative, we need to generate a reloc.  */
4549       i.op[0].disps->X_add_symbol = &abs_symbol;
4550       i.op[0].disps->X_op = O_symbol;
4551     }
4552
4553   if (i.tm.opcode_modifier.rex64)
4554     i.rex |= REX_W;
4555
4556   /* For 8 bit registers we need an empty rex prefix.  Also if the
4557      instruction already has a prefix, we need to convert old
4558      registers to new ones.  */
4559
4560   if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
4561        && (i.op[0].regs->reg_flags & RegRex64) != 0)
4562       || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
4563           && (i.op[1].regs->reg_flags & RegRex64) != 0)
4564       || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
4565            || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
4566           && i.rex != 0))
4567     {
4568       int x;
4569
4570       i.rex |= REX_OPCODE;
4571       for (x = 0; x < 2; x++)
4572         {
4573           /* Look for 8 bit operand that uses old registers.  */
4574           if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
4575               && (i.op[x].regs->reg_flags & RegRex64) == 0)
4576             {
4577               gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4578               /* In case it is "hi" register, give up.  */
4579               if (i.op[x].regs->reg_num > 3)
4580                 as_bad (_("can't encode register '%s%s' in an "
4581                           "instruction requiring REX prefix."),
4582                         register_prefix, i.op[x].regs->reg_name);
4583
4584               /* Otherwise it is equivalent to the extended register.
4585                  Since the encoding doesn't change this is merely
4586                  cosmetic cleanup for debug output.  */
4587
4588               i.op[x].regs = i.op[x].regs + 8;
4589             }
4590         }
4591     }
4592
4593   if (i.rex == 0 && i.rex_encoding)
4594     {
4595       /* Check if we can add a REX_OPCODE byte.  Look for 8 bit operand
4596          that uses legacy register.  If it is "hi" register, don't add
4597          the REX_OPCODE byte.  */
4598       int x;
4599       for (x = 0; x < 2; x++)
4600         if (i.types[x].bitfield.class == Reg
4601             && i.types[x].bitfield.byte
4602             && (i.op[x].regs->reg_flags & RegRex64) == 0
4603             && i.op[x].regs->reg_num > 3)
4604           {
4605             gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4606             i.rex_encoding = FALSE;
4607             break;
4608           }
4609
4610       if (i.rex_encoding)
4611         i.rex = REX_OPCODE;
4612     }
4613
4614   if (i.rex != 0)
4615     add_prefix (REX_OPCODE | i.rex);
4616
4617   /* We are ready to output the insn.  */
4618   output_insn ();
4619
4620   last_insn.seg = now_seg;
4621
4622   if (i.tm.opcode_modifier.isprefix)
4623     {
4624       last_insn.kind = last_insn_prefix;
4625       last_insn.name = i.tm.name;
4626       last_insn.file = as_where (&last_insn.line);
4627     }
4628   else
4629     last_insn.kind = last_insn_other;
4630 }
4631
4632 static char *
4633 parse_insn (char *line, char *mnemonic)
4634 {
4635   char *l = line;
4636   char *token_start = l;
4637   char *mnem_p;
4638   int supported;
4639   const insn_template *t;
4640   char *dot_p = NULL;
4641
4642   while (1)
4643     {
4644       mnem_p = mnemonic;
4645       while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
4646         {
4647           if (*mnem_p == '.')
4648             dot_p = mnem_p;
4649           mnem_p++;
4650           if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
4651             {
4652               as_bad (_("no such instruction: `%s'"), token_start);
4653               return NULL;
4654             }
4655           l++;
4656         }
4657       if (!is_space_char (*l)
4658           && *l != END_OF_INSN
4659           && (intel_syntax
4660               || (*l != PREFIX_SEPARATOR
4661                   && *l != ',')))
4662         {
4663           as_bad (_("invalid character %s in mnemonic"),
4664                   output_invalid (*l));
4665           return NULL;
4666         }
4667       if (token_start == l)
4668         {
4669           if (!intel_syntax && *l == PREFIX_SEPARATOR)
4670             as_bad (_("expecting prefix; got nothing"));
4671           else
4672             as_bad (_("expecting mnemonic; got nothing"));
4673           return NULL;
4674         }
4675
4676       /* Look up instruction (or prefix) via hash table.  */
4677       current_templates = (const templates *) hash_find (op_hash, mnemonic);
4678
4679       if (*l != END_OF_INSN
4680           && (!is_space_char (*l) || l[1] != END_OF_INSN)
4681           && current_templates
4682           && current_templates->start->opcode_modifier.isprefix)
4683         {
4684           if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
4685             {
4686               as_bad ((flag_code != CODE_64BIT
4687                        ? _("`%s' is only supported in 64-bit mode")
4688                        : _("`%s' is not supported in 64-bit mode")),
4689                       current_templates->start->name);
4690               return NULL;
4691             }
4692           /* If we are in 16-bit mode, do not allow addr16 or data16.
4693              Similarly, in 32-bit mode, do not allow addr32 or data32.  */
4694           if ((current_templates->start->opcode_modifier.size == SIZE16
4695                || current_templates->start->opcode_modifier.size == SIZE32)
4696               && flag_code != CODE_64BIT
4697               && ((current_templates->start->opcode_modifier.size == SIZE32)
4698                   ^ (flag_code == CODE_16BIT)))
4699             {
4700               as_bad (_("redundant %s prefix"),
4701                       current_templates->start->name);
4702               return NULL;
4703             }
4704           if (current_templates->start->opcode_length == 0)
4705             {
4706               /* Handle pseudo prefixes.  */
4707               switch (current_templates->start->base_opcode)
4708                 {
4709                 case 0x0:
4710                   /* {disp8} */
4711                   i.disp_encoding = disp_encoding_8bit;
4712                   break;
4713                 case 0x1:
4714                   /* {disp32} */
4715                   i.disp_encoding = disp_encoding_32bit;
4716                   break;
4717                 case 0x2:
4718                   /* {load} */
4719                   i.dir_encoding = dir_encoding_load;
4720                   break;
4721                 case 0x3:
4722                   /* {store} */
4723                   i.dir_encoding = dir_encoding_store;
4724                   break;
4725                 case 0x4:
4726                   /* {vex} */
4727                   i.vec_encoding = vex_encoding_vex;
4728                   break;
4729                 case 0x5:
4730                   /* {vex3} */
4731                   i.vec_encoding = vex_encoding_vex3;
4732                   break;
4733                 case 0x6:
4734                   /* {evex} */
4735                   i.vec_encoding = vex_encoding_evex;
4736                   break;
4737                 case 0x7:
4738                   /* {rex} */
4739                   i.rex_encoding = TRUE;
4740                   break;
4741                 case 0x8:
4742                   /* {nooptimize} */
4743                   i.no_optimize = TRUE;
4744                   break;
4745                 default:
4746                   abort ();
4747                 }
4748             }
4749           else
4750             {
4751               /* Add prefix, checking for repeated prefixes.  */
4752               switch (add_prefix (current_templates->start->base_opcode))
4753                 {
4754                 case PREFIX_EXIST:
4755                   return NULL;
4756                 case PREFIX_DS:
4757                   if (current_templates->start->cpu_flags.bitfield.cpuibt)
4758                     i.notrack_prefix = current_templates->start->name;
4759                   break;
4760                 case PREFIX_REP:
4761                   if (current_templates->start->cpu_flags.bitfield.cpuhle)
4762                     i.hle_prefix = current_templates->start->name;
4763                   else if (current_templates->start->cpu_flags.bitfield.cpumpx)
4764                     i.bnd_prefix = current_templates->start->name;
4765                   else
4766                     i.rep_prefix = current_templates->start->name;
4767                   break;
4768                 default:
4769                   break;
4770                 }
4771             }
4772           /* Skip past PREFIX_SEPARATOR and reset token_start.  */
4773           token_start = ++l;
4774         }
4775       else
4776         break;
4777     }
4778
4779   if (!current_templates)
4780     {
4781       /* Deprecated functionality (new code should use pseudo-prefixes instead):
4782          Check if we should swap operand or force 32bit displacement in
4783          encoding.  */
4784       if (mnem_p - 2 == dot_p && dot_p[1] == 's')
4785         i.dir_encoding = dir_encoding_swap;
4786       else if (mnem_p - 3 == dot_p
4787                && dot_p[1] == 'd'
4788                && dot_p[2] == '8')
4789         i.disp_encoding = disp_encoding_8bit;
4790       else if (mnem_p - 4 == dot_p
4791                && dot_p[1] == 'd'
4792                && dot_p[2] == '3'
4793                && dot_p[3] == '2')
4794         i.disp_encoding = disp_encoding_32bit;
4795       else
4796         goto check_suffix;
4797       mnem_p = dot_p;
4798       *dot_p = '\0';
4799       current_templates = (const templates *) hash_find (op_hash, mnemonic);
4800     }
4801
4802   if (!current_templates)
4803     {
4804 check_suffix:
4805       if (mnem_p > mnemonic)
4806         {
4807           /* See if we can get a match by trimming off a suffix.  */
4808           switch (mnem_p[-1])
4809             {
4810             case WORD_MNEM_SUFFIX:
4811               if (intel_syntax && (intel_float_operand (mnemonic) & 2))
4812                 i.suffix = SHORT_MNEM_SUFFIX;
4813               else
4814                 /* Fall through.  */
4815               case BYTE_MNEM_SUFFIX:
4816               case QWORD_MNEM_SUFFIX:
4817                 i.suffix = mnem_p[-1];
4818               mnem_p[-1] = '\0';
4819               current_templates = (const templates *) hash_find (op_hash,
4820                                                                  mnemonic);
4821               break;
4822             case SHORT_MNEM_SUFFIX:
4823             case LONG_MNEM_SUFFIX:
4824               if (!intel_syntax)
4825                 {
4826                   i.suffix = mnem_p[-1];
4827                   mnem_p[-1] = '\0';
4828                   current_templates = (const templates *) hash_find (op_hash,
4829                                                                      mnemonic);
4830                 }
4831               break;
4832
4833               /* Intel Syntax.  */
4834             case 'd':
4835               if (intel_syntax)
4836                 {
4837                   if (intel_float_operand (mnemonic) == 1)
4838                     i.suffix = SHORT_MNEM_SUFFIX;
4839                   else
4840                     i.suffix = LONG_MNEM_SUFFIX;
4841                   mnem_p[-1] = '\0';
4842                   current_templates = (const templates *) hash_find (op_hash,
4843                                                                      mnemonic);
4844                 }
4845               break;
4846             }
4847         }
4848
4849       if (!current_templates)
4850         {
4851           as_bad (_("no such instruction: `%s'"), token_start);
4852           return NULL;
4853         }
4854     }
4855
4856   if (current_templates->start->opcode_modifier.jump == JUMP
4857       || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
4858     {
4859       /* Check for a branch hint.  We allow ",pt" and ",pn" for
4860          predict taken and predict not taken respectively.
4861          I'm not sure that branch hints actually do anything on loop
4862          and jcxz insns (JumpByte) for current Pentium4 chips.  They
4863          may work in the future and it doesn't hurt to accept them
4864          now.  */
4865       if (l[0] == ',' && l[1] == 'p')
4866         {
4867           if (l[2] == 't')
4868             {
4869               if (!add_prefix (DS_PREFIX_OPCODE))
4870                 return NULL;
4871               l += 3;
4872             }
4873           else if (l[2] == 'n')
4874             {
4875               if (!add_prefix (CS_PREFIX_OPCODE))
4876                 return NULL;
4877               l += 3;
4878             }
4879         }
4880     }
4881   /* Any other comma loses.  */
4882   if (*l == ',')
4883     {
4884       as_bad (_("invalid character %s in mnemonic"),
4885               output_invalid (*l));
4886       return NULL;
4887     }
4888
4889   /* Check if instruction is supported on specified architecture.  */
4890   supported = 0;
4891   for (t = current_templates->start; t < current_templates->end; ++t)
4892     {
4893       supported |= cpu_flags_match (t);
4894       if (supported == CPU_FLAGS_PERFECT_MATCH)
4895         {
4896           if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
4897             as_warn (_("use .code16 to ensure correct addressing mode"));
4898
4899           return l;
4900         }
4901     }
4902
4903   if (!(supported & CPU_FLAGS_64BIT_MATCH))
4904     as_bad (flag_code == CODE_64BIT
4905             ? _("`%s' is not supported in 64-bit mode")
4906             : _("`%s' is only supported in 64-bit mode"),
4907             current_templates->start->name);
4908   else
4909     as_bad (_("`%s' is not supported on `%s%s'"),
4910             current_templates->start->name,
4911             cpu_arch_name ? cpu_arch_name : default_arch,
4912             cpu_sub_arch_name ? cpu_sub_arch_name : "");
4913
4914   return NULL;
4915 }
4916
4917 static char *
4918 parse_operands (char *l, const char *mnemonic)
4919 {
4920   char *token_start;
4921
4922   /* 1 if operand is pending after ','.  */
4923   unsigned int expecting_operand = 0;
4924
4925   /* Non-zero if operand parens not balanced.  */
4926   unsigned int paren_not_balanced;
4927
4928   while (*l != END_OF_INSN)
4929     {
4930       /* Skip optional white space before operand.  */
4931       if (is_space_char (*l))
4932         ++l;
4933       if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
4934         {
4935           as_bad (_("invalid character %s before operand %d"),
4936                   output_invalid (*l),
4937                   i.operands + 1);
4938           return NULL;
4939         }
4940       token_start = l;  /* After white space.  */
4941       paren_not_balanced = 0;
4942       while (paren_not_balanced || *l != ',')
4943         {
4944           if (*l == END_OF_INSN)
4945             {
4946               if (paren_not_balanced)
4947                 {
4948                   if (!intel_syntax)
4949                     as_bad (_("unbalanced parenthesis in operand %d."),
4950                             i.operands + 1);
4951                   else
4952                     as_bad (_("unbalanced brackets in operand %d."),
4953                             i.operands + 1);
4954                   return NULL;
4955                 }
4956               else
4957                 break;  /* we are done */
4958             }
4959           else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
4960             {
4961               as_bad (_("invalid character %s in operand %d"),
4962                       output_invalid (*l),
4963                       i.operands + 1);
4964               return NULL;
4965             }
4966           if (!intel_syntax)
4967             {
4968               if (*l == '(')
4969                 ++paren_not_balanced;
4970               if (*l == ')')
4971                 --paren_not_balanced;
4972             }
4973           else
4974             {
4975               if (*l == '[')
4976                 ++paren_not_balanced;
4977               if (*l == ']')
4978                 --paren_not_balanced;
4979             }
4980           l++;
4981         }
4982       if (l != token_start)
4983         {                       /* Yes, we've read in another operand.  */
4984           unsigned int operand_ok;
4985           this_operand = i.operands++;
4986           if (i.operands > MAX_OPERANDS)
4987             {
4988               as_bad (_("spurious operands; (%d operands/instruction max)"),
4989                       MAX_OPERANDS);
4990               return NULL;
4991             }
4992           i.types[this_operand].bitfield.unspecified = 1;
4993           /* Now parse operand adding info to 'i' as we go along.  */
4994           END_STRING_AND_SAVE (l);
4995
4996           if (i.mem_operands > 1)
4997             {
4998               as_bad (_("too many memory references for `%s'"),
4999                       mnemonic);
5000               return 0;
5001             }
5002
5003           if (intel_syntax)
5004             operand_ok =
5005               i386_intel_operand (token_start,
5006                                   intel_float_operand (mnemonic));
5007           else
5008             operand_ok = i386_att_operand (token_start);
5009
5010           RESTORE_END_STRING (l);
5011           if (!operand_ok)
5012             return NULL;
5013         }
5014       else
5015         {
5016           if (expecting_operand)
5017             {
5018             expecting_operand_after_comma:
5019               as_bad (_("expecting operand after ','; got nothing"));
5020               return NULL;
5021             }
5022           if (*l == ',')
5023             {
5024               as_bad (_("expecting operand before ','; got nothing"));
5025               return NULL;
5026             }
5027         }
5028
5029       /* Now *l must be either ',' or END_OF_INSN.  */
5030       if (*l == ',')
5031         {
5032           if (*++l == END_OF_INSN)
5033             {
5034               /* Just skip it, if it's \n complain.  */
5035               goto expecting_operand_after_comma;
5036             }
5037           expecting_operand = 1;
5038         }
5039     }
5040   return l;
5041 }
5042
5043 static void
5044 swap_2_operands (int xchg1, int xchg2)
5045 {
5046   union i386_op temp_op;
5047   i386_operand_type temp_type;
5048   unsigned int temp_flags;
5049   enum bfd_reloc_code_real temp_reloc;
5050
5051   temp_type = i.types[xchg2];
5052   i.types[xchg2] = i.types[xchg1];
5053   i.types[xchg1] = temp_type;
5054
5055   temp_flags = i.flags[xchg2];
5056   i.flags[xchg2] = i.flags[xchg1];
5057   i.flags[xchg1] = temp_flags;
5058
5059   temp_op = i.op[xchg2];
5060   i.op[xchg2] = i.op[xchg1];
5061   i.op[xchg1] = temp_op;
5062
5063   temp_reloc = i.reloc[xchg2];
5064   i.reloc[xchg2] = i.reloc[xchg1];
5065   i.reloc[xchg1] = temp_reloc;
5066
5067   if (i.mask)
5068     {
5069       if (i.mask->operand == xchg1)
5070         i.mask->operand = xchg2;
5071       else if (i.mask->operand == xchg2)
5072         i.mask->operand = xchg1;
5073     }
5074   if (i.broadcast)
5075     {
5076       if (i.broadcast->operand == xchg1)
5077         i.broadcast->operand = xchg2;
5078       else if (i.broadcast->operand == xchg2)
5079         i.broadcast->operand = xchg1;
5080     }
5081   if (i.rounding)
5082     {
5083       if (i.rounding->operand == xchg1)
5084         i.rounding->operand = xchg2;
5085       else if (i.rounding->operand == xchg2)
5086         i.rounding->operand = xchg1;
5087     }
5088 }
5089
5090 static void
5091 swap_operands (void)
5092 {
5093   switch (i.operands)
5094     {
5095     case 5:
5096     case 4:
5097       swap_2_operands (1, i.operands - 2);
5098       /* Fall through.  */
5099     case 3:
5100     case 2:
5101       swap_2_operands (0, i.operands - 1);
5102       break;
5103     default:
5104       abort ();
5105     }
5106
5107   if (i.mem_operands == 2)
5108     {
5109       const seg_entry *temp_seg;
5110       temp_seg = i.seg[0];
5111       i.seg[0] = i.seg[1];
5112       i.seg[1] = temp_seg;
5113     }
5114 }
5115
5116 /* Try to ensure constant immediates are represented in the smallest
5117    opcode possible.  */
5118 static void
5119 optimize_imm (void)
5120 {
5121   char guess_suffix = 0;
5122   int op;
5123
5124   if (i.suffix)
5125     guess_suffix = i.suffix;
5126   else if (i.reg_operands)
5127     {
5128       /* Figure out a suffix from the last register operand specified.
5129          We can't do this properly yet, i.e. excluding special register
5130          instances, but the following works for instructions with
5131          immediates.  In any case, we can't set i.suffix yet.  */
5132       for (op = i.operands; --op >= 0;)
5133         if (i.types[op].bitfield.class != Reg)
5134           continue;
5135         else if (i.types[op].bitfield.byte)
5136           {
5137             guess_suffix = BYTE_MNEM_SUFFIX;
5138             break;
5139           }
5140         else if (i.types[op].bitfield.word)
5141           {
5142             guess_suffix = WORD_MNEM_SUFFIX;
5143             break;
5144           }
5145         else if (i.types[op].bitfield.dword)
5146           {
5147             guess_suffix = LONG_MNEM_SUFFIX;
5148             break;
5149           }
5150         else if (i.types[op].bitfield.qword)
5151           {
5152             guess_suffix = QWORD_MNEM_SUFFIX;
5153             break;
5154           }
5155     }
5156   else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5157     guess_suffix = WORD_MNEM_SUFFIX;
5158
5159   for (op = i.operands; --op >= 0;)
5160     if (operand_type_check (i.types[op], imm))
5161       {
5162         switch (i.op[op].imms->X_op)
5163           {
5164           case O_constant:
5165             /* If a suffix is given, this operand may be shortened.  */
5166             switch (guess_suffix)
5167               {
5168               case LONG_MNEM_SUFFIX:
5169                 i.types[op].bitfield.imm32 = 1;
5170                 i.types[op].bitfield.imm64 = 1;
5171                 break;
5172               case WORD_MNEM_SUFFIX:
5173                 i.types[op].bitfield.imm16 = 1;
5174                 i.types[op].bitfield.imm32 = 1;
5175                 i.types[op].bitfield.imm32s = 1;
5176                 i.types[op].bitfield.imm64 = 1;
5177                 break;
5178               case BYTE_MNEM_SUFFIX:
5179                 i.types[op].bitfield.imm8 = 1;
5180                 i.types[op].bitfield.imm8s = 1;
5181                 i.types[op].bitfield.imm16 = 1;
5182                 i.types[op].bitfield.imm32 = 1;
5183                 i.types[op].bitfield.imm32s = 1;
5184                 i.types[op].bitfield.imm64 = 1;
5185                 break;
5186               }
5187
5188             /* If this operand is at most 16 bits, convert it
5189                to a signed 16 bit number before trying to see
5190                whether it will fit in an even smaller size.
5191                This allows a 16-bit operand such as $0xffe0 to
5192                be recognised as within Imm8S range.  */
5193             if ((i.types[op].bitfield.imm16)
5194                 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
5195               {
5196                 i.op[op].imms->X_add_number =
5197                   (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5198               }
5199 #ifdef BFD64
5200             /* Store 32-bit immediate in 64-bit for 64-bit BFD.  */
5201             if ((i.types[op].bitfield.imm32)
5202                 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5203                     == 0))
5204               {
5205                 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5206                                                 ^ ((offsetT) 1 << 31))
5207                                                - ((offsetT) 1 << 31));
5208               }
5209 #endif
5210             i.types[op]
5211               = operand_type_or (i.types[op],
5212                                  smallest_imm_type (i.op[op].imms->X_add_number));
5213
5214             /* We must avoid matching of Imm32 templates when 64bit
5215                only immediate is available.  */
5216             if (guess_suffix == QWORD_MNEM_SUFFIX)
5217               i.types[op].bitfield.imm32 = 0;
5218             break;
5219
5220           case O_absent:
5221           case O_register:
5222             abort ();
5223
5224             /* Symbols and expressions.  */
5225           default:
5226             /* Convert symbolic operand to proper sizes for matching, but don't
5227                prevent matching a set of insns that only supports sizes other
5228                than those matching the insn suffix.  */
5229             {
5230               i386_operand_type mask, allowed;
5231               const insn_template *t;
5232
5233               operand_type_set (&mask, 0);
5234               operand_type_set (&allowed, 0);
5235
5236               for (t = current_templates->start;
5237                    t < current_templates->end;
5238                    ++t)
5239                 {
5240                   allowed = operand_type_or (allowed, t->operand_types[op]);
5241                   allowed = operand_type_and (allowed, anyimm);
5242                 }
5243               switch (guess_suffix)
5244                 {
5245                 case QWORD_MNEM_SUFFIX:
5246                   mask.bitfield.imm64 = 1;
5247                   mask.bitfield.imm32s = 1;
5248                   break;
5249                 case LONG_MNEM_SUFFIX:
5250                   mask.bitfield.imm32 = 1;
5251                   break;
5252                 case WORD_MNEM_SUFFIX:
5253                   mask.bitfield.imm16 = 1;
5254                   break;
5255                 case BYTE_MNEM_SUFFIX:
5256                   mask.bitfield.imm8 = 1;
5257                   break;
5258                 default:
5259                   break;
5260                 }
5261               allowed = operand_type_and (mask, allowed);
5262               if (!operand_type_all_zero (&allowed))
5263                 i.types[op] = operand_type_and (i.types[op], mask);
5264             }
5265             break;
5266           }
5267       }
5268 }
5269
5270 /* Try to use the smallest displacement type too.  */
5271 static void
5272 optimize_disp (void)
5273 {
5274   int op;
5275
5276   for (op = i.operands; --op >= 0;)
5277     if (operand_type_check (i.types[op], disp))
5278       {
5279         if (i.op[op].disps->X_op == O_constant)
5280           {
5281             offsetT op_disp = i.op[op].disps->X_add_number;
5282
5283             if (i.types[op].bitfield.disp16
5284                 && (op_disp & ~(offsetT) 0xffff) == 0)
5285               {
5286                 /* If this operand is at most 16 bits, convert
5287                    to a signed 16 bit number and don't use 64bit
5288                    displacement.  */
5289                 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5290                 i.types[op].bitfield.disp64 = 0;
5291               }
5292 #ifdef BFD64
5293             /* Optimize 64-bit displacement to 32-bit for 64-bit BFD.  */
5294             if (i.types[op].bitfield.disp32
5295                 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5296               {
5297                 /* If this operand is at most 32 bits, convert
5298                    to a signed 32 bit number and don't use 64bit
5299                    displacement.  */
5300                 op_disp &= (((offsetT) 2 << 31) - 1);
5301                 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5302                 i.types[op].bitfield.disp64 = 0;
5303               }
5304 #endif
5305             if (!op_disp && i.types[op].bitfield.baseindex)
5306               {
5307                 i.types[op].bitfield.disp8 = 0;
5308                 i.types[op].bitfield.disp16 = 0;
5309                 i.types[op].bitfield.disp32 = 0;
5310                 i.types[op].bitfield.disp32s = 0;
5311                 i.types[op].bitfield.disp64 = 0;
5312                 i.op[op].disps = 0;
5313                 i.disp_operands--;
5314               }
5315             else if (flag_code == CODE_64BIT)
5316               {
5317                 if (fits_in_signed_long (op_disp))
5318                   {
5319                     i.types[op].bitfield.disp64 = 0;
5320                     i.types[op].bitfield.disp32s = 1;
5321                   }
5322                 if (i.prefix[ADDR_PREFIX]
5323                     && fits_in_unsigned_long (op_disp))
5324                   i.types[op].bitfield.disp32 = 1;
5325               }
5326             if ((i.types[op].bitfield.disp32
5327                  || i.types[op].bitfield.disp32s
5328                  || i.types[op].bitfield.disp16)
5329                 && fits_in_disp8 (op_disp))
5330               i.types[op].bitfield.disp8 = 1;
5331           }
5332         else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5333                  || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5334           {
5335             fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5336                          i.op[op].disps, 0, i.reloc[op]);
5337             i.types[op].bitfield.disp8 = 0;
5338             i.types[op].bitfield.disp16 = 0;
5339             i.types[op].bitfield.disp32 = 0;
5340             i.types[op].bitfield.disp32s = 0;
5341             i.types[op].bitfield.disp64 = 0;
5342           }
5343         else
5344           /* We only support 64bit displacement on constants.  */
5345           i.types[op].bitfield.disp64 = 0;
5346       }
5347 }
5348
5349 /* Return 1 if there is a match in broadcast bytes between operand
5350    GIVEN and instruction template T.   */
5351
5352 static INLINE int
5353 match_broadcast_size (const insn_template *t, unsigned int given)
5354 {
5355   return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5356            && i.types[given].bitfield.byte)
5357           || (t->opcode_modifier.broadcast == WORD_BROADCAST
5358               && i.types[given].bitfield.word)
5359           || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5360               && i.types[given].bitfield.dword)
5361           || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5362               && i.types[given].bitfield.qword));
5363 }
5364
5365 /* Check if operands are valid for the instruction.  */
5366
5367 static int
5368 check_VecOperands (const insn_template *t)
5369 {
5370   unsigned int op;
5371   i386_cpu_flags cpu;
5372
5373   /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5374      any one operand are implicity requiring AVX512VL support if the actual
5375      operand size is YMMword or XMMword.  Since this function runs after
5376      template matching, there's no need to check for YMMword/XMMword in
5377      the template.  */
5378   cpu = cpu_flags_and (t->cpu_flags, avx512);
5379   if (!cpu_flags_all_zero (&cpu)
5380       && !t->cpu_flags.bitfield.cpuavx512vl
5381       && !cpu_arch_flags.bitfield.cpuavx512vl)
5382     {
5383       for (op = 0; op < t->operands; ++op)
5384         {
5385           if (t->operand_types[op].bitfield.zmmword
5386               && (i.types[op].bitfield.ymmword
5387                   || i.types[op].bitfield.xmmword))
5388             {
5389               i.error = unsupported;
5390               return 1;
5391             }
5392         }
5393     }
5394
5395   /* Without VSIB byte, we can't have a vector register for index.  */
5396   if (!t->opcode_modifier.vecsib
5397       && i.index_reg
5398       && (i.index_reg->reg_type.bitfield.xmmword
5399           || i.index_reg->reg_type.bitfield.ymmword
5400           || i.index_reg->reg_type.bitfield.zmmword))
5401     {
5402       i.error = unsupported_vector_index_register;
5403       return 1;
5404     }
5405
5406   /* Check if default mask is allowed.  */
5407   if (t->opcode_modifier.nodefmask
5408       && (!i.mask || i.mask->mask->reg_num == 0))
5409     {
5410       i.error = no_default_mask;
5411       return 1;
5412     }
5413
5414   /* For VSIB byte, we need a vector register for index, and all vector
5415      registers must be distinct.  */
5416   if (t->opcode_modifier.vecsib)
5417     {
5418       if (!i.index_reg
5419           || !((t->opcode_modifier.vecsib == VecSIB128
5420                 && i.index_reg->reg_type.bitfield.xmmword)
5421                || (t->opcode_modifier.vecsib == VecSIB256
5422                    && i.index_reg->reg_type.bitfield.ymmword)
5423                || (t->opcode_modifier.vecsib == VecSIB512
5424                    && i.index_reg->reg_type.bitfield.zmmword)))
5425       {
5426         i.error = invalid_vsib_address;
5427         return 1;
5428       }
5429
5430       gas_assert (i.reg_operands == 2 || i.mask);
5431       if (i.reg_operands == 2 && !i.mask)
5432         {
5433           gas_assert (i.types[0].bitfield.class == RegSIMD);
5434           gas_assert (i.types[0].bitfield.xmmword
5435                       || i.types[0].bitfield.ymmword);
5436           gas_assert (i.types[2].bitfield.class == RegSIMD);
5437           gas_assert (i.types[2].bitfield.xmmword
5438                       || i.types[2].bitfield.ymmword);
5439           if (operand_check == check_none)
5440             return 0;
5441           if (register_number (i.op[0].regs)
5442               != register_number (i.index_reg)
5443               && register_number (i.op[2].regs)
5444                  != register_number (i.index_reg)
5445               && register_number (i.op[0].regs)
5446                  != register_number (i.op[2].regs))
5447             return 0;
5448           if (operand_check == check_error)
5449             {
5450               i.error = invalid_vector_register_set;
5451               return 1;
5452             }
5453           as_warn (_("mask, index, and destination registers should be distinct"));
5454         }
5455       else if (i.reg_operands == 1 && i.mask)
5456         {
5457           if (i.types[1].bitfield.class == RegSIMD
5458               && (i.types[1].bitfield.xmmword
5459                   || i.types[1].bitfield.ymmword
5460                   || i.types[1].bitfield.zmmword)
5461               && (register_number (i.op[1].regs)
5462                   == register_number (i.index_reg)))
5463             {
5464               if (operand_check == check_error)
5465                 {
5466                   i.error = invalid_vector_register_set;
5467                   return 1;
5468                 }
5469               if (operand_check != check_none)
5470                 as_warn (_("index and destination registers should be distinct"));
5471             }
5472         }
5473     }
5474
5475   /* Check if broadcast is supported by the instruction and is applied
5476      to the memory operand.  */
5477   if (i.broadcast)
5478     {
5479       i386_operand_type type, overlap;
5480
5481       /* Check if specified broadcast is supported in this instruction,
5482          and its broadcast bytes match the memory operand.  */
5483       op = i.broadcast->operand;
5484       if (!t->opcode_modifier.broadcast
5485           || !(i.flags[op] & Operand_Mem)
5486           || (!i.types[op].bitfield.unspecified
5487               && !match_broadcast_size (t, op)))
5488         {
5489         bad_broadcast:
5490           i.error = unsupported_broadcast;
5491           return 1;
5492         }
5493
5494       i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5495                             * i.broadcast->type);
5496       operand_type_set (&type, 0);
5497       switch (i.broadcast->bytes)
5498         {
5499         case 2:
5500           type.bitfield.word = 1;
5501           break;
5502         case 4:
5503           type.bitfield.dword = 1;
5504           break;
5505         case 8:
5506           type.bitfield.qword = 1;
5507           break;
5508         case 16:
5509           type.bitfield.xmmword = 1;
5510           break;
5511         case 32:
5512           type.bitfield.ymmword = 1;
5513           break;
5514         case 64:
5515           type.bitfield.zmmword = 1;
5516           break;
5517         default:
5518           goto bad_broadcast;
5519         }
5520
5521       overlap = operand_type_and (type, t->operand_types[op]);
5522       if (operand_type_all_zero (&overlap))
5523           goto bad_broadcast;
5524
5525       if (t->opcode_modifier.checkregsize)
5526         {
5527           unsigned int j;
5528
5529           type.bitfield.baseindex = 1;
5530           for (j = 0; j < i.operands; ++j)
5531             {
5532               if (j != op
5533                   && !operand_type_register_match(i.types[j],
5534                                                   t->operand_types[j],
5535                                                   type,
5536                                                   t->operand_types[op]))
5537                 goto bad_broadcast;
5538             }
5539         }
5540     }
5541   /* If broadcast is supported in this instruction, we need to check if
5542      operand of one-element size isn't specified without broadcast.  */
5543   else if (t->opcode_modifier.broadcast && i.mem_operands)
5544     {
5545       /* Find memory operand.  */
5546       for (op = 0; op < i.operands; op++)
5547         if (i.flags[op] & Operand_Mem)
5548           break;
5549       gas_assert (op < i.operands);
5550       /* Check size of the memory operand.  */
5551       if (match_broadcast_size (t, op))
5552         {
5553           i.error = broadcast_needed;
5554           return 1;
5555         }
5556     }
5557   else
5558     op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning.  */
5559
5560   /* Check if requested masking is supported.  */
5561   if (i.mask)
5562     {
5563       switch (t->opcode_modifier.masking)
5564         {
5565         case BOTH_MASKING:
5566           break;
5567         case MERGING_MASKING:
5568           if (i.mask->zeroing)
5569             {
5570         case 0:
5571               i.error = unsupported_masking;
5572               return 1;
5573             }
5574           break;
5575         case DYNAMIC_MASKING:
5576           /* Memory destinations allow only merging masking.  */
5577           if (i.mask->zeroing && i.mem_operands)
5578             {
5579               /* Find memory operand.  */
5580               for (op = 0; op < i.operands; op++)
5581                 if (i.flags[op] & Operand_Mem)
5582                   break;
5583               gas_assert (op < i.operands);
5584               if (op == i.operands - 1)
5585                 {
5586                   i.error = unsupported_masking;
5587                   return 1;
5588                 }
5589             }
5590           break;
5591         default:
5592           abort ();
5593         }
5594     }
5595
5596   /* Check if masking is applied to dest operand.  */
5597   if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
5598     {
5599       i.error = mask_not_on_destination;
5600       return 1;
5601     }
5602
5603   /* Check RC/SAE.  */
5604   if (i.rounding)
5605     {
5606       if (!t->opcode_modifier.sae
5607           || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
5608         {
5609           i.error = unsupported_rc_sae;
5610           return 1;
5611         }
5612       /* If the instruction has several immediate operands and one of
5613          them is rounding, the rounding operand should be the last
5614          immediate operand.  */
5615       if (i.imm_operands > 1
5616           && i.rounding->operand != (int) (i.imm_operands - 1))
5617         {
5618           i.error = rc_sae_operand_not_last_imm;
5619           return 1;
5620         }
5621     }
5622
5623   /* Check vector Disp8 operand.  */
5624   if (t->opcode_modifier.disp8memshift
5625       && i.disp_encoding != disp_encoding_32bit)
5626     {
5627       if (i.broadcast)
5628         i.memshift = t->opcode_modifier.broadcast - 1;
5629       else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
5630         i.memshift = t->opcode_modifier.disp8memshift;
5631       else
5632         {
5633           const i386_operand_type *type = NULL;
5634
5635           i.memshift = 0;
5636           for (op = 0; op < i.operands; op++)
5637             if (i.flags[op] & Operand_Mem)
5638               {
5639                 if (t->opcode_modifier.evex == EVEXLIG)
5640                   i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
5641                 else if (t->operand_types[op].bitfield.xmmword
5642                          + t->operand_types[op].bitfield.ymmword
5643                          + t->operand_types[op].bitfield.zmmword <= 1)
5644                   type = &t->operand_types[op];
5645                 else if (!i.types[op].bitfield.unspecified)
5646                   type = &i.types[op];
5647               }
5648             else if (i.types[op].bitfield.class == RegSIMD
5649                      && t->opcode_modifier.evex != EVEXLIG)
5650               {
5651                 if (i.types[op].bitfield.zmmword)
5652                   i.memshift = 6;
5653                 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
5654                   i.memshift = 5;
5655                 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
5656                   i.memshift = 4;
5657               }
5658
5659           if (type)
5660             {
5661               if (type->bitfield.zmmword)
5662                 i.memshift = 6;
5663               else if (type->bitfield.ymmword)
5664                 i.memshift = 5;
5665               else if (type->bitfield.xmmword)
5666                 i.memshift = 4;
5667             }
5668
5669           /* For the check in fits_in_disp8().  */
5670           if (i.memshift == 0)
5671             i.memshift = -1;
5672         }
5673
5674       for (op = 0; op < i.operands; op++)
5675         if (operand_type_check (i.types[op], disp)
5676             && i.op[op].disps->X_op == O_constant)
5677           {
5678             if (fits_in_disp8 (i.op[op].disps->X_add_number))
5679               {
5680                 i.types[op].bitfield.disp8 = 1;
5681                 return 0;
5682               }
5683             i.types[op].bitfield.disp8 = 0;
5684           }
5685     }
5686
5687   i.memshift = 0;
5688
5689   return 0;
5690 }
5691
5692 /* Check if operands are valid for the instruction.  Update VEX
5693    operand types.  */
5694
5695 static int
5696 VEX_check_operands (const insn_template *t)
5697 {
5698   if (i.vec_encoding == vex_encoding_evex)
5699     {
5700       /* This instruction must be encoded with EVEX prefix.  */
5701       if (!is_evex_encoding (t))
5702         {
5703           i.error = unsupported;
5704           return 1;
5705         }
5706       return 0;
5707     }
5708
5709   if (!t->opcode_modifier.vex)
5710     {
5711       /* This instruction template doesn't have VEX prefix.  */
5712       if (i.vec_encoding != vex_encoding_default)
5713         {
5714           i.error = unsupported;
5715           return 1;
5716         }
5717       return 0;
5718     }
5719
5720   /* Check the special Imm4 cases; must be the first operand.  */
5721   if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
5722     {
5723       if (i.op[0].imms->X_op != O_constant
5724           || !fits_in_imm4 (i.op[0].imms->X_add_number))
5725         {
5726           i.error = bad_imm4;
5727           return 1;
5728         }
5729
5730       /* Turn off Imm<N> so that update_imm won't complain.  */
5731       operand_type_set (&i.types[0], 0);
5732     }
5733
5734   return 0;
5735 }
5736
5737 static const insn_template *
5738 match_template (char mnem_suffix)
5739 {
5740   /* Points to template once we've found it.  */
5741   const insn_template *t;
5742   i386_operand_type overlap0, overlap1, overlap2, overlap3;
5743   i386_operand_type overlap4;
5744   unsigned int found_reverse_match;
5745   i386_opcode_modifier suffix_check;
5746   i386_operand_type operand_types [MAX_OPERANDS];
5747   int addr_prefix_disp;
5748   unsigned int j, size_match, check_register;
5749   enum i386_error specific_error = 0;
5750
5751 #if MAX_OPERANDS != 5
5752 # error "MAX_OPERANDS must be 5."
5753 #endif
5754
5755   found_reverse_match = 0;
5756   addr_prefix_disp = -1;
5757
5758   /* Prepare for mnemonic suffix check.  */
5759   memset (&suffix_check, 0, sizeof (suffix_check));
5760   switch (mnem_suffix)
5761     {
5762     case BYTE_MNEM_SUFFIX:
5763       suffix_check.no_bsuf = 1;
5764       break;
5765     case WORD_MNEM_SUFFIX:
5766       suffix_check.no_wsuf = 1;
5767       break;
5768     case SHORT_MNEM_SUFFIX:
5769       suffix_check.no_ssuf = 1;
5770       break;
5771     case LONG_MNEM_SUFFIX:
5772       suffix_check.no_lsuf = 1;
5773       break;
5774     case QWORD_MNEM_SUFFIX:
5775       suffix_check.no_qsuf = 1;
5776       break;
5777     default:
5778       /* NB: In Intel syntax, normally we can check for memory operand
5779          size when there is no mnemonic suffix.  But jmp and call have
5780          2 different encodings with Dword memory operand size, one with
5781          No_ldSuf and the other without.  i.suffix is set to
5782          LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf.  */
5783       if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
5784         suffix_check.no_ldsuf = 1;
5785     }
5786
5787   /* Must have right number of operands.  */
5788   i.error = number_of_operands_mismatch;
5789
5790   for (t = current_templates->start; t < current_templates->end; t++)
5791     {
5792       addr_prefix_disp = -1;
5793       found_reverse_match = 0;
5794
5795       if (i.operands != t->operands)
5796         continue;
5797
5798       /* Check processor support.  */
5799       i.error = unsupported;
5800       if (cpu_flags_match (t) != CPU_FLAGS_PERFECT_MATCH)
5801         continue;
5802
5803       /* Check AT&T mnemonic.   */
5804       i.error = unsupported_with_intel_mnemonic;
5805       if (intel_mnemonic && t->opcode_modifier.attmnemonic)
5806         continue;
5807
5808       /* Check AT&T/Intel syntax.  */
5809       i.error = unsupported_syntax;
5810       if ((intel_syntax && t->opcode_modifier.attsyntax)
5811           || (!intel_syntax && t->opcode_modifier.intelsyntax))
5812         continue;
5813
5814       /* Check Intel64/AMD64 ISA.   */
5815       switch (isa64)
5816         {
5817         default:
5818           /* Default: Don't accept Intel64.  */
5819           if (t->opcode_modifier.isa64 == INTEL64)
5820             continue;
5821           break;
5822         case amd64:
5823           /* -mamd64: Don't accept Intel64 and Intel64 only.  */
5824           if (t->opcode_modifier.isa64 >= INTEL64)
5825             continue;
5826           break;
5827         case intel64:
5828           /* -mintel64: Don't accept AMD64.  */
5829           if (t->opcode_modifier.isa64 == AMD64 && flag_code == CODE_64BIT)
5830             continue;
5831           break;
5832         }
5833
5834       /* Check the suffix.  */
5835       i.error = invalid_instruction_suffix;
5836       if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
5837           || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
5838           || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
5839           || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
5840           || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
5841           || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
5842         continue;
5843
5844       size_match = operand_size_match (t);
5845       if (!size_match)
5846         continue;
5847
5848       /* This is intentionally not
5849
5850          if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
5851
5852          as the case of a missing * on the operand is accepted (perhaps with
5853          a warning, issued further down).  */
5854       if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
5855         {
5856           i.error = operand_type_mismatch;
5857           continue;
5858         }
5859
5860       for (j = 0; j < MAX_OPERANDS; j++)
5861         operand_types[j] = t->operand_types[j];
5862
5863       /* In general, don't allow 64-bit operands in 32-bit mode.  */
5864       if (i.suffix == QWORD_MNEM_SUFFIX
5865           && flag_code != CODE_64BIT
5866           && (intel_syntax
5867               ? (!t->opcode_modifier.ignoresize
5868                  && !t->opcode_modifier.broadcast
5869                  && !intel_float_operand (t->name))
5870               : intel_float_operand (t->name) != 2)
5871           && ((operand_types[0].bitfield.class != RegMMX
5872                && operand_types[0].bitfield.class != RegSIMD)
5873               || (operand_types[t->operands > 1].bitfield.class != RegMMX
5874                   && operand_types[t->operands > 1].bitfield.class != RegSIMD))
5875           && (t->base_opcode != 0x0fc7
5876               || t->extension_opcode != 1 /* cmpxchg8b */))
5877         continue;
5878
5879       /* In general, don't allow 32-bit operands on pre-386.  */
5880       else if (i.suffix == LONG_MNEM_SUFFIX
5881                && !cpu_arch_flags.bitfield.cpui386
5882                && (intel_syntax
5883                    ? (!t->opcode_modifier.ignoresize
5884                       && !intel_float_operand (t->name))
5885                    : intel_float_operand (t->name) != 2)
5886                && ((operand_types[0].bitfield.class != RegMMX
5887                     && operand_types[0].bitfield.class != RegSIMD)
5888                    || (operand_types[t->operands > 1].bitfield.class != RegMMX
5889                        && operand_types[t->operands > 1].bitfield.class
5890                           != RegSIMD)))
5891         continue;
5892
5893       /* Do not verify operands when there are none.  */
5894       else
5895         {
5896           if (!t->operands)
5897             /* We've found a match; break out of loop.  */
5898             break;
5899         }
5900
5901       if (!t->opcode_modifier.jump
5902           || t->opcode_modifier.jump == JUMP_ABSOLUTE)
5903         {
5904           /* There should be only one Disp operand.  */
5905           for (j = 0; j < MAX_OPERANDS; j++)
5906             if (operand_type_check (operand_types[j], disp))
5907               break;
5908           if (j < MAX_OPERANDS)
5909             {
5910               bfd_boolean override = (i.prefix[ADDR_PREFIX] != 0);
5911
5912               addr_prefix_disp = j;
5913
5914               /* Address size prefix will turn Disp64/Disp32S/Disp32/Disp16
5915                  operand into Disp32/Disp32/Disp16/Disp32 operand.  */
5916               switch (flag_code)
5917                 {
5918                 case CODE_16BIT:
5919                   override = !override;
5920                   /* Fall through.  */
5921                 case CODE_32BIT:
5922                   if (operand_types[j].bitfield.disp32
5923                       && operand_types[j].bitfield.disp16)
5924                     {
5925                       operand_types[j].bitfield.disp16 = override;
5926                       operand_types[j].bitfield.disp32 = !override;
5927                     }
5928                   operand_types[j].bitfield.disp32s = 0;
5929                   operand_types[j].bitfield.disp64 = 0;
5930                   break;
5931
5932                 case CODE_64BIT:
5933                   if (operand_types[j].bitfield.disp32s
5934                       || operand_types[j].bitfield.disp64)
5935                     {
5936                       operand_types[j].bitfield.disp64 &= !override;
5937                       operand_types[j].bitfield.disp32s &= !override;
5938                       operand_types[j].bitfield.disp32 = override;
5939                     }
5940                   operand_types[j].bitfield.disp16 = 0;
5941                   break;
5942                 }
5943             }
5944         }
5945
5946       /* Force 0x8b encoding for "mov foo@GOT, %eax".  */
5947       if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
5948         continue;
5949
5950       /* We check register size if needed.  */
5951       if (t->opcode_modifier.checkregsize)
5952         {
5953           check_register = (1 << t->operands) - 1;
5954           if (i.broadcast)
5955             check_register &= ~(1 << i.broadcast->operand);
5956         }
5957       else
5958         check_register = 0;
5959
5960       overlap0 = operand_type_and (i.types[0], operand_types[0]);
5961       switch (t->operands)
5962         {
5963         case 1:
5964           if (!operand_type_match (overlap0, i.types[0]))
5965             continue;
5966           break;
5967         case 2:
5968           /* xchg %eax, %eax is a special case. It is an alias for nop
5969              only in 32bit mode and we can use opcode 0x90.  In 64bit
5970              mode, we can't use 0x90 for xchg %eax, %eax since it should
5971              zero-extend %eax to %rax.  */
5972           if (flag_code == CODE_64BIT
5973               && t->base_opcode == 0x90
5974               && i.types[0].bitfield.instance == Accum
5975               && i.types[0].bitfield.dword
5976               && i.types[1].bitfield.instance == Accum
5977               && i.types[1].bitfield.dword)
5978             continue;
5979           /* xrelease mov %eax, <disp> is another special case. It must not
5980              match the accumulator-only encoding of mov.  */
5981           if (flag_code != CODE_64BIT
5982               && i.hle_prefix
5983               && t->base_opcode == 0xa0
5984               && i.types[0].bitfield.instance == Accum
5985               && (i.flags[1] & Operand_Mem))
5986             continue;
5987           /* Fall through.  */
5988
5989         case 3:
5990           if (!(size_match & MATCH_STRAIGHT))
5991             goto check_reverse;
5992           /* Reverse direction of operands if swapping is possible in the first
5993              place (operands need to be symmetric) and
5994              - the load form is requested, and the template is a store form,
5995              - the store form is requested, and the template is a load form,
5996              - the non-default (swapped) form is requested.  */
5997           overlap1 = operand_type_and (operand_types[0], operand_types[1]);
5998           if (t->opcode_modifier.d && i.reg_operands == i.operands
5999               && !operand_type_all_zero (&overlap1))
6000             switch (i.dir_encoding)
6001               {
6002               case dir_encoding_load:
6003                 if (operand_type_check (operand_types[i.operands - 1], anymem)
6004                     || t->opcode_modifier.regmem)
6005                   goto check_reverse;
6006                 break;
6007
6008               case dir_encoding_store:
6009                 if (!operand_type_check (operand_types[i.operands - 1], anymem)
6010                     && !t->opcode_modifier.regmem)
6011                   goto check_reverse;
6012                 break;
6013
6014               case dir_encoding_swap:
6015                 goto check_reverse;
6016
6017               case dir_encoding_default:
6018                 break;
6019               }
6020           /* If we want store form, we skip the current load.  */
6021           if ((i.dir_encoding == dir_encoding_store
6022                || i.dir_encoding == dir_encoding_swap)
6023               && i.mem_operands == 0
6024               && t->opcode_modifier.load)
6025             continue;
6026           /* Fall through.  */
6027         case 4:
6028         case 5:
6029           overlap1 = operand_type_and (i.types[1], operand_types[1]);
6030           if (!operand_type_match (overlap0, i.types[0])
6031               || !operand_type_match (overlap1, i.types[1])
6032               || ((check_register & 3) == 3
6033                   && !operand_type_register_match (i.types[0],
6034                                                    operand_types[0],
6035                                                    i.types[1],
6036                                                    operand_types[1])))
6037             {
6038               /* Check if other direction is valid ...  */
6039               if (!t->opcode_modifier.d)
6040                 continue;
6041
6042 check_reverse:
6043               if (!(size_match & MATCH_REVERSE))
6044                 continue;
6045               /* Try reversing direction of operands.  */
6046               overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
6047               overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
6048               if (!operand_type_match (overlap0, i.types[0])
6049                   || !operand_type_match (overlap1, i.types[i.operands - 1])
6050                   || (check_register
6051                       && !operand_type_register_match (i.types[0],
6052                                                        operand_types[i.operands - 1],
6053                                                        i.types[i.operands - 1],
6054                                                        operand_types[0])))
6055                 {
6056                   /* Does not match either direction.  */
6057                   continue;
6058                 }
6059               /* found_reverse_match holds which of D or FloatR
6060                  we've found.  */
6061               if (!t->opcode_modifier.d)
6062                 found_reverse_match = 0;
6063               else if (operand_types[0].bitfield.tbyte)
6064                 found_reverse_match = Opcode_FloatD;
6065               else if (operand_types[0].bitfield.xmmword
6066                        || operand_types[i.operands - 1].bitfield.xmmword
6067                        || operand_types[0].bitfield.class == RegMMX
6068                        || operand_types[i.operands - 1].bitfield.class == RegMMX
6069                        || is_any_vex_encoding(t))
6070                 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
6071                                       ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
6072               else
6073                 found_reverse_match = Opcode_D;
6074               if (t->opcode_modifier.floatr)
6075                 found_reverse_match |= Opcode_FloatR;
6076             }
6077           else
6078             {
6079               /* Found a forward 2 operand match here.  */
6080               switch (t->operands)
6081                 {
6082                 case 5:
6083                   overlap4 = operand_type_and (i.types[4],
6084                                                operand_types[4]);
6085                   /* Fall through.  */
6086                 case 4:
6087                   overlap3 = operand_type_and (i.types[3],
6088                                                operand_types[3]);
6089                   /* Fall through.  */
6090                 case 3:
6091                   overlap2 = operand_type_and (i.types[2],
6092                                                operand_types[2]);
6093                   break;
6094                 }
6095
6096               switch (t->operands)
6097                 {
6098                 case 5:
6099                   if (!operand_type_match (overlap4, i.types[4])
6100                       || !operand_type_register_match (i.types[3],
6101                                                        operand_types[3],
6102                                                        i.types[4],
6103                                                        operand_types[4]))
6104                     continue;
6105                   /* Fall through.  */
6106                 case 4:
6107                   if (!operand_type_match (overlap3, i.types[3])
6108                       || ((check_register & 0xa) == 0xa
6109                           && !operand_type_register_match (i.types[1],
6110                                                             operand_types[1],
6111                                                             i.types[3],
6112                                                             operand_types[3]))
6113                       || ((check_register & 0xc) == 0xc
6114                           && !operand_type_register_match (i.types[2],
6115                                                             operand_types[2],
6116                                                             i.types[3],
6117                                                             operand_types[3])))
6118                     continue;
6119                   /* Fall through.  */
6120                 case 3:
6121                   /* Here we make use of the fact that there are no
6122                      reverse match 3 operand instructions.  */
6123                   if (!operand_type_match (overlap2, i.types[2])
6124                       || ((check_register & 5) == 5
6125                           && !operand_type_register_match (i.types[0],
6126                                                             operand_types[0],
6127                                                             i.types[2],
6128                                                             operand_types[2]))
6129                       || ((check_register & 6) == 6
6130                           && !operand_type_register_match (i.types[1],
6131                                                             operand_types[1],
6132                                                             i.types[2],
6133                                                             operand_types[2])))
6134                     continue;
6135                   break;
6136                 }
6137             }
6138           /* Found either forward/reverse 2, 3 or 4 operand match here:
6139              slip through to break.  */
6140         }
6141
6142       /* Check if vector and VEX operands are valid.  */
6143       if (check_VecOperands (t) || VEX_check_operands (t))
6144         {
6145           specific_error = i.error;
6146           continue;
6147         }
6148
6149       /* We've found a match; break out of loop.  */
6150       break;
6151     }
6152
6153   if (t == current_templates->end)
6154     {
6155       /* We found no match.  */
6156       const char *err_msg;
6157       switch (specific_error ? specific_error : i.error)
6158         {
6159         default:
6160           abort ();
6161         case operand_size_mismatch:
6162           err_msg = _("operand size mismatch");
6163           break;
6164         case operand_type_mismatch:
6165           err_msg = _("operand type mismatch");
6166           break;
6167         case register_type_mismatch:
6168           err_msg = _("register type mismatch");
6169           break;
6170         case number_of_operands_mismatch:
6171           err_msg = _("number of operands mismatch");
6172           break;
6173         case invalid_instruction_suffix:
6174           err_msg = _("invalid instruction suffix");
6175           break;
6176         case bad_imm4:
6177           err_msg = _("constant doesn't fit in 4 bits");
6178           break;
6179         case unsupported_with_intel_mnemonic:
6180           err_msg = _("unsupported with Intel mnemonic");
6181           break;
6182         case unsupported_syntax:
6183           err_msg = _("unsupported syntax");
6184           break;
6185         case unsupported:
6186           as_bad (_("unsupported instruction `%s'"),
6187                   current_templates->start->name);
6188           return NULL;
6189         case invalid_vsib_address:
6190           err_msg = _("invalid VSIB address");
6191           break;
6192         case invalid_vector_register_set:
6193           err_msg = _("mask, index, and destination registers must be distinct");
6194           break;
6195         case unsupported_vector_index_register:
6196           err_msg = _("unsupported vector index register");
6197           break;
6198         case unsupported_broadcast:
6199           err_msg = _("unsupported broadcast");
6200           break;
6201         case broadcast_needed:
6202           err_msg = _("broadcast is needed for operand of such type");
6203           break;
6204         case unsupported_masking:
6205           err_msg = _("unsupported masking");
6206           break;
6207         case mask_not_on_destination:
6208           err_msg = _("mask not on destination operand");
6209           break;
6210         case no_default_mask:
6211           err_msg = _("default mask isn't allowed");
6212           break;
6213         case unsupported_rc_sae:
6214           err_msg = _("unsupported static rounding/sae");
6215           break;
6216         case rc_sae_operand_not_last_imm:
6217           if (intel_syntax)
6218             err_msg = _("RC/SAE operand must precede immediate operands");
6219           else
6220             err_msg = _("RC/SAE operand must follow immediate operands");
6221           break;
6222         case invalid_register_operand:
6223           err_msg = _("invalid register operand");
6224           break;
6225         }
6226       as_bad (_("%s for `%s'"), err_msg,
6227               current_templates->start->name);
6228       return NULL;
6229     }
6230
6231   if (!quiet_warnings)
6232     {
6233       if (!intel_syntax
6234           && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
6235         as_warn (_("indirect %s without `*'"), t->name);
6236
6237       if (t->opcode_modifier.isprefix
6238           && t->opcode_modifier.ignoresize)
6239         {
6240           /* Warn them that a data or address size prefix doesn't
6241              affect assembly of the next line of code.  */
6242           as_warn (_("stand-alone `%s' prefix"), t->name);
6243         }
6244     }
6245
6246   /* Copy the template we found.  */
6247   i.tm = *t;
6248
6249   if (addr_prefix_disp != -1)
6250     i.tm.operand_types[addr_prefix_disp]
6251       = operand_types[addr_prefix_disp];
6252
6253   if (found_reverse_match)
6254     {
6255       /* If we found a reverse match we must alter the opcode direction
6256          bit and clear/flip the regmem modifier one.  found_reverse_match
6257          holds bits to change (different for int & float insns).  */
6258
6259       i.tm.base_opcode ^= found_reverse_match;
6260
6261       i.tm.operand_types[0] = operand_types[i.operands - 1];
6262       i.tm.operand_types[i.operands - 1] = operand_types[0];
6263
6264       /* Certain SIMD insns have their load forms specified in the opcode
6265          table, and hence we need to _set_ RegMem instead of clearing it.
6266          We need to avoid setting the bit though on insns like KMOVW.  */
6267       i.tm.opcode_modifier.regmem
6268         = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6269           && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6270           && !i.tm.opcode_modifier.regmem;
6271     }
6272
6273   return t;
6274 }
6275
6276 static int
6277 check_string (void)
6278 {
6279   unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
6280   unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
6281
6282   if (i.seg[op] != NULL && i.seg[op] != &es)
6283     {
6284       as_bad (_("`%s' operand %u must use `%ses' segment"),
6285               i.tm.name,
6286               intel_syntax ? i.tm.operands - es_op : es_op + 1,
6287               register_prefix);
6288       return 0;
6289     }
6290
6291   /* There's only ever one segment override allowed per instruction.
6292      This instruction possibly has a legal segment override on the
6293      second operand, so copy the segment to where non-string
6294      instructions store it, allowing common code.  */
6295   i.seg[op] = i.seg[1];
6296
6297   return 1;
6298 }
6299
6300 static int
6301 process_suffix (void)
6302 {
6303   /* If matched instruction specifies an explicit instruction mnemonic
6304      suffix, use it.  */
6305   if (i.tm.opcode_modifier.size == SIZE16)
6306     i.suffix = WORD_MNEM_SUFFIX;
6307   else if (i.tm.opcode_modifier.size == SIZE32)
6308     i.suffix = LONG_MNEM_SUFFIX;
6309   else if (i.tm.opcode_modifier.size == SIZE64)
6310     i.suffix = QWORD_MNEM_SUFFIX;
6311   else if (i.reg_operands
6312            && (i.operands > 1 || i.types[0].bitfield.class == Reg))
6313     {
6314       /* If there's no instruction mnemonic suffix we try to invent one
6315          based on GPR operands.  */
6316       if (!i.suffix)
6317         {
6318           /* We take i.suffix from the last register operand specified,
6319              Destination register type is more significant than source
6320              register type.  crc32 in SSE4.2 prefers source register
6321              type. */
6322           unsigned int op = i.tm.base_opcode != 0xf20f38f0 ? i.operands : 1;
6323
6324           while (op--)
6325             if (i.tm.operand_types[op].bitfield.instance == InstanceNone
6326                 || i.tm.operand_types[op].bitfield.instance == Accum)
6327               {
6328                 if (i.types[op].bitfield.class != Reg)
6329                   continue;
6330                 if (i.types[op].bitfield.byte)
6331                   i.suffix = BYTE_MNEM_SUFFIX;
6332                 else if (i.types[op].bitfield.word)
6333                   i.suffix = WORD_MNEM_SUFFIX;
6334                 else if (i.types[op].bitfield.dword)
6335                   i.suffix = LONG_MNEM_SUFFIX;
6336                 else if (i.types[op].bitfield.qword)
6337                   i.suffix = QWORD_MNEM_SUFFIX;
6338                 else
6339                   continue;
6340                 break;
6341               }
6342         }
6343       else if (i.suffix == BYTE_MNEM_SUFFIX)
6344         {
6345           if (intel_syntax
6346               && i.tm.opcode_modifier.ignoresize
6347               && i.tm.opcode_modifier.no_bsuf)
6348             i.suffix = 0;
6349           else if (!check_byte_reg ())
6350             return 0;
6351         }
6352       else if (i.suffix == LONG_MNEM_SUFFIX)
6353         {
6354           if (intel_syntax
6355               && i.tm.opcode_modifier.ignoresize
6356               && i.tm.opcode_modifier.no_lsuf
6357               && !i.tm.opcode_modifier.todword
6358               && !i.tm.opcode_modifier.toqword)
6359             i.suffix = 0;
6360           else if (!check_long_reg ())
6361             return 0;
6362         }
6363       else if (i.suffix == QWORD_MNEM_SUFFIX)
6364         {
6365           if (intel_syntax
6366               && i.tm.opcode_modifier.ignoresize
6367               && i.tm.opcode_modifier.no_qsuf
6368               && !i.tm.opcode_modifier.todword
6369               && !i.tm.opcode_modifier.toqword)
6370             i.suffix = 0;
6371           else if (!check_qword_reg ())
6372             return 0;
6373         }
6374       else if (i.suffix == WORD_MNEM_SUFFIX)
6375         {
6376           if (intel_syntax
6377               && i.tm.opcode_modifier.ignoresize
6378               && i.tm.opcode_modifier.no_wsuf)
6379             i.suffix = 0;
6380           else if (!check_word_reg ())
6381             return 0;
6382         }
6383       else if (intel_syntax && i.tm.opcode_modifier.ignoresize)
6384         /* Do nothing if the instruction is going to ignore the prefix.  */
6385         ;
6386       else
6387         abort ();
6388     }
6389   else if (i.tm.opcode_modifier.defaultsize && !i.suffix)
6390     {
6391       i.suffix = stackop_size;
6392       if (stackop_size == LONG_MNEM_SUFFIX)
6393         {
6394           /* stackop_size is set to LONG_MNEM_SUFFIX for the
6395              .code16gcc directive to support 16-bit mode with
6396              32-bit address.  For IRET without a suffix, generate
6397              16-bit IRET (opcode 0xcf) to return from an interrupt
6398              handler.  */
6399           if (i.tm.base_opcode == 0xcf)
6400             {
6401               i.suffix = WORD_MNEM_SUFFIX;
6402               as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6403             }
6404           /* Warn about changed behavior for segment register push/pop.  */
6405           else if ((i.tm.base_opcode | 1) == 0x07)
6406             as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
6407                      i.tm.name);
6408         }
6409     }
6410   else if (!i.suffix
6411            && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
6412                || i.tm.opcode_modifier.jump == JUMP_BYTE
6413                || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
6414                || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6415                    && i.tm.extension_opcode <= 3)))
6416     {
6417       switch (flag_code)
6418         {
6419         case CODE_64BIT:
6420           if (!i.tm.opcode_modifier.no_qsuf)
6421             {
6422               i.suffix = QWORD_MNEM_SUFFIX;
6423               break;
6424             }
6425           /* Fall through.  */
6426         case CODE_32BIT:
6427           if (!i.tm.opcode_modifier.no_lsuf)
6428             i.suffix = LONG_MNEM_SUFFIX;
6429           break;
6430         case CODE_16BIT:
6431           if (!i.tm.opcode_modifier.no_wsuf)
6432             i.suffix = WORD_MNEM_SUFFIX;
6433           break;
6434         }
6435     }
6436
6437   if (!i.suffix
6438       && (!i.tm.opcode_modifier.defaultsize
6439           /* Also cover lret/retf/iret in 64-bit mode.  */
6440           || (flag_code == CODE_64BIT
6441               && !i.tm.opcode_modifier.no_lsuf
6442               && !i.tm.opcode_modifier.no_qsuf))
6443       && !i.tm.opcode_modifier.ignoresize
6444       /* Accept FLDENV et al without suffix.  */
6445       && (i.tm.opcode_modifier.no_ssuf || i.tm.opcode_modifier.floatmf))
6446     {
6447       unsigned int suffixes, evex = 0;
6448
6449       suffixes = !i.tm.opcode_modifier.no_bsuf;
6450       if (!i.tm.opcode_modifier.no_wsuf)
6451         suffixes |= 1 << 1;
6452       if (!i.tm.opcode_modifier.no_lsuf)
6453         suffixes |= 1 << 2;
6454       if (!i.tm.opcode_modifier.no_ldsuf)
6455         suffixes |= 1 << 3;
6456       if (!i.tm.opcode_modifier.no_ssuf)
6457         suffixes |= 1 << 4;
6458       if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6459         suffixes |= 1 << 5;
6460
6461       /* For [XYZ]MMWORD operands inspect operand sizes.  While generally
6462          also suitable for AT&T syntax mode, it was requested that this be
6463          restricted to just Intel syntax.  */
6464       if (intel_syntax)
6465         {
6466           i386_cpu_flags cpu = cpu_flags_and (i.tm.cpu_flags, avx512);
6467
6468           if (!cpu_flags_all_zero (&cpu) && !i.broadcast)
6469             {
6470               unsigned int op;
6471
6472               for (op = 0; op < i.tm.operands; ++op)
6473                 {
6474                   if (!cpu_arch_flags.bitfield.cpuavx512vl)
6475                     {
6476                       if (i.tm.operand_types[op].bitfield.ymmword)
6477                         i.tm.operand_types[op].bitfield.xmmword = 0;
6478                       if (i.tm.operand_types[op].bitfield.zmmword)
6479                         i.tm.operand_types[op].bitfield.ymmword = 0;
6480                       if (!i.tm.opcode_modifier.evex
6481                           || i.tm.opcode_modifier.evex == EVEXDYN)
6482                         i.tm.opcode_modifier.evex = EVEX512;
6483                     }
6484
6485                   if (i.tm.operand_types[op].bitfield.xmmword
6486                       + i.tm.operand_types[op].bitfield.ymmword
6487                       + i.tm.operand_types[op].bitfield.zmmword < 2)
6488                     continue;
6489
6490                   /* Any properly sized operand disambiguates the insn.  */
6491                   if (i.types[op].bitfield.xmmword
6492                       || i.types[op].bitfield.ymmword
6493                       || i.types[op].bitfield.zmmword)
6494                     {
6495                       suffixes &= ~(7 << 6);
6496                       evex = 0;
6497                       break;
6498                     }
6499
6500                   if ((i.flags[op] & Operand_Mem)
6501                       && i.tm.operand_types[op].bitfield.unspecified)
6502                     {
6503                       if (i.tm.operand_types[op].bitfield.xmmword)
6504                         suffixes |= 1 << 6;
6505                       if (i.tm.operand_types[op].bitfield.ymmword)
6506                         suffixes |= 1 << 7;
6507                       if (i.tm.operand_types[op].bitfield.zmmword)
6508                         suffixes |= 1 << 8;
6509                       evex = EVEX512;
6510                     }
6511                 }
6512             }
6513         }
6514
6515       /* Are multiple suffixes / operand sizes allowed?  */
6516       if (suffixes & (suffixes - 1))
6517         {
6518           if (intel_syntax
6519               && (!i.tm.opcode_modifier.defaultsize
6520                   || operand_check == check_error))
6521             {
6522               as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
6523               return 0;
6524             }
6525           if (operand_check == check_error)
6526             {
6527               as_bad (_("no instruction mnemonic suffix given and "
6528                         "no register operands; can't size `%s'"), i.tm.name);
6529               return 0;
6530             }
6531           if (operand_check == check_warning)
6532             as_warn (_("%s; using default for `%s'"),
6533                        intel_syntax
6534                        ? _("ambiguous operand size")
6535                        : _("no instruction mnemonic suffix given and "
6536                            "no register operands"),
6537                        i.tm.name);
6538
6539           if (i.tm.opcode_modifier.floatmf)
6540             i.suffix = SHORT_MNEM_SUFFIX;
6541           else if (evex)
6542             i.tm.opcode_modifier.evex = evex;
6543           else if (flag_code == CODE_16BIT)
6544             i.suffix = WORD_MNEM_SUFFIX;
6545           else if (!i.tm.opcode_modifier.no_lsuf)
6546             i.suffix = LONG_MNEM_SUFFIX;
6547           else
6548             i.suffix = QWORD_MNEM_SUFFIX;
6549         }
6550     }
6551
6552   if (!i.tm.opcode_modifier.modrm && i.reg_operands && i.tm.operands < 3)
6553     i.short_form = (i.tm.operand_types[0].bitfield.class == Reg)
6554                    != (i.tm.operand_types[1].bitfield.class == Reg);
6555
6556   /* Change the opcode based on the operand size given by i.suffix.  */
6557   switch (i.suffix)
6558     {
6559     /* Size floating point instruction.  */
6560     case LONG_MNEM_SUFFIX:
6561       if (i.tm.opcode_modifier.floatmf)
6562         {
6563           i.tm.base_opcode ^= 4;
6564           break;
6565         }
6566     /* fall through */
6567     case WORD_MNEM_SUFFIX:
6568     case QWORD_MNEM_SUFFIX:
6569       /* It's not a byte, select word/dword operation.  */
6570       if (i.tm.opcode_modifier.w)
6571         {
6572           if (i.short_form)
6573             i.tm.base_opcode |= 8;
6574           else
6575             i.tm.base_opcode |= 1;
6576         }
6577     /* fall through */
6578     case SHORT_MNEM_SUFFIX:
6579       /* Now select between word & dword operations via the operand
6580          size prefix, except for instructions that will ignore this
6581          prefix anyway.  */
6582       if (i.reg_operands > 0
6583           && i.types[0].bitfield.class == Reg
6584           && i.tm.opcode_modifier.addrprefixopreg
6585           && (i.tm.operand_types[0].bitfield.instance == Accum
6586               || i.operands == 1))
6587         {
6588           /* The address size override prefix changes the size of the
6589              first operand.  */
6590           if ((flag_code == CODE_32BIT
6591                && i.op[0].regs->reg_type.bitfield.word)
6592               || (flag_code != CODE_32BIT
6593                   && i.op[0].regs->reg_type.bitfield.dword))
6594             if (!add_prefix (ADDR_PREFIX_OPCODE))
6595               return 0;
6596         }
6597       else if (i.suffix != QWORD_MNEM_SUFFIX
6598                && !i.tm.opcode_modifier.ignoresize
6599                && !i.tm.opcode_modifier.floatmf
6600                && !is_any_vex_encoding (&i.tm)
6601                && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
6602                    || (flag_code == CODE_64BIT
6603                        && i.tm.opcode_modifier.jump == JUMP_BYTE)))
6604         {
6605           unsigned int prefix = DATA_PREFIX_OPCODE;
6606
6607           if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
6608             prefix = ADDR_PREFIX_OPCODE;
6609
6610           if (!add_prefix (prefix))
6611             return 0;
6612         }
6613
6614       /* Set mode64 for an operand.  */
6615       if (i.suffix == QWORD_MNEM_SUFFIX
6616           && flag_code == CODE_64BIT
6617           && !i.tm.opcode_modifier.norex64
6618           /* Special case for xchg %rax,%rax.  It is NOP and doesn't
6619              need rex64. */
6620           && ! (i.operands == 2
6621                 && i.tm.base_opcode == 0x90
6622                 && i.tm.extension_opcode == None
6623                 && i.types[0].bitfield.instance == Accum
6624                 && i.types[0].bitfield.qword
6625                 && i.types[1].bitfield.instance == Accum
6626                 && i.types[1].bitfield.qword))
6627         i.rex |= REX_W;
6628
6629       break;
6630     }
6631
6632   if (i.reg_operands != 0
6633       && i.operands > 1
6634       && i.tm.opcode_modifier.addrprefixopreg
6635       && i.tm.operand_types[0].bitfield.instance != Accum)
6636     {
6637       /* Check invalid register operand when the address size override
6638          prefix changes the size of register operands.  */
6639       unsigned int op;
6640       enum { need_word, need_dword, need_qword } need;
6641
6642       if (flag_code == CODE_32BIT)
6643         need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
6644       else
6645         {
6646           if (i.prefix[ADDR_PREFIX])
6647             need = need_dword;
6648           else
6649             need = flag_code == CODE_64BIT ? need_qword : need_word;
6650         }
6651
6652       for (op = 0; op < i.operands; op++)
6653         if (i.types[op].bitfield.class == Reg
6654             && ((need == need_word
6655                  && !i.op[op].regs->reg_type.bitfield.word)
6656                 || (need == need_dword
6657                     && !i.op[op].regs->reg_type.bitfield.dword)
6658                 || (need == need_qword
6659                     && !i.op[op].regs->reg_type.bitfield.qword)))
6660           {
6661             as_bad (_("invalid register operand size for `%s'"),
6662                     i.tm.name);
6663             return 0;
6664           }
6665     }
6666
6667   return 1;
6668 }
6669
6670 static int
6671 check_byte_reg (void)
6672 {
6673   int op;
6674
6675   for (op = i.operands; --op >= 0;)
6676     {
6677       /* Skip non-register operands. */
6678       if (i.types[op].bitfield.class != Reg)
6679         continue;
6680
6681       /* If this is an eight bit register, it's OK.  If it's the 16 or
6682          32 bit version of an eight bit register, we will just use the
6683          low portion, and that's OK too.  */
6684       if (i.types[op].bitfield.byte)
6685         continue;
6686
6687       /* I/O port address operands are OK too.  */
6688       if (i.tm.operand_types[op].bitfield.instance == RegD
6689           && i.tm.operand_types[op].bitfield.word)
6690         continue;
6691
6692       /* crc32 only wants its source operand checked here.  */
6693       if (i.tm.base_opcode == 0xf20f38f0 && op)
6694         continue;
6695
6696       /* Any other register is bad.  */
6697       if (i.types[op].bitfield.class == Reg
6698           || i.types[op].bitfield.class == RegMMX
6699           || i.types[op].bitfield.class == RegSIMD
6700           || i.types[op].bitfield.class == SReg
6701           || i.types[op].bitfield.class == RegCR
6702           || i.types[op].bitfield.class == RegDR
6703           || i.types[op].bitfield.class == RegTR)
6704         {
6705           as_bad (_("`%s%s' not allowed with `%s%c'"),
6706                   register_prefix,
6707                   i.op[op].regs->reg_name,
6708                   i.tm.name,
6709                   i.suffix);
6710           return 0;
6711         }
6712     }
6713   return 1;
6714 }
6715
6716 static int
6717 check_long_reg (void)
6718 {
6719   int op;
6720
6721   for (op = i.operands; --op >= 0;)
6722     /* Skip non-register operands. */
6723     if (i.types[op].bitfield.class != Reg)
6724       continue;
6725     /* Reject eight bit registers, except where the template requires
6726        them. (eg. movzb)  */
6727     else if (i.types[op].bitfield.byte
6728              && (i.tm.operand_types[op].bitfield.class == Reg
6729                  || i.tm.operand_types[op].bitfield.instance == Accum)
6730              && (i.tm.operand_types[op].bitfield.word
6731                  || i.tm.operand_types[op].bitfield.dword))
6732       {
6733         as_bad (_("`%s%s' not allowed with `%s%c'"),
6734                 register_prefix,
6735                 i.op[op].regs->reg_name,
6736                 i.tm.name,
6737                 i.suffix);
6738         return 0;
6739       }
6740     /* Error if the e prefix on a general reg is missing.  */
6741     else if (i.types[op].bitfield.word
6742              && (i.tm.operand_types[op].bitfield.class == Reg
6743                  || i.tm.operand_types[op].bitfield.instance == Accum)
6744              && i.tm.operand_types[op].bitfield.dword)
6745       {
6746         as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6747                 register_prefix, i.op[op].regs->reg_name,
6748                 i.suffix);
6749         return 0;
6750       }
6751     /* Warn if the r prefix on a general reg is present.  */
6752     else if (i.types[op].bitfield.qword
6753              && (i.tm.operand_types[op].bitfield.class == Reg
6754                  || i.tm.operand_types[op].bitfield.instance == Accum)
6755              && i.tm.operand_types[op].bitfield.dword)
6756       {
6757         if (intel_syntax
6758             && (i.tm.opcode_modifier.toqword
6759                 /* Also convert to QWORD for MOVSXD.  */
6760                 || i.tm.base_opcode == 0x63)
6761             && i.types[0].bitfield.class != RegSIMD)
6762           {
6763             /* Convert to QWORD.  We want REX byte. */
6764             i.suffix = QWORD_MNEM_SUFFIX;
6765           }
6766         else
6767           {
6768             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6769                     register_prefix, i.op[op].regs->reg_name,
6770                     i.suffix);
6771             return 0;
6772           }
6773       }
6774   return 1;
6775 }
6776
6777 static int
6778 check_qword_reg (void)
6779 {
6780   int op;
6781
6782   for (op = i.operands; --op >= 0; )
6783     /* Skip non-register operands. */
6784     if (i.types[op].bitfield.class != Reg)
6785       continue;
6786     /* Reject eight bit registers, except where the template requires
6787        them. (eg. movzb)  */
6788     else if (i.types[op].bitfield.byte
6789              && (i.tm.operand_types[op].bitfield.class == Reg
6790                  || i.tm.operand_types[op].bitfield.instance == Accum)
6791              && (i.tm.operand_types[op].bitfield.word
6792                  || i.tm.operand_types[op].bitfield.dword))
6793       {
6794         as_bad (_("`%s%s' not allowed with `%s%c'"),
6795                 register_prefix,
6796                 i.op[op].regs->reg_name,
6797                 i.tm.name,
6798                 i.suffix);
6799         return 0;
6800       }
6801     /* Warn if the r prefix on a general reg is missing.  */
6802     else if ((i.types[op].bitfield.word
6803               || i.types[op].bitfield.dword)
6804              && (i.tm.operand_types[op].bitfield.class == Reg
6805                  || i.tm.operand_types[op].bitfield.instance == Accum)
6806              && i.tm.operand_types[op].bitfield.qword)
6807       {
6808         /* Prohibit these changes in the 64bit mode, since the
6809            lowering is more complicated.  */
6810         if (intel_syntax
6811             && i.tm.opcode_modifier.todword
6812             && i.types[0].bitfield.class != RegSIMD)
6813           {
6814             /* Convert to DWORD.  We don't want REX byte. */
6815             i.suffix = LONG_MNEM_SUFFIX;
6816           }
6817         else
6818           {
6819             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6820                     register_prefix, i.op[op].regs->reg_name,
6821                     i.suffix);
6822             return 0;
6823           }
6824       }
6825   return 1;
6826 }
6827
6828 static int
6829 check_word_reg (void)
6830 {
6831   int op;
6832   for (op = i.operands; --op >= 0;)
6833     /* Skip non-register operands. */
6834     if (i.types[op].bitfield.class != Reg)
6835       continue;
6836     /* Reject eight bit registers, except where the template requires
6837        them. (eg. movzb)  */
6838     else if (i.types[op].bitfield.byte
6839              && (i.tm.operand_types[op].bitfield.class == Reg
6840                  || i.tm.operand_types[op].bitfield.instance == Accum)
6841              && (i.tm.operand_types[op].bitfield.word
6842                  || i.tm.operand_types[op].bitfield.dword))
6843       {
6844         as_bad (_("`%s%s' not allowed with `%s%c'"),
6845                 register_prefix,
6846                 i.op[op].regs->reg_name,
6847                 i.tm.name,
6848                 i.suffix);
6849         return 0;
6850       }
6851     /* Error if the e or r prefix on a general reg is present.  */
6852     else if ((i.types[op].bitfield.dword
6853                  || i.types[op].bitfield.qword)
6854              && (i.tm.operand_types[op].bitfield.class == Reg
6855                  || i.tm.operand_types[op].bitfield.instance == Accum)
6856              && i.tm.operand_types[op].bitfield.word)
6857       {
6858         as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6859                 register_prefix, i.op[op].regs->reg_name,
6860                 i.suffix);
6861         return 0;
6862       }
6863   return 1;
6864 }
6865
6866 static int
6867 update_imm (unsigned int j)
6868 {
6869   i386_operand_type overlap = i.types[j];
6870   if ((overlap.bitfield.imm8
6871        || overlap.bitfield.imm8s
6872        || overlap.bitfield.imm16
6873        || overlap.bitfield.imm32
6874        || overlap.bitfield.imm32s
6875        || overlap.bitfield.imm64)
6876       && !operand_type_equal (&overlap, &imm8)
6877       && !operand_type_equal (&overlap, &imm8s)
6878       && !operand_type_equal (&overlap, &imm16)
6879       && !operand_type_equal (&overlap, &imm32)
6880       && !operand_type_equal (&overlap, &imm32s)
6881       && !operand_type_equal (&overlap, &imm64))
6882     {
6883       if (i.suffix)
6884         {
6885           i386_operand_type temp;
6886
6887           operand_type_set (&temp, 0);
6888           if (i.suffix == BYTE_MNEM_SUFFIX)
6889             {
6890               temp.bitfield.imm8 = overlap.bitfield.imm8;
6891               temp.bitfield.imm8s = overlap.bitfield.imm8s;
6892             }
6893           else if (i.suffix == WORD_MNEM_SUFFIX)
6894             temp.bitfield.imm16 = overlap.bitfield.imm16;
6895           else if (i.suffix == QWORD_MNEM_SUFFIX)
6896             {
6897               temp.bitfield.imm64 = overlap.bitfield.imm64;
6898               temp.bitfield.imm32s = overlap.bitfield.imm32s;
6899             }
6900           else
6901             temp.bitfield.imm32 = overlap.bitfield.imm32;
6902           overlap = temp;
6903         }
6904       else if (operand_type_equal (&overlap, &imm16_32_32s)
6905                || operand_type_equal (&overlap, &imm16_32)
6906                || operand_type_equal (&overlap, &imm16_32s))
6907         {
6908           if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
6909             overlap = imm16;
6910           else
6911             overlap = imm32s;
6912         }
6913       if (!operand_type_equal (&overlap, &imm8)
6914           && !operand_type_equal (&overlap, &imm8s)
6915           && !operand_type_equal (&overlap, &imm16)
6916           && !operand_type_equal (&overlap, &imm32)
6917           && !operand_type_equal (&overlap, &imm32s)
6918           && !operand_type_equal (&overlap, &imm64))
6919         {
6920           as_bad (_("no instruction mnemonic suffix given; "
6921                     "can't determine immediate size"));
6922           return 0;
6923         }
6924     }
6925   i.types[j] = overlap;
6926
6927   return 1;
6928 }
6929
6930 static int
6931 finalize_imm (void)
6932 {
6933   unsigned int j, n;
6934
6935   /* Update the first 2 immediate operands.  */
6936   n = i.operands > 2 ? 2 : i.operands;
6937   if (n)
6938     {
6939       for (j = 0; j < n; j++)
6940         if (update_imm (j) == 0)
6941           return 0;
6942
6943       /* The 3rd operand can't be immediate operand.  */
6944       gas_assert (operand_type_check (i.types[2], imm) == 0);
6945     }
6946
6947   return 1;
6948 }
6949
6950 static int
6951 process_operands (void)
6952 {
6953   /* Default segment register this instruction will use for memory
6954      accesses.  0 means unknown.  This is only for optimizing out
6955      unnecessary segment overrides.  */
6956   const seg_entry *default_seg = 0;
6957
6958   if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
6959     {
6960       unsigned int dupl = i.operands;
6961       unsigned int dest = dupl - 1;
6962       unsigned int j;
6963
6964       /* The destination must be an xmm register.  */
6965       gas_assert (i.reg_operands
6966                   && MAX_OPERANDS > dupl
6967                   && operand_type_equal (&i.types[dest], &regxmm));
6968
6969       if (i.tm.operand_types[0].bitfield.instance == Accum
6970           && i.tm.operand_types[0].bitfield.xmmword)
6971         {
6972           if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
6973             {
6974               /* Keep xmm0 for instructions with VEX prefix and 3
6975                  sources.  */
6976               i.tm.operand_types[0].bitfield.instance = InstanceNone;
6977               i.tm.operand_types[0].bitfield.class = RegSIMD;
6978               goto duplicate;
6979             }
6980           else
6981             {
6982               /* We remove the first xmm0 and keep the number of
6983                  operands unchanged, which in fact duplicates the
6984                  destination.  */
6985               for (j = 1; j < i.operands; j++)
6986                 {
6987                   i.op[j - 1] = i.op[j];
6988                   i.types[j - 1] = i.types[j];
6989                   i.tm.operand_types[j - 1] = i.tm.operand_types[j];
6990                   i.flags[j - 1] = i.flags[j];
6991                 }
6992             }
6993         }
6994       else if (i.tm.opcode_modifier.implicit1stxmm0)
6995         {
6996           gas_assert ((MAX_OPERANDS - 1) > dupl
6997                       && (i.tm.opcode_modifier.vexsources
6998                           == VEX3SOURCES));
6999
7000           /* Add the implicit xmm0 for instructions with VEX prefix
7001              and 3 sources.  */
7002           for (j = i.operands; j > 0; j--)
7003             {
7004               i.op[j] = i.op[j - 1];
7005               i.types[j] = i.types[j - 1];
7006               i.tm.operand_types[j] = i.tm.operand_types[j - 1];
7007               i.flags[j] = i.flags[j - 1];
7008             }
7009           i.op[0].regs
7010             = (const reg_entry *) hash_find (reg_hash, "xmm0");
7011           i.types[0] = regxmm;
7012           i.tm.operand_types[0] = regxmm;
7013
7014           i.operands += 2;
7015           i.reg_operands += 2;
7016           i.tm.operands += 2;
7017
7018           dupl++;
7019           dest++;
7020           i.op[dupl] = i.op[dest];
7021           i.types[dupl] = i.types[dest];
7022           i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7023           i.flags[dupl] = i.flags[dest];
7024         }
7025       else
7026         {
7027 duplicate:
7028           i.operands++;
7029           i.reg_operands++;
7030           i.tm.operands++;
7031
7032           i.op[dupl] = i.op[dest];
7033           i.types[dupl] = i.types[dest];
7034           i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7035           i.flags[dupl] = i.flags[dest];
7036         }
7037
7038        if (i.tm.opcode_modifier.immext)
7039          process_immext ();
7040     }
7041   else if (i.tm.operand_types[0].bitfield.instance == Accum
7042            && i.tm.operand_types[0].bitfield.xmmword)
7043     {
7044       unsigned int j;
7045
7046       for (j = 1; j < i.operands; j++)
7047         {
7048           i.op[j - 1] = i.op[j];
7049           i.types[j - 1] = i.types[j];
7050
7051           /* We need to adjust fields in i.tm since they are used by
7052              build_modrm_byte.  */
7053           i.tm.operand_types [j - 1] = i.tm.operand_types [j];
7054
7055           i.flags[j - 1] = i.flags[j];
7056         }
7057
7058       i.operands--;
7059       i.reg_operands--;
7060       i.tm.operands--;
7061     }
7062   else if (i.tm.opcode_modifier.implicitquadgroup)
7063     {
7064       unsigned int regnum, first_reg_in_group, last_reg_in_group;
7065
7066       /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
7067       gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
7068       regnum = register_number (i.op[1].regs);
7069       first_reg_in_group = regnum & ~3;
7070       last_reg_in_group = first_reg_in_group + 3;
7071       if (regnum != first_reg_in_group)
7072         as_warn (_("source register `%s%s' implicitly denotes"
7073                    " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
7074                  register_prefix, i.op[1].regs->reg_name,
7075                  register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
7076                  register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
7077                  i.tm.name);
7078     }
7079   else if (i.tm.opcode_modifier.regkludge)
7080     {
7081       /* The imul $imm, %reg instruction is converted into
7082          imul $imm, %reg, %reg, and the clr %reg instruction
7083          is converted into xor %reg, %reg.  */
7084
7085       unsigned int first_reg_op;
7086
7087       if (operand_type_check (i.types[0], reg))
7088         first_reg_op = 0;
7089       else
7090         first_reg_op = 1;
7091       /* Pretend we saw the extra register operand.  */
7092       gas_assert (i.reg_operands == 1
7093                   && i.op[first_reg_op + 1].regs == 0);
7094       i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7095       i.types[first_reg_op + 1] = i.types[first_reg_op];
7096       i.operands++;
7097       i.reg_operands++;
7098     }
7099
7100   if (i.tm.opcode_modifier.modrm)
7101     {
7102       /* The opcode is completed (modulo i.tm.extension_opcode which
7103          must be put into the modrm byte).  Now, we make the modrm and
7104          index base bytes based on all the info we've collected.  */
7105
7106       default_seg = build_modrm_byte ();
7107     }
7108   else if (i.types[0].bitfield.class == SReg)
7109     {
7110       if (flag_code != CODE_64BIT
7111           ? i.tm.base_opcode == POP_SEG_SHORT
7112             && i.op[0].regs->reg_num == 1
7113           : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
7114             && i.op[0].regs->reg_num < 4)
7115         {
7116           as_bad (_("you can't `%s %s%s'"),
7117                   i.tm.name, register_prefix, i.op[0].regs->reg_name);
7118           return 0;
7119         }
7120       if ( i.op[0].regs->reg_num > 3 && i.tm.opcode_length == 1 )
7121         {
7122           i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
7123           i.tm.opcode_length = 2;
7124         }
7125       i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
7126     }
7127   else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
7128     {
7129       default_seg = &ds;
7130     }
7131   else if (i.tm.opcode_modifier.isstring)
7132     {
7133       /* For the string instructions that allow a segment override
7134          on one of their operands, the default segment is ds.  */
7135       default_seg = &ds;
7136     }
7137   else if (i.short_form)
7138     {
7139       /* The register or float register operand is in operand
7140          0 or 1.  */
7141       unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
7142
7143       /* Register goes in low 3 bits of opcode.  */
7144       i.tm.base_opcode |= i.op[op].regs->reg_num;
7145       if ((i.op[op].regs->reg_flags & RegRex) != 0)
7146         i.rex |= REX_B;
7147       if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7148         {
7149           /* Warn about some common errors, but press on regardless.
7150              The first case can be generated by gcc (<= 2.8.1).  */
7151           if (i.operands == 2)
7152             {
7153               /* Reversed arguments on faddp, fsubp, etc.  */
7154               as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7155                        register_prefix, i.op[!intel_syntax].regs->reg_name,
7156                        register_prefix, i.op[intel_syntax].regs->reg_name);
7157             }
7158           else
7159             {
7160               /* Extraneous `l' suffix on fp insn.  */
7161               as_warn (_("translating to `%s %s%s'"), i.tm.name,
7162                        register_prefix, i.op[0].regs->reg_name);
7163             }
7164         }
7165     }
7166
7167   if ((i.seg[0] || i.prefix[SEG_PREFIX])
7168       && i.tm.base_opcode == 0x8d /* lea */
7169       && !is_any_vex_encoding(&i.tm))
7170     {
7171       if (!quiet_warnings)
7172         as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7173       if (optimize)
7174         {
7175           i.seg[0] = NULL;
7176           i.prefix[SEG_PREFIX] = 0;
7177         }
7178     }
7179
7180   /* If a segment was explicitly specified, and the specified segment
7181      is not the default, use an opcode prefix to select it.  If we
7182      never figured out what the default segment is, then default_seg
7183      will be zero at this point, and the specified segment prefix will
7184      always be used.  */
7185   if ((i.seg[0]) && (i.seg[0] != default_seg))
7186     {
7187       if (!add_prefix (i.seg[0]->seg_prefix))
7188         return 0;
7189     }
7190   return 1;
7191 }
7192
7193 static const seg_entry *
7194 build_modrm_byte (void)
7195 {
7196   const seg_entry *default_seg = 0;
7197   unsigned int source, dest;
7198   int vex_3_sources;
7199
7200   vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
7201   if (vex_3_sources)
7202     {
7203       unsigned int nds, reg_slot;
7204       expressionS *exp;
7205
7206       dest = i.operands - 1;
7207       nds = dest - 1;
7208
7209       /* There are 2 kinds of instructions:
7210          1. 5 operands: 4 register operands or 3 register operands
7211          plus 1 memory operand plus one Imm4 operand, VexXDS, and
7212          VexW0 or VexW1.  The destination must be either XMM, YMM or
7213          ZMM register.
7214          2. 4 operands: 4 register operands or 3 register operands
7215          plus 1 memory operand, with VexXDS.  */
7216       gas_assert ((i.reg_operands == 4
7217                    || (i.reg_operands == 3 && i.mem_operands == 1))
7218                   && i.tm.opcode_modifier.vexvvvv == VEXXDS
7219                   && i.tm.opcode_modifier.vexw
7220                   && i.tm.operand_types[dest].bitfield.class == RegSIMD);
7221
7222       /* If VexW1 is set, the first non-immediate operand is the source and
7223          the second non-immediate one is encoded in the immediate operand.  */
7224       if (i.tm.opcode_modifier.vexw == VEXW1)
7225         {
7226           source = i.imm_operands;
7227           reg_slot = i.imm_operands + 1;
7228         }
7229       else
7230         {
7231           source = i.imm_operands + 1;
7232           reg_slot = i.imm_operands;
7233         }
7234
7235       if (i.imm_operands == 0)
7236         {
7237           /* When there is no immediate operand, generate an 8bit
7238              immediate operand to encode the first operand.  */
7239           exp = &im_expressions[i.imm_operands++];
7240           i.op[i.operands].imms = exp;
7241           i.types[i.operands] = imm8;
7242           i.operands++;
7243
7244           gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7245           exp->X_op = O_constant;
7246           exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
7247           gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7248         }
7249       else
7250         {
7251           gas_assert (i.imm_operands == 1);
7252           gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7253           gas_assert (!i.tm.opcode_modifier.immext);
7254
7255           /* Turn on Imm8 again so that output_imm will generate it.  */
7256           i.types[0].bitfield.imm8 = 1;
7257
7258           gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7259           i.op[0].imms->X_add_number
7260               |= register_number (i.op[reg_slot].regs) << 4;
7261           gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7262         }
7263
7264       gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
7265       i.vex.register_specifier = i.op[nds].regs;
7266     }
7267   else
7268     source = dest = 0;
7269
7270   /* i.reg_operands MUST be the number of real register operands;
7271      implicit registers do not count.  If there are 3 register
7272      operands, it must be a instruction with VexNDS.  For a
7273      instruction with VexNDD, the destination register is encoded
7274      in VEX prefix.  If there are 4 register operands, it must be
7275      a instruction with VEX prefix and 3 sources.  */
7276   if (i.mem_operands == 0
7277       && ((i.reg_operands == 2
7278            && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7279           || (i.reg_operands == 3
7280               && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7281           || (i.reg_operands == 4 && vex_3_sources)))
7282     {
7283       switch (i.operands)
7284         {
7285         case 2:
7286           source = 0;
7287           break;
7288         case 3:
7289           /* When there are 3 operands, one of them may be immediate,
7290              which may be the first or the last operand.  Otherwise,
7291              the first operand must be shift count register (cl) or it
7292              is an instruction with VexNDS. */
7293           gas_assert (i.imm_operands == 1
7294                       || (i.imm_operands == 0
7295                           && (i.tm.opcode_modifier.vexvvvv == VEXXDS
7296                               || (i.types[0].bitfield.instance == RegC
7297                                   && i.types[0].bitfield.byte))));
7298           if (operand_type_check (i.types[0], imm)
7299               || (i.types[0].bitfield.instance == RegC
7300                   && i.types[0].bitfield.byte))
7301             source = 1;
7302           else
7303             source = 0;
7304           break;
7305         case 4:
7306           /* When there are 4 operands, the first two must be 8bit
7307              immediate operands. The source operand will be the 3rd
7308              one.
7309
7310              For instructions with VexNDS, if the first operand
7311              an imm8, the source operand is the 2nd one.  If the last
7312              operand is imm8, the source operand is the first one.  */
7313           gas_assert ((i.imm_operands == 2
7314                        && i.types[0].bitfield.imm8
7315                        && i.types[1].bitfield.imm8)
7316                       || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7317                           && i.imm_operands == 1
7318                           && (i.types[0].bitfield.imm8
7319                               || i.types[i.operands - 1].bitfield.imm8
7320                               || i.rounding)));
7321           if (i.imm_operands == 2)
7322             source = 2;
7323           else
7324             {
7325               if (i.types[0].bitfield.imm8)
7326                 source = 1;
7327               else
7328                 source = 0;
7329             }
7330           break;
7331         case 5:
7332           if (is_evex_encoding (&i.tm))
7333             {
7334               /* For EVEX instructions, when there are 5 operands, the
7335                  first one must be immediate operand.  If the second one
7336                  is immediate operand, the source operand is the 3th
7337                  one.  If the last one is immediate operand, the source
7338                  operand is the 2nd one.  */
7339               gas_assert (i.imm_operands == 2
7340                           && i.tm.opcode_modifier.sae
7341                           && operand_type_check (i.types[0], imm));
7342               if (operand_type_check (i.types[1], imm))
7343                 source = 2;
7344               else if (operand_type_check (i.types[4], imm))
7345                 source = 1;
7346               else
7347                 abort ();
7348             }
7349           break;
7350         default:
7351           abort ();
7352         }
7353
7354       if (!vex_3_sources)
7355         {
7356           dest = source + 1;
7357
7358           /* RC/SAE operand could be between DEST and SRC.  That happens
7359              when one operand is GPR and the other one is XMM/YMM/ZMM
7360              register.  */
7361           if (i.rounding && i.rounding->operand == (int) dest)
7362             dest++;
7363
7364           if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7365             {
7366               /* For instructions with VexNDS, the register-only source
7367                  operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7368                  register.  It is encoded in VEX prefix.  */
7369
7370               i386_operand_type op;
7371               unsigned int vvvv;
7372
7373               /* Check register-only source operand when two source
7374                  operands are swapped.  */
7375               if (!i.tm.operand_types[source].bitfield.baseindex
7376                   && i.tm.operand_types[dest].bitfield.baseindex)
7377                 {
7378                   vvvv = source;
7379                   source = dest;
7380                 }
7381               else
7382                 vvvv = dest;
7383
7384               op = i.tm.operand_types[vvvv];
7385               if ((dest + 1) >= i.operands
7386                   || ((op.bitfield.class != Reg
7387                        || (!op.bitfield.dword && !op.bitfield.qword))
7388                       && op.bitfield.class != RegSIMD
7389                       && !operand_type_equal (&op, &regmask)))
7390                 abort ();
7391               i.vex.register_specifier = i.op[vvvv].regs;
7392               dest++;
7393             }
7394         }
7395
7396       i.rm.mode = 3;
7397       /* One of the register operands will be encoded in the i.rm.reg
7398          field, the other in the combined i.rm.mode and i.rm.regmem
7399          fields.  If no form of this instruction supports a memory
7400          destination operand, then we assume the source operand may
7401          sometimes be a memory operand and so we need to store the
7402          destination in the i.rm.reg field.  */
7403       if (!i.tm.opcode_modifier.regmem
7404           && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
7405         {
7406           i.rm.reg = i.op[dest].regs->reg_num;
7407           i.rm.regmem = i.op[source].regs->reg_num;
7408           if (i.op[dest].regs->reg_type.bitfield.class == RegMMX
7409                || i.op[source].regs->reg_type.bitfield.class == RegMMX)
7410             i.has_regmmx = TRUE;
7411           else if (i.op[dest].regs->reg_type.bitfield.class == RegSIMD
7412                    || i.op[source].regs->reg_type.bitfield.class == RegSIMD)
7413             {
7414               if (i.types[dest].bitfield.zmmword
7415                   || i.types[source].bitfield.zmmword)
7416                 i.has_regzmm = TRUE;
7417               else if (i.types[dest].bitfield.ymmword
7418                        || i.types[source].bitfield.ymmword)
7419                 i.has_regymm = TRUE;
7420               else
7421                 i.has_regxmm = TRUE;
7422             }
7423           if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7424             i.rex |= REX_R;
7425           if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7426             i.vrex |= REX_R;
7427           if ((i.op[source].regs->reg_flags & RegRex) != 0)
7428             i.rex |= REX_B;
7429           if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7430             i.vrex |= REX_B;
7431         }
7432       else
7433         {
7434           i.rm.reg = i.op[source].regs->reg_num;
7435           i.rm.regmem = i.op[dest].regs->reg_num;
7436           if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7437             i.rex |= REX_B;
7438           if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7439             i.vrex |= REX_B;
7440           if ((i.op[source].regs->reg_flags & RegRex) != 0)
7441             i.rex |= REX_R;
7442           if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7443             i.vrex |= REX_R;
7444         }
7445       if (flag_code != CODE_64BIT && (i.rex & REX_R))
7446         {
7447           if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
7448             abort ();
7449           i.rex &= ~REX_R;
7450           add_prefix (LOCK_PREFIX_OPCODE);
7451         }
7452     }
7453   else
7454     {                   /* If it's not 2 reg operands...  */
7455       unsigned int mem;
7456
7457       if (i.mem_operands)
7458         {
7459           unsigned int fake_zero_displacement = 0;
7460           unsigned int op;
7461
7462           for (op = 0; op < i.operands; op++)
7463             if (i.flags[op] & Operand_Mem)
7464               break;
7465           gas_assert (op < i.operands);
7466
7467           if (i.tm.opcode_modifier.vecsib)
7468             {
7469               if (i.index_reg->reg_num == RegIZ)
7470                 abort ();
7471
7472               i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7473               if (!i.base_reg)
7474                 {
7475                   i.sib.base = NO_BASE_REGISTER;
7476                   i.sib.scale = i.log2_scale_factor;
7477                   i.types[op].bitfield.disp8 = 0;
7478                   i.types[op].bitfield.disp16 = 0;
7479                   i.types[op].bitfield.disp64 = 0;
7480                   if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7481                     {
7482                       /* Must be 32 bit */
7483                       i.types[op].bitfield.disp32 = 1;
7484                       i.types[op].bitfield.disp32s = 0;
7485                     }
7486                   else
7487                     {
7488                       i.types[op].bitfield.disp32 = 0;
7489                       i.types[op].bitfield.disp32s = 1;
7490                     }
7491                 }
7492               i.sib.index = i.index_reg->reg_num;
7493               if ((i.index_reg->reg_flags & RegRex) != 0)
7494                 i.rex |= REX_X;
7495               if ((i.index_reg->reg_flags & RegVRex) != 0)
7496                 i.vrex |= REX_X;
7497             }
7498
7499           default_seg = &ds;
7500
7501           if (i.base_reg == 0)
7502             {
7503               i.rm.mode = 0;
7504               if (!i.disp_operands)
7505                 fake_zero_displacement = 1;
7506               if (i.index_reg == 0)
7507                 {
7508                   i386_operand_type newdisp;
7509
7510                   gas_assert (!i.tm.opcode_modifier.vecsib);
7511                   /* Operand is just <disp>  */
7512                   if (flag_code == CODE_64BIT)
7513                     {
7514                       /* 64bit mode overwrites the 32bit absolute
7515                          addressing by RIP relative addressing and
7516                          absolute addressing is encoded by one of the
7517                          redundant SIB forms.  */
7518                       i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7519                       i.sib.base = NO_BASE_REGISTER;
7520                       i.sib.index = NO_INDEX_REGISTER;
7521                       newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
7522                     }
7523                   else if ((flag_code == CODE_16BIT)
7524                            ^ (i.prefix[ADDR_PREFIX] != 0))
7525                     {
7526                       i.rm.regmem = NO_BASE_REGISTER_16;
7527                       newdisp = disp16;
7528                     }
7529                   else
7530                     {
7531                       i.rm.regmem = NO_BASE_REGISTER;
7532                       newdisp = disp32;
7533                     }
7534                   i.types[op] = operand_type_and_not (i.types[op], anydisp);
7535                   i.types[op] = operand_type_or (i.types[op], newdisp);
7536                 }
7537               else if (!i.tm.opcode_modifier.vecsib)
7538                 {
7539                   /* !i.base_reg && i.index_reg  */
7540                   if (i.index_reg->reg_num == RegIZ)
7541                     i.sib.index = NO_INDEX_REGISTER;
7542                   else
7543                     i.sib.index = i.index_reg->reg_num;
7544                   i.sib.base = NO_BASE_REGISTER;
7545                   i.sib.scale = i.log2_scale_factor;
7546                   i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7547                   i.types[op].bitfield.disp8 = 0;
7548                   i.types[op].bitfield.disp16 = 0;
7549                   i.types[op].bitfield.disp64 = 0;
7550                   if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7551                     {
7552                       /* Must be 32 bit */
7553                       i.types[op].bitfield.disp32 = 1;
7554                       i.types[op].bitfield.disp32s = 0;
7555                     }
7556                   else
7557                     {
7558                       i.types[op].bitfield.disp32 = 0;
7559                       i.types[op].bitfield.disp32s = 1;
7560                     }
7561                   if ((i.index_reg->reg_flags & RegRex) != 0)
7562                     i.rex |= REX_X;
7563                 }
7564             }
7565           /* RIP addressing for 64bit mode.  */
7566           else if (i.base_reg->reg_num == RegIP)
7567             {
7568               gas_assert (!i.tm.opcode_modifier.vecsib);
7569               i.rm.regmem = NO_BASE_REGISTER;
7570               i.types[op].bitfield.disp8 = 0;
7571               i.types[op].bitfield.disp16 = 0;
7572               i.types[op].bitfield.disp32 = 0;
7573               i.types[op].bitfield.disp32s = 1;
7574               i.types[op].bitfield.disp64 = 0;
7575               i.flags[op] |= Operand_PCrel;
7576               if (! i.disp_operands)
7577                 fake_zero_displacement = 1;
7578             }
7579           else if (i.base_reg->reg_type.bitfield.word)
7580             {
7581               gas_assert (!i.tm.opcode_modifier.vecsib);
7582               switch (i.base_reg->reg_num)
7583                 {
7584                 case 3: /* (%bx)  */
7585                   if (i.index_reg == 0)
7586                     i.rm.regmem = 7;
7587                   else /* (%bx,%si) -> 0, or (%bx,%di) -> 1  */
7588                     i.rm.regmem = i.index_reg->reg_num - 6;
7589                   break;
7590                 case 5: /* (%bp)  */
7591                   default_seg = &ss;
7592                   if (i.index_reg == 0)
7593                     {
7594                       i.rm.regmem = 6;
7595                       if (operand_type_check (i.types[op], disp) == 0)
7596                         {
7597                           /* fake (%bp) into 0(%bp)  */
7598                           i.types[op].bitfield.disp8 = 1;
7599                           fake_zero_displacement = 1;
7600                         }
7601                     }
7602                   else /* (%bp,%si) -> 2, or (%bp,%di) -> 3  */
7603                     i.rm.regmem = i.index_reg->reg_num - 6 + 2;
7604                   break;
7605                 default: /* (%si) -> 4 or (%di) -> 5  */
7606                   i.rm.regmem = i.base_reg->reg_num - 6 + 4;
7607                 }
7608               i.rm.mode = mode_from_disp_size (i.types[op]);
7609             }
7610           else /* i.base_reg and 32/64 bit mode  */
7611             {
7612               if (flag_code == CODE_64BIT
7613                   && operand_type_check (i.types[op], disp))
7614                 {
7615                   i.types[op].bitfield.disp16 = 0;
7616                   i.types[op].bitfield.disp64 = 0;
7617                   if (i.prefix[ADDR_PREFIX] == 0)
7618                     {
7619                       i.types[op].bitfield.disp32 = 0;
7620                       i.types[op].bitfield.disp32s = 1;
7621                     }
7622                   else
7623                     {
7624                       i.types[op].bitfield.disp32 = 1;
7625                       i.types[op].bitfield.disp32s = 0;
7626                     }
7627                 }
7628
7629               if (!i.tm.opcode_modifier.vecsib)
7630                 i.rm.regmem = i.base_reg->reg_num;
7631               if ((i.base_reg->reg_flags & RegRex) != 0)
7632                 i.rex |= REX_B;
7633               i.sib.base = i.base_reg->reg_num;
7634               /* x86-64 ignores REX prefix bit here to avoid decoder
7635                  complications.  */
7636               if (!(i.base_reg->reg_flags & RegRex)
7637                   && (i.base_reg->reg_num == EBP_REG_NUM
7638                    || i.base_reg->reg_num == ESP_REG_NUM))
7639                   default_seg = &ss;
7640               if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
7641                 {
7642                   fake_zero_displacement = 1;
7643                   i.types[op].bitfield.disp8 = 1;
7644                 }
7645               i.sib.scale = i.log2_scale_factor;
7646               if (i.index_reg == 0)
7647                 {
7648                   gas_assert (!i.tm.opcode_modifier.vecsib);
7649                   /* <disp>(%esp) becomes two byte modrm with no index
7650                      register.  We've already stored the code for esp
7651                      in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
7652                      Any base register besides %esp will not use the
7653                      extra modrm byte.  */
7654                   i.sib.index = NO_INDEX_REGISTER;
7655                 }
7656               else if (!i.tm.opcode_modifier.vecsib)
7657                 {
7658                   if (i.index_reg->reg_num == RegIZ)
7659                     i.sib.index = NO_INDEX_REGISTER;
7660                   else
7661                     i.sib.index = i.index_reg->reg_num;
7662                   i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7663                   if ((i.index_reg->reg_flags & RegRex) != 0)
7664                     i.rex |= REX_X;
7665                 }
7666
7667               if (i.disp_operands
7668                   && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
7669                       || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
7670                 i.rm.mode = 0;
7671               else
7672                 {
7673                   if (!fake_zero_displacement
7674                       && !i.disp_operands
7675                       && i.disp_encoding)
7676                     {
7677                       fake_zero_displacement = 1;
7678                       if (i.disp_encoding == disp_encoding_8bit)
7679                         i.types[op].bitfield.disp8 = 1;
7680                       else
7681                         i.types[op].bitfield.disp32 = 1;
7682                     }
7683                   i.rm.mode = mode_from_disp_size (i.types[op]);
7684                 }
7685             }
7686
7687           if (fake_zero_displacement)
7688             {
7689               /* Fakes a zero displacement assuming that i.types[op]
7690                  holds the correct displacement size.  */
7691               expressionS *exp;
7692
7693               gas_assert (i.op[op].disps == 0);
7694               exp = &disp_expressions[i.disp_operands++];
7695               i.op[op].disps = exp;
7696               exp->X_op = O_constant;
7697               exp->X_add_number = 0;
7698               exp->X_add_symbol = (symbolS *) 0;
7699               exp->X_op_symbol = (symbolS *) 0;
7700             }
7701
7702           mem = op;
7703         }
7704       else
7705         mem = ~0;
7706
7707       if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
7708         {
7709           if (operand_type_check (i.types[0], imm))
7710             i.vex.register_specifier = NULL;
7711           else
7712             {
7713               /* VEX.vvvv encodes one of the sources when the first
7714                  operand is not an immediate.  */
7715               if (i.tm.opcode_modifier.vexw == VEXW0)
7716                 i.vex.register_specifier = i.op[0].regs;
7717               else
7718                 i.vex.register_specifier = i.op[1].regs;
7719             }
7720
7721           /* Destination is a XMM register encoded in the ModRM.reg
7722              and VEX.R bit.  */
7723           i.rm.reg = i.op[2].regs->reg_num;
7724           if ((i.op[2].regs->reg_flags & RegRex) != 0)
7725             i.rex |= REX_R;
7726
7727           /* ModRM.rm and VEX.B encodes the other source.  */
7728           if (!i.mem_operands)
7729             {
7730               i.rm.mode = 3;
7731
7732               if (i.tm.opcode_modifier.vexw == VEXW0)
7733                 i.rm.regmem = i.op[1].regs->reg_num;
7734               else
7735                 i.rm.regmem = i.op[0].regs->reg_num;
7736
7737               if ((i.op[1].regs->reg_flags & RegRex) != 0)
7738                 i.rex |= REX_B;
7739             }
7740         }
7741       else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
7742         {
7743           i.vex.register_specifier = i.op[2].regs;
7744           if (!i.mem_operands)
7745             {
7746               i.rm.mode = 3;
7747               i.rm.regmem = i.op[1].regs->reg_num;
7748               if ((i.op[1].regs->reg_flags & RegRex) != 0)
7749                 i.rex |= REX_B;
7750             }
7751         }
7752       /* Fill in i.rm.reg or i.rm.regmem field with register operand
7753          (if any) based on i.tm.extension_opcode.  Again, we must be
7754          careful to make sure that segment/control/debug/test/MMX
7755          registers are coded into the i.rm.reg field.  */
7756       else if (i.reg_operands)
7757         {
7758           unsigned int op;
7759           unsigned int vex_reg = ~0;
7760
7761           for (op = 0; op < i.operands; op++)
7762             {
7763               if (i.types[op].bitfield.class == Reg
7764                   || i.types[op].bitfield.class == RegBND
7765                   || i.types[op].bitfield.class == RegMask
7766                   || i.types[op].bitfield.class == SReg
7767                   || i.types[op].bitfield.class == RegCR
7768                   || i.types[op].bitfield.class == RegDR
7769                   || i.types[op].bitfield.class == RegTR)
7770                 break;
7771               if (i.types[op].bitfield.class == RegSIMD)
7772                 {
7773                   if (i.types[op].bitfield.zmmword)
7774                     i.has_regzmm = TRUE;
7775                   else if (i.types[op].bitfield.ymmword)
7776                     i.has_regymm = TRUE;
7777                   else
7778                     i.has_regxmm = TRUE;
7779                   break;
7780                 }
7781               if (i.types[op].bitfield.class == RegMMX)
7782                 {
7783                   i.has_regmmx = TRUE;
7784                   break;
7785                 }
7786             }
7787
7788           if (vex_3_sources)
7789             op = dest;
7790           else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7791             {
7792               /* For instructions with VexNDS, the register-only
7793                  source operand is encoded in VEX prefix. */
7794               gas_assert (mem != (unsigned int) ~0);
7795
7796               if (op > mem)
7797                 {
7798                   vex_reg = op++;
7799                   gas_assert (op < i.operands);
7800                 }
7801               else
7802                 {
7803                   /* Check register-only source operand when two source
7804                      operands are swapped.  */
7805                   if (!i.tm.operand_types[op].bitfield.baseindex
7806                       && i.tm.operand_types[op + 1].bitfield.baseindex)
7807                     {
7808                       vex_reg = op;
7809                       op += 2;
7810                       gas_assert (mem == (vex_reg + 1)
7811                                   && op < i.operands);
7812                     }
7813                   else
7814                     {
7815                       vex_reg = op + 1;
7816                       gas_assert (vex_reg < i.operands);
7817                     }
7818                 }
7819             }
7820           else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
7821             {
7822               /* For instructions with VexNDD, the register destination
7823                  is encoded in VEX prefix.  */
7824               if (i.mem_operands == 0)
7825                 {
7826                   /* There is no memory operand.  */
7827                   gas_assert ((op + 2) == i.operands);
7828                   vex_reg = op + 1;
7829                 }
7830               else
7831                 {
7832                   /* There are only 2 non-immediate operands.  */
7833                   gas_assert (op < i.imm_operands + 2
7834                               && i.operands == i.imm_operands + 2);
7835                   vex_reg = i.imm_operands + 1;
7836                 }
7837             }
7838           else
7839             gas_assert (op < i.operands);
7840
7841           if (vex_reg != (unsigned int) ~0)
7842             {
7843               i386_operand_type *type = &i.tm.operand_types[vex_reg];
7844
7845               if ((type->bitfield.class != Reg
7846                    || (!type->bitfield.dword && !type->bitfield.qword))
7847                   && type->bitfield.class != RegSIMD
7848                   && !operand_type_equal (type, &regmask))
7849                 abort ();
7850
7851               i.vex.register_specifier = i.op[vex_reg].regs;
7852             }
7853
7854           /* Don't set OP operand twice.  */
7855           if (vex_reg != op)
7856             {
7857               /* If there is an extension opcode to put here, the
7858                  register number must be put into the regmem field.  */
7859               if (i.tm.extension_opcode != None)
7860                 {
7861                   i.rm.regmem = i.op[op].regs->reg_num;
7862                   if ((i.op[op].regs->reg_flags & RegRex) != 0)
7863                     i.rex |= REX_B;
7864                   if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7865                     i.vrex |= REX_B;
7866                 }
7867               else
7868                 {
7869                   i.rm.reg = i.op[op].regs->reg_num;
7870                   if ((i.op[op].regs->reg_flags & RegRex) != 0)
7871                     i.rex |= REX_R;
7872                   if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7873                     i.vrex |= REX_R;
7874                 }
7875             }
7876
7877           /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
7878              must set it to 3 to indicate this is a register operand
7879              in the regmem field.  */
7880           if (!i.mem_operands)
7881             i.rm.mode = 3;
7882         }
7883
7884       /* Fill in i.rm.reg field with extension opcode (if any).  */
7885       if (i.tm.extension_opcode != None)
7886         i.rm.reg = i.tm.extension_opcode;
7887     }
7888   return default_seg;
7889 }
7890
7891 static unsigned int
7892 flip_code16 (unsigned int code16)
7893 {
7894   gas_assert (i.tm.operands == 1);
7895
7896   return !(i.prefix[REX_PREFIX] & REX_W)
7897          && (code16 ? i.tm.operand_types[0].bitfield.disp32
7898                       || i.tm.operand_types[0].bitfield.disp32s
7899                     : i.tm.operand_types[0].bitfield.disp16)
7900          ? CODE16 : 0;
7901 }
7902
7903 static void
7904 output_branch (void)
7905 {
7906   char *p;
7907   int size;
7908   int code16;
7909   int prefix;
7910   relax_substateT subtype;
7911   symbolS *sym;
7912   offsetT off;
7913
7914   code16 = flag_code == CODE_16BIT ? CODE16 : 0;
7915   size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
7916
7917   prefix = 0;
7918   if (i.prefix[DATA_PREFIX] != 0)
7919     {
7920       prefix = 1;
7921       i.prefixes -= 1;
7922       code16 ^= flip_code16(code16);
7923     }
7924   /* Pentium4 branch hints.  */
7925   if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
7926       || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
7927     {
7928       prefix++;
7929       i.prefixes--;
7930     }
7931   if (i.prefix[REX_PREFIX] != 0)
7932     {
7933       prefix++;
7934       i.prefixes--;
7935     }
7936
7937   /* BND prefixed jump.  */
7938   if (i.prefix[BND_PREFIX] != 0)
7939     {
7940       prefix++;
7941       i.prefixes--;
7942     }
7943
7944   if (i.prefixes != 0)
7945     as_warn (_("skipping prefixes on `%s'"), i.tm.name);
7946
7947   /* It's always a symbol;  End frag & setup for relax.
7948      Make sure there is enough room in this frag for the largest
7949      instruction we may generate in md_convert_frag.  This is 2
7950      bytes for the opcode and room for the prefix and largest
7951      displacement.  */
7952   frag_grow (prefix + 2 + 4);
7953   /* Prefix and 1 opcode byte go in fr_fix.  */
7954   p = frag_more (prefix + 1);
7955   if (i.prefix[DATA_PREFIX] != 0)
7956     *p++ = DATA_PREFIX_OPCODE;
7957   if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
7958       || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
7959     *p++ = i.prefix[SEG_PREFIX];
7960   if (i.prefix[BND_PREFIX] != 0)
7961     *p++ = BND_PREFIX_OPCODE;
7962   if (i.prefix[REX_PREFIX] != 0)
7963     *p++ = i.prefix[REX_PREFIX];
7964   *p = i.tm.base_opcode;
7965
7966   if ((unsigned char) *p == JUMP_PC_RELATIVE)
7967     subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
7968   else if (cpu_arch_flags.bitfield.cpui386)
7969     subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
7970   else
7971     subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
7972   subtype |= code16;
7973
7974   sym = i.op[0].disps->X_add_symbol;
7975   off = i.op[0].disps->X_add_number;
7976
7977   if (i.op[0].disps->X_op != O_constant
7978       && i.op[0].disps->X_op != O_symbol)
7979     {
7980       /* Handle complex expressions.  */
7981       sym = make_expr_symbol (i.op[0].disps);
7982       off = 0;
7983     }
7984
7985   /* 1 possible extra opcode + 4 byte displacement go in var part.
7986      Pass reloc in fr_var.  */
7987   frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
7988 }
7989
7990 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
7991 /* Return TRUE iff PLT32 relocation should be used for branching to
7992    symbol S.  */
7993
7994 static bfd_boolean
7995 need_plt32_p (symbolS *s)
7996 {
7997   /* PLT32 relocation is ELF only.  */
7998   if (!IS_ELF)
7999     return FALSE;
8000
8001 #ifdef TE_SOLARIS
8002   /* Don't emit PLT32 relocation on Solaris: neither native linker nor
8003      krtld support it.  */
8004   return FALSE;
8005 #endif
8006
8007   /* Since there is no need to prepare for PLT branch on x86-64, we
8008      can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
8009      be used as a marker for 32-bit PC-relative branches.  */
8010   if (!object_64bit)
8011     return FALSE;
8012
8013   /* Weak or undefined symbol need PLT32 relocation.  */
8014   if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
8015     return TRUE;
8016
8017   /* Non-global symbol doesn't need PLT32 relocation.  */
8018   if (! S_IS_EXTERNAL (s))
8019     return FALSE;
8020
8021   /* Other global symbols need PLT32 relocation.  NB: Symbol with
8022      non-default visibilities are treated as normal global symbol
8023      so that PLT32 relocation can be used as a marker for 32-bit
8024      PC-relative branches.  It is useful for linker relaxation.  */
8025   return TRUE;
8026 }
8027 #endif
8028
8029 static void
8030 output_jump (void)
8031 {
8032   char *p;
8033   int size;
8034   fixS *fixP;
8035   bfd_reloc_code_real_type jump_reloc = i.reloc[0];
8036
8037   if (i.tm.opcode_modifier.jump == JUMP_BYTE)
8038     {
8039       /* This is a loop or jecxz type instruction.  */
8040       size = 1;
8041       if (i.prefix[ADDR_PREFIX] != 0)
8042         {
8043           FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
8044           i.prefixes -= 1;
8045         }
8046       /* Pentium4 branch hints.  */
8047       if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8048           || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8049         {
8050           FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
8051           i.prefixes--;
8052         }
8053     }
8054   else
8055     {
8056       int code16;
8057
8058       code16 = 0;
8059       if (flag_code == CODE_16BIT)
8060         code16 = CODE16;
8061
8062       if (i.prefix[DATA_PREFIX] != 0)
8063         {
8064           FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
8065           i.prefixes -= 1;
8066           code16 ^= flip_code16(code16);
8067         }
8068
8069       size = 4;
8070       if (code16)
8071         size = 2;
8072     }
8073
8074   /* BND prefixed jump.  */
8075   if (i.prefix[BND_PREFIX] != 0)
8076     {
8077       FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
8078       i.prefixes -= 1;
8079     }
8080
8081   if (i.prefix[REX_PREFIX] != 0)
8082     {
8083       FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
8084       i.prefixes -= 1;
8085     }
8086
8087   if (i.prefixes != 0)
8088     as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8089
8090   p = frag_more (i.tm.opcode_length + size);
8091   switch (i.tm.opcode_length)
8092     {
8093     case 2:
8094       *p++ = i.tm.base_opcode >> 8;
8095       /* Fall through.  */
8096     case 1:
8097       *p++ = i.tm.base_opcode;
8098       break;
8099     default:
8100       abort ();
8101     }
8102
8103 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8104   if (size == 4
8105       && jump_reloc == NO_RELOC
8106       && need_plt32_p (i.op[0].disps->X_add_symbol))
8107     jump_reloc = BFD_RELOC_X86_64_PLT32;
8108 #endif
8109
8110   jump_reloc = reloc (size, 1, 1, jump_reloc);
8111
8112   fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8113                       i.op[0].disps, 1, jump_reloc);
8114
8115   /* All jumps handled here are signed, but don't use a signed limit
8116      check for 32 and 16 bit jumps as we want to allow wrap around at
8117      4G and 64k respectively.  */
8118   if (size == 1)
8119     fixP->fx_signed = 1;
8120 }
8121
8122 static void
8123 output_interseg_jump (void)
8124 {
8125   char *p;
8126   int size;
8127   int prefix;
8128   int code16;
8129
8130   code16 = 0;
8131   if (flag_code == CODE_16BIT)
8132     code16 = CODE16;
8133
8134   prefix = 0;
8135   if (i.prefix[DATA_PREFIX] != 0)
8136     {
8137       prefix = 1;
8138       i.prefixes -= 1;
8139       code16 ^= CODE16;
8140     }
8141
8142   gas_assert (!i.prefix[REX_PREFIX]);
8143
8144   size = 4;
8145   if (code16)
8146     size = 2;
8147
8148   if (i.prefixes != 0)
8149     as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8150
8151   /* 1 opcode; 2 segment; offset  */
8152   p = frag_more (prefix + 1 + 2 + size);
8153
8154   if (i.prefix[DATA_PREFIX] != 0)
8155     *p++ = DATA_PREFIX_OPCODE;
8156
8157   if (i.prefix[REX_PREFIX] != 0)
8158     *p++ = i.prefix[REX_PREFIX];
8159
8160   *p++ = i.tm.base_opcode;
8161   if (i.op[1].imms->X_op == O_constant)
8162     {
8163       offsetT n = i.op[1].imms->X_add_number;
8164
8165       if (size == 2
8166           && !fits_in_unsigned_word (n)
8167           && !fits_in_signed_word (n))
8168         {
8169           as_bad (_("16-bit jump out of range"));
8170           return;
8171         }
8172       md_number_to_chars (p, n, size);
8173     }
8174   else
8175     fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8176                  i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
8177   if (i.op[0].imms->X_op != O_constant)
8178     as_bad (_("can't handle non absolute segment in `%s'"),
8179             i.tm.name);
8180   md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
8181 }
8182
8183 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8184 void
8185 x86_cleanup (void)
8186 {
8187   char *p;
8188   asection *seg = now_seg;
8189   subsegT subseg = now_subseg;
8190   asection *sec;
8191   unsigned int alignment, align_size_1;
8192   unsigned int isa_1_descsz, feature_2_descsz, descsz;
8193   unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8194   unsigned int padding;
8195
8196   if (!IS_ELF || !x86_used_note)
8197     return;
8198
8199   x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8200
8201   /* The .note.gnu.property section layout:
8202
8203      Field      Length          Contents
8204      ----       ----            ----
8205      n_namsz    4               4
8206      n_descsz   4               The note descriptor size
8207      n_type     4               NT_GNU_PROPERTY_TYPE_0
8208      n_name     4               "GNU"
8209      n_desc     n_descsz        The program property array
8210      ....       ....            ....
8211    */
8212
8213   /* Create the .note.gnu.property section.  */
8214   sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
8215   bfd_set_section_flags (sec,
8216                          (SEC_ALLOC
8217                           | SEC_LOAD
8218                           | SEC_DATA
8219                           | SEC_HAS_CONTENTS
8220                           | SEC_READONLY));
8221
8222   if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8223     {
8224       align_size_1 = 7;
8225       alignment = 3;
8226     }
8227   else
8228     {
8229       align_size_1 = 3;
8230       alignment = 2;
8231     }
8232
8233   bfd_set_section_alignment (sec, alignment);
8234   elf_section_type (sec) = SHT_NOTE;
8235
8236   /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8237                                   + 4-byte data  */
8238   isa_1_descsz_raw = 4 + 4 + 4;
8239   /* Align GNU_PROPERTY_X86_ISA_1_USED.  */
8240   isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8241
8242   feature_2_descsz_raw = isa_1_descsz;
8243   /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8244                                       + 4-byte data  */
8245   feature_2_descsz_raw += 4 + 4 + 4;
8246   /* Align GNU_PROPERTY_X86_FEATURE_2_USED.  */
8247   feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8248                       & ~align_size_1);
8249
8250   descsz = feature_2_descsz;
8251   /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz.  */
8252   p = frag_more (4 + 4 + 4 + 4 + descsz);
8253
8254   /* Write n_namsz.  */
8255   md_number_to_chars (p, (valueT) 4, 4);
8256
8257   /* Write n_descsz.  */
8258   md_number_to_chars (p + 4, (valueT) descsz, 4);
8259
8260   /* Write n_type.  */
8261   md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8262
8263   /* Write n_name.  */
8264   memcpy (p + 4 * 3, "GNU", 4);
8265
8266   /* Write 4-byte type.  */
8267   md_number_to_chars (p + 4 * 4,
8268                       (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8269
8270   /* Write 4-byte data size.  */
8271   md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8272
8273   /* Write 4-byte data.  */
8274   md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8275
8276   /* Zero out paddings.  */
8277   padding = isa_1_descsz - isa_1_descsz_raw;
8278   if (padding)
8279     memset (p + 4 * 7, 0, padding);
8280
8281   /* Write 4-byte type.  */
8282   md_number_to_chars (p + isa_1_descsz + 4 * 4,
8283                       (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8284
8285   /* Write 4-byte data size.  */
8286   md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8287
8288   /* Write 4-byte data.  */
8289   md_number_to_chars (p + isa_1_descsz + 4 * 6,
8290                       (valueT) x86_feature_2_used, 4);
8291
8292   /* Zero out paddings.  */
8293   padding = feature_2_descsz - feature_2_descsz_raw;
8294   if (padding)
8295     memset (p + isa_1_descsz + 4 * 7, 0, padding);
8296
8297   /* We probably can't restore the current segment, for there likely
8298      isn't one yet...  */
8299   if (seg && subseg)
8300     subseg_set (seg, subseg);
8301 }
8302 #endif
8303
8304 static unsigned int
8305 encoding_length (const fragS *start_frag, offsetT start_off,
8306                  const char *frag_now_ptr)
8307 {
8308   unsigned int len = 0;
8309
8310   if (start_frag != frag_now)
8311     {
8312       const fragS *fr = start_frag;
8313
8314       do {
8315         len += fr->fr_fix;
8316         fr = fr->fr_next;
8317       } while (fr && fr != frag_now);
8318     }
8319
8320   return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8321 }
8322
8323 /* Return 1 for test, and, cmp, add, sub, inc and dec which may
8324    be macro-fused with conditional jumps.  */
8325
8326 static int
8327 maybe_fused_with_jcc_p (void)
8328 {
8329   /* No RIP address.  */
8330   if (i.base_reg && i.base_reg->reg_num == RegIP)
8331     return 0;
8332
8333   /* No VEX/EVEX encoding.  */
8334   if (is_any_vex_encoding (&i.tm))
8335     return 0;
8336
8337   /* and, add, sub with destination register.  */
8338   if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
8339       || i.tm.base_opcode <= 5
8340       || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
8341       || ((i.tm.base_opcode | 3) == 0x83
8342           && ((i.tm.extension_opcode | 1) == 0x5
8343               || i.tm.extension_opcode == 0x0)))
8344     return (i.types[1].bitfield.class == Reg
8345             || i.types[1].bitfield.instance == Accum);
8346
8347   /* test, cmp with any register.  */
8348   if ((i.tm.base_opcode | 1) == 0x85
8349       || (i.tm.base_opcode | 1) == 0xa9
8350       || ((i.tm.base_opcode | 1) == 0xf7
8351           && i.tm.extension_opcode == 0)
8352       || (i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
8353       || ((i.tm.base_opcode | 3) == 0x83
8354           && (i.tm.extension_opcode == 0x7)))
8355     return (i.types[0].bitfield.class == Reg
8356             || i.types[0].bitfield.instance == Accum
8357             || i.types[1].bitfield.class == Reg
8358             || i.types[1].bitfield.instance == Accum);
8359
8360   /* inc, dec with any register.   */
8361   if ((i.tm.cpu_flags.bitfield.cpuno64
8362        && (i.tm.base_opcode | 0xf) == 0x4f)
8363       || ((i.tm.base_opcode | 1) == 0xff
8364           && i.tm.extension_opcode <= 0x1))
8365     return (i.types[0].bitfield.class == Reg
8366             || i.types[0].bitfield.instance == Accum);
8367
8368   return 0;
8369 }
8370
8371 /* Return 1 if a FUSED_JCC_PADDING frag should be generated.  */
8372
8373 static int
8374 add_fused_jcc_padding_frag_p (void)
8375 {
8376   /* NB: Don't work with COND_JUMP86 without i386.  */
8377   if (!align_branch_power
8378       || now_seg == absolute_section
8379       || !cpu_arch_flags.bitfield.cpui386
8380       || !(align_branch & align_branch_fused_bit))
8381     return 0;
8382
8383   if (maybe_fused_with_jcc_p ())
8384     {
8385       if (last_insn.kind == last_insn_other
8386           || last_insn.seg != now_seg)
8387         return 1;
8388       if (flag_debug)
8389         as_warn_where (last_insn.file, last_insn.line,
8390                        _("`%s` skips -malign-branch-boundary on `%s`"),
8391                        last_insn.name, i.tm.name);
8392     }
8393
8394   return 0;
8395 }
8396
8397 /* Return 1 if a BRANCH_PREFIX frag should be generated.  */
8398
8399 static int
8400 add_branch_prefix_frag_p (void)
8401 {
8402   /* NB: Don't work with COND_JUMP86 without i386.  Don't add prefix
8403      to PadLock instructions since they include prefixes in opcode.  */
8404   if (!align_branch_power
8405       || !align_branch_prefix_size
8406       || now_seg == absolute_section
8407       || i.tm.cpu_flags.bitfield.cpupadlock
8408       || !cpu_arch_flags.bitfield.cpui386)
8409     return 0;
8410
8411   /* Don't add prefix if it is a prefix or there is no operand in case
8412      that segment prefix is special.  */
8413   if (!i.operands || i.tm.opcode_modifier.isprefix)
8414     return 0;
8415
8416   if (last_insn.kind == last_insn_other
8417       || last_insn.seg != now_seg)
8418     return 1;
8419
8420   if (flag_debug)
8421     as_warn_where (last_insn.file, last_insn.line,
8422                    _("`%s` skips -malign-branch-boundary on `%s`"),
8423                    last_insn.name, i.tm.name);
8424
8425   return 0;
8426 }
8427
8428 /* Return 1 if a BRANCH_PADDING frag should be generated.  */
8429
8430 static int
8431 add_branch_padding_frag_p (enum align_branch_kind *branch_p)
8432 {
8433   int add_padding;
8434
8435   /* NB: Don't work with COND_JUMP86 without i386.  */
8436   if (!align_branch_power
8437       || now_seg == absolute_section
8438       || !cpu_arch_flags.bitfield.cpui386)
8439     return 0;
8440
8441   add_padding = 0;
8442
8443   /* Check for jcc and direct jmp.  */
8444   if (i.tm.opcode_modifier.jump == JUMP)
8445     {
8446       if (i.tm.base_opcode == JUMP_PC_RELATIVE)
8447         {
8448           *branch_p = align_branch_jmp;
8449           add_padding = align_branch & align_branch_jmp_bit;
8450         }
8451       else
8452         {
8453           *branch_p = align_branch_jcc;
8454           if ((align_branch & align_branch_jcc_bit))
8455             add_padding = 1;
8456         }
8457     }
8458   else if (is_any_vex_encoding (&i.tm))
8459     return 0;
8460   else if ((i.tm.base_opcode | 1) == 0xc3)
8461     {
8462       /* Near ret.  */
8463       *branch_p = align_branch_ret;
8464       if ((align_branch & align_branch_ret_bit))
8465         add_padding = 1;
8466     }
8467   else
8468     {
8469       /* Check for indirect jmp, direct and indirect calls.  */
8470       if (i.tm.base_opcode == 0xe8)
8471         {
8472           /* Direct call.  */
8473           *branch_p = align_branch_call;
8474           if ((align_branch & align_branch_call_bit))
8475             add_padding = 1;
8476         }
8477       else if (i.tm.base_opcode == 0xff
8478                && (i.tm.extension_opcode == 2
8479                    || i.tm.extension_opcode == 4))
8480         {
8481           /* Indirect call and jmp.  */
8482           *branch_p = align_branch_indirect;
8483           if ((align_branch & align_branch_indirect_bit))
8484             add_padding = 1;
8485         }
8486
8487       if (add_padding
8488           && i.disp_operands
8489           && tls_get_addr
8490           && (i.op[0].disps->X_op == O_symbol
8491               || (i.op[0].disps->X_op == O_subtract
8492                   && i.op[0].disps->X_op_symbol == GOT_symbol)))
8493         {
8494           symbolS *s = i.op[0].disps->X_add_symbol;
8495           /* No padding to call to global or undefined tls_get_addr.  */
8496           if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
8497               && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
8498             return 0;
8499         }
8500     }
8501
8502   if (add_padding
8503       && last_insn.kind != last_insn_other
8504       && last_insn.seg == now_seg)
8505     {
8506       if (flag_debug)
8507         as_warn_where (last_insn.file, last_insn.line,
8508                        _("`%s` skips -malign-branch-boundary on `%s`"),
8509                        last_insn.name, i.tm.name);
8510       return 0;
8511     }
8512
8513   return add_padding;
8514 }
8515
8516 static void
8517 output_insn (void)
8518 {
8519   fragS *insn_start_frag;
8520   offsetT insn_start_off;
8521   fragS *fragP = NULL;
8522   enum align_branch_kind branch = align_branch_none;
8523
8524 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8525   if (IS_ELF && x86_used_note)
8526     {
8527       if (i.tm.cpu_flags.bitfield.cpucmov)
8528         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_CMOV;
8529       if (i.tm.cpu_flags.bitfield.cpusse)
8530         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE;
8531       if (i.tm.cpu_flags.bitfield.cpusse2)
8532         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE2;
8533       if (i.tm.cpu_flags.bitfield.cpusse3)
8534         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE3;
8535       if (i.tm.cpu_flags.bitfield.cpussse3)
8536         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSSE3;
8537       if (i.tm.cpu_flags.bitfield.cpusse4_1)
8538         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_1;
8539       if (i.tm.cpu_flags.bitfield.cpusse4_2)
8540         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_2;
8541       if (i.tm.cpu_flags.bitfield.cpuavx)
8542         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX;
8543       if (i.tm.cpu_flags.bitfield.cpuavx2)
8544         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX2;
8545       if (i.tm.cpu_flags.bitfield.cpufma)
8546         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_FMA;
8547       if (i.tm.cpu_flags.bitfield.cpuavx512f)
8548         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512F;
8549       if (i.tm.cpu_flags.bitfield.cpuavx512cd)
8550         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512CD;
8551       if (i.tm.cpu_flags.bitfield.cpuavx512er)
8552         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512ER;
8553       if (i.tm.cpu_flags.bitfield.cpuavx512pf)
8554         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512PF;
8555       if (i.tm.cpu_flags.bitfield.cpuavx512vl)
8556         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512VL;
8557       if (i.tm.cpu_flags.bitfield.cpuavx512dq)
8558         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512DQ;
8559       if (i.tm.cpu_flags.bitfield.cpuavx512bw)
8560         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512BW;
8561       if (i.tm.cpu_flags.bitfield.cpuavx512_4fmaps)
8562         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4FMAPS;
8563       if (i.tm.cpu_flags.bitfield.cpuavx512_4vnniw)
8564         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4VNNIW;
8565       if (i.tm.cpu_flags.bitfield.cpuavx512_bitalg)
8566         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BITALG;
8567       if (i.tm.cpu_flags.bitfield.cpuavx512ifma)
8568         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_IFMA;
8569       if (i.tm.cpu_flags.bitfield.cpuavx512vbmi)
8570         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI;
8571       if (i.tm.cpu_flags.bitfield.cpuavx512_vbmi2)
8572         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI2;
8573       if (i.tm.cpu_flags.bitfield.cpuavx512_vnni)
8574         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VNNI;
8575       if (i.tm.cpu_flags.bitfield.cpuavx512_bf16)
8576         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BF16;
8577
8578       if (i.tm.cpu_flags.bitfield.cpu8087
8579           || i.tm.cpu_flags.bitfield.cpu287
8580           || i.tm.cpu_flags.bitfield.cpu387
8581           || i.tm.cpu_flags.bitfield.cpu687
8582           || i.tm.cpu_flags.bitfield.cpufisttp)
8583         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
8584       if (i.has_regmmx
8585           || i.tm.base_opcode == 0xf77 /* emms */
8586           || i.tm.base_opcode == 0xf0e /* femms */)
8587         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
8588       if (i.has_regxmm)
8589         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
8590       if (i.has_regymm)
8591         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
8592       if (i.has_regzmm)
8593         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
8594       if (i.tm.cpu_flags.bitfield.cpufxsr)
8595         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
8596       if (i.tm.cpu_flags.bitfield.cpuxsave)
8597         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
8598       if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
8599         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
8600       if (i.tm.cpu_flags.bitfield.cpuxsavec)
8601         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
8602     }
8603 #endif
8604
8605   /* Tie dwarf2 debug info to the address at the start of the insn.
8606      We can't do this after the insn has been output as the current
8607      frag may have been closed off.  eg. by frag_var.  */
8608   dwarf2_emit_insn (0);
8609
8610   insn_start_frag = frag_now;
8611   insn_start_off = frag_now_fix ();
8612
8613   if (add_branch_padding_frag_p (&branch))
8614     {
8615       char *p;
8616       /* Branch can be 8 bytes.  Leave some room for prefixes.  */
8617       unsigned int max_branch_padding_size = 14;
8618
8619       /* Align section to boundary.  */
8620       record_alignment (now_seg, align_branch_power);
8621
8622       /* Make room for padding.  */
8623       frag_grow (max_branch_padding_size);
8624
8625       /* Start of the padding.  */
8626       p = frag_more (0);
8627
8628       fragP = frag_now;
8629
8630       frag_var (rs_machine_dependent, max_branch_padding_size, 0,
8631                 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
8632                 NULL, 0, p);
8633
8634       fragP->tc_frag_data.branch_type = branch;
8635       fragP->tc_frag_data.max_bytes = max_branch_padding_size;
8636     }
8637
8638   /* Output jumps.  */
8639   if (i.tm.opcode_modifier.jump == JUMP)
8640     output_branch ();
8641   else if (i.tm.opcode_modifier.jump == JUMP_BYTE
8642            || i.tm.opcode_modifier.jump == JUMP_DWORD)
8643     output_jump ();
8644   else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
8645     output_interseg_jump ();
8646   else
8647     {
8648       /* Output normal instructions here.  */
8649       char *p;
8650       unsigned char *q;
8651       unsigned int j;
8652       unsigned int prefix;
8653
8654       if (avoid_fence
8655           && (i.tm.base_opcode == 0xfaee8
8656               || i.tm.base_opcode == 0xfaef0
8657               || i.tm.base_opcode == 0xfaef8))
8658         {
8659           /* Encode lfence, mfence, and sfence as
8660              f0 83 04 24 00   lock addl $0x0, (%{re}sp).  */
8661           offsetT val = 0x240483f0ULL;
8662           p = frag_more (5);
8663           md_number_to_chars (p, val, 5);
8664           return;
8665         }
8666
8667       /* Some processors fail on LOCK prefix. This options makes
8668          assembler ignore LOCK prefix and serves as a workaround.  */
8669       if (omit_lock_prefix)
8670         {
8671           if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
8672             return;
8673           i.prefix[LOCK_PREFIX] = 0;
8674         }
8675
8676       if (branch)
8677         /* Skip if this is a branch.  */
8678         ;
8679       else if (add_fused_jcc_padding_frag_p ())
8680         {
8681           /* Make room for padding.  */
8682           frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
8683           p = frag_more (0);
8684
8685           fragP = frag_now;
8686
8687           frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
8688                     ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
8689                     NULL, 0, p);
8690
8691           fragP->tc_frag_data.branch_type = align_branch_fused;
8692           fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
8693         }
8694       else if (add_branch_prefix_frag_p ())
8695         {
8696           unsigned int max_prefix_size = align_branch_prefix_size;
8697
8698           /* Make room for padding.  */
8699           frag_grow (max_prefix_size);
8700           p = frag_more (0);
8701
8702           fragP = frag_now;
8703
8704           frag_var (rs_machine_dependent, max_prefix_size, 0,
8705                     ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
8706                     NULL, 0, p);
8707
8708           fragP->tc_frag_data.max_bytes = max_prefix_size;
8709         }
8710
8711       /* Since the VEX/EVEX prefix contains the implicit prefix, we
8712          don't need the explicit prefix.  */
8713       if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
8714         {
8715           switch (i.tm.opcode_length)
8716             {
8717             case 3:
8718               if (i.tm.base_opcode & 0xff000000)
8719                 {
8720                   prefix = (i.tm.base_opcode >> 24) & 0xff;
8721                   if (!i.tm.cpu_flags.bitfield.cpupadlock
8722                       || prefix != REPE_PREFIX_OPCODE
8723                       || (i.prefix[REP_PREFIX] != REPE_PREFIX_OPCODE))
8724                     add_prefix (prefix);
8725                 }
8726               break;
8727             case 2:
8728               if ((i.tm.base_opcode & 0xff0000) != 0)
8729                 {
8730                   prefix = (i.tm.base_opcode >> 16) & 0xff;
8731                   add_prefix (prefix);
8732                 }
8733               break;
8734             case 1:
8735               break;
8736             case 0:
8737               /* Check for pseudo prefixes.  */
8738               as_bad_where (insn_start_frag->fr_file,
8739                             insn_start_frag->fr_line,
8740                              _("pseudo prefix without instruction"));
8741               return;
8742             default:
8743               abort ();
8744             }
8745
8746 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
8747           /* For x32, add a dummy REX_OPCODE prefix for mov/add with
8748              R_X86_64_GOTTPOFF relocation so that linker can safely
8749              perform IE->LE optimization.  A dummy REX_OPCODE prefix
8750              is also needed for lea with R_X86_64_GOTPC32_TLSDESC
8751              relocation for GDesc -> IE/LE optimization.  */
8752           if (x86_elf_abi == X86_64_X32_ABI
8753               && i.operands == 2
8754               && (i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
8755                   || i.reloc[0] == BFD_RELOC_X86_64_GOTPC32_TLSDESC)
8756               && i.prefix[REX_PREFIX] == 0)
8757             add_prefix (REX_OPCODE);
8758 #endif
8759
8760           /* The prefix bytes.  */
8761           for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
8762             if (*q)
8763               FRAG_APPEND_1_CHAR (*q);
8764         }
8765       else
8766         {
8767           for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
8768             if (*q)
8769               switch (j)
8770                 {
8771                 case REX_PREFIX:
8772                   /* REX byte is encoded in VEX prefix.  */
8773                   break;
8774                 case SEG_PREFIX:
8775                 case ADDR_PREFIX:
8776                   FRAG_APPEND_1_CHAR (*q);
8777                   break;
8778                 default:
8779                   /* There should be no other prefixes for instructions
8780                      with VEX prefix.  */
8781                   abort ();
8782                 }
8783
8784           /* For EVEX instructions i.vrex should become 0 after
8785              build_evex_prefix.  For VEX instructions upper 16 registers
8786              aren't available, so VREX should be 0.  */
8787           if (i.vrex)
8788             abort ();
8789           /* Now the VEX prefix.  */
8790           p = frag_more (i.vex.length);
8791           for (j = 0; j < i.vex.length; j++)
8792             p[j] = i.vex.bytes[j];
8793         }
8794
8795       /* Now the opcode; be careful about word order here!  */
8796       if (i.tm.opcode_length == 1)
8797         {
8798           FRAG_APPEND_1_CHAR (i.tm.base_opcode);
8799         }
8800       else
8801         {
8802           switch (i.tm.opcode_length)
8803             {
8804             case 4:
8805               p = frag_more (4);
8806               *p++ = (i.tm.base_opcode >> 24) & 0xff;
8807               *p++ = (i.tm.base_opcode >> 16) & 0xff;
8808               break;
8809             case 3:
8810               p = frag_more (3);
8811               *p++ = (i.tm.base_opcode >> 16) & 0xff;
8812               break;
8813             case 2:
8814               p = frag_more (2);
8815               break;
8816             default:
8817               abort ();
8818               break;
8819             }
8820
8821           /* Put out high byte first: can't use md_number_to_chars!  */
8822           *p++ = (i.tm.base_opcode >> 8) & 0xff;
8823           *p = i.tm.base_opcode & 0xff;
8824         }
8825
8826       /* Now the modrm byte and sib byte (if present).  */
8827       if (i.tm.opcode_modifier.modrm)
8828         {
8829           FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
8830                                | i.rm.reg << 3
8831                                | i.rm.mode << 6));
8832           /* If i.rm.regmem == ESP (4)
8833              && i.rm.mode != (Register mode)
8834              && not 16 bit
8835              ==> need second modrm byte.  */
8836           if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
8837               && i.rm.mode != 3
8838               && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
8839             FRAG_APPEND_1_CHAR ((i.sib.base << 0
8840                                  | i.sib.index << 3
8841                                  | i.sib.scale << 6));
8842         }
8843
8844       if (i.disp_operands)
8845         output_disp (insn_start_frag, insn_start_off);
8846
8847       if (i.imm_operands)
8848         output_imm (insn_start_frag, insn_start_off);
8849
8850       /*
8851        * frag_now_fix () returning plain abs_section_offset when we're in the
8852        * absolute section, and abs_section_offset not getting updated as data
8853        * gets added to the frag breaks the logic below.
8854        */
8855       if (now_seg != absolute_section)
8856         {
8857           j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
8858           if (j > 15)
8859             as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
8860                      j);
8861           else if (fragP)
8862             {
8863               /* NB: Don't add prefix with GOTPC relocation since
8864                  output_disp() above depends on the fixed encoding
8865                  length.  Can't add prefix with TLS relocation since
8866                  it breaks TLS linker optimization.  */
8867               unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
8868               /* Prefix count on the current instruction.  */
8869               unsigned int count = i.vex.length;
8870               unsigned int k;
8871               for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
8872                 /* REX byte is encoded in VEX/EVEX prefix.  */
8873                 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
8874                   count++;
8875
8876               /* Count prefixes for extended opcode maps.  */
8877               if (!i.vex.length)
8878                 switch (i.tm.opcode_length)
8879                   {
8880                   case 3:
8881                     if (((i.tm.base_opcode >> 16) & 0xff) == 0xf)
8882                       {
8883                         count++;
8884                         switch ((i.tm.base_opcode >> 8) & 0xff)
8885                           {
8886                           case 0x38:
8887                           case 0x3a:
8888                             count++;
8889                             break;
8890                           default:
8891                             break;
8892                           }
8893                       }
8894                     break;
8895                   case 2:
8896                     if (((i.tm.base_opcode >> 8) & 0xff) == 0xf)
8897                       count++;
8898                     break;
8899                   case 1:
8900                     break;
8901                   default:
8902                     abort ();
8903                   }
8904
8905               if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
8906                   == BRANCH_PREFIX)
8907                 {
8908                   /* Set the maximum prefix size in BRANCH_PREFIX
8909                      frag.  */
8910                   if (fragP->tc_frag_data.max_bytes > max)
8911                     fragP->tc_frag_data.max_bytes = max;
8912                   if (fragP->tc_frag_data.max_bytes > count)
8913                     fragP->tc_frag_data.max_bytes -= count;
8914                   else
8915                     fragP->tc_frag_data.max_bytes = 0;
8916                 }
8917               else
8918                 {
8919                   /* Remember the maximum prefix size in FUSED_JCC_PADDING
8920                      frag.  */
8921                   unsigned int max_prefix_size;
8922                   if (align_branch_prefix_size > max)
8923                     max_prefix_size = max;
8924                   else
8925                     max_prefix_size = align_branch_prefix_size;
8926                   if (max_prefix_size > count)
8927                     fragP->tc_frag_data.max_prefix_length
8928                       = max_prefix_size - count;
8929                 }
8930
8931               /* Use existing segment prefix if possible.  Use CS
8932                  segment prefix in 64-bit mode.  In 32-bit mode, use SS
8933                  segment prefix with ESP/EBP base register and use DS
8934                  segment prefix without ESP/EBP base register.  */
8935               if (i.prefix[SEG_PREFIX])
8936                 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
8937               else if (flag_code == CODE_64BIT)
8938                 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
8939               else if (i.base_reg
8940                        && (i.base_reg->reg_num == 4
8941                            || i.base_reg->reg_num == 5))
8942                 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
8943               else
8944                 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
8945             }
8946         }
8947     }
8948
8949   /* NB: Don't work with COND_JUMP86 without i386.  */
8950   if (align_branch_power
8951       && now_seg != absolute_section
8952       && cpu_arch_flags.bitfield.cpui386)
8953     {
8954       /* Terminate each frag so that we can add prefix and check for
8955          fused jcc.  */
8956       frag_wane (frag_now);
8957       frag_new (0);
8958     }
8959
8960 #ifdef DEBUG386
8961   if (flag_debug)
8962     {
8963       pi ("" /*line*/, &i);
8964     }
8965 #endif /* DEBUG386  */
8966 }
8967
8968 /* Return the size of the displacement operand N.  */
8969
8970 static int
8971 disp_size (unsigned int n)
8972 {
8973   int size = 4;
8974
8975   if (i.types[n].bitfield.disp64)
8976     size = 8;
8977   else if (i.types[n].bitfield.disp8)
8978     size = 1;
8979   else if (i.types[n].bitfield.disp16)
8980     size = 2;
8981   return size;
8982 }
8983
8984 /* Return the size of the immediate operand N.  */
8985
8986 static int
8987 imm_size (unsigned int n)
8988 {
8989   int size = 4;
8990   if (i.types[n].bitfield.imm64)
8991     size = 8;
8992   else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
8993     size = 1;
8994   else if (i.types[n].bitfield.imm16)
8995     size = 2;
8996   return size;
8997 }
8998
8999 static void
9000 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
9001 {
9002   char *p;
9003   unsigned int n;
9004
9005   for (n = 0; n < i.operands; n++)
9006     {
9007       if (operand_type_check (i.types[n], disp))
9008         {
9009           if (i.op[n].disps->X_op == O_constant)
9010             {
9011               int size = disp_size (n);
9012               offsetT val = i.op[n].disps->X_add_number;
9013
9014               val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
9015                                      size);
9016               p = frag_more (size);
9017               md_number_to_chars (p, val, size);
9018             }
9019           else
9020             {
9021               enum bfd_reloc_code_real reloc_type;
9022               int size = disp_size (n);
9023               int sign = i.types[n].bitfield.disp32s;
9024               int pcrel = (i.flags[n] & Operand_PCrel) != 0;
9025               fixS *fixP;
9026
9027               /* We can't have 8 bit displacement here.  */
9028               gas_assert (!i.types[n].bitfield.disp8);
9029
9030               /* The PC relative address is computed relative
9031                  to the instruction boundary, so in case immediate
9032                  fields follows, we need to adjust the value.  */
9033               if (pcrel && i.imm_operands)
9034                 {
9035                   unsigned int n1;
9036                   int sz = 0;
9037
9038                   for (n1 = 0; n1 < i.operands; n1++)
9039                     if (operand_type_check (i.types[n1], imm))
9040                       {
9041                         /* Only one immediate is allowed for PC
9042                            relative address.  */
9043                         gas_assert (sz == 0);
9044                         sz = imm_size (n1);
9045                         i.op[n].disps->X_add_number -= sz;
9046                       }
9047                   /* We should find the immediate.  */
9048                   gas_assert (sz != 0);
9049                 }
9050
9051               p = frag_more (size);
9052               reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
9053               if (GOT_symbol
9054                   && GOT_symbol == i.op[n].disps->X_add_symbol
9055                   && (((reloc_type == BFD_RELOC_32
9056                         || reloc_type == BFD_RELOC_X86_64_32S
9057                         || (reloc_type == BFD_RELOC_64
9058                             && object_64bit))
9059                        && (i.op[n].disps->X_op == O_symbol
9060                            || (i.op[n].disps->X_op == O_add
9061                                && ((symbol_get_value_expression
9062                                     (i.op[n].disps->X_op_symbol)->X_op)
9063                                    == O_subtract))))
9064                       || reloc_type == BFD_RELOC_32_PCREL))
9065                 {
9066                   if (!object_64bit)
9067                     {
9068                       reloc_type = BFD_RELOC_386_GOTPC;
9069                       i.has_gotpc_tls_reloc = TRUE;
9070                       i.op[n].imms->X_add_number +=
9071                         encoding_length (insn_start_frag, insn_start_off, p);
9072                     }
9073                   else if (reloc_type == BFD_RELOC_64)
9074                     reloc_type = BFD_RELOC_X86_64_GOTPC64;
9075                   else
9076                     /* Don't do the adjustment for x86-64, as there
9077                        the pcrel addressing is relative to the _next_
9078                        insn, and that is taken care of in other code.  */
9079                     reloc_type = BFD_RELOC_X86_64_GOTPC32;
9080                 }
9081               else if (align_branch_power)
9082                 {
9083                   switch (reloc_type)
9084                     {
9085                     case BFD_RELOC_386_TLS_GD:
9086                     case BFD_RELOC_386_TLS_LDM:
9087                     case BFD_RELOC_386_TLS_IE:
9088                     case BFD_RELOC_386_TLS_IE_32:
9089                     case BFD_RELOC_386_TLS_GOTIE:
9090                     case BFD_RELOC_386_TLS_GOTDESC:
9091                     case BFD_RELOC_386_TLS_DESC_CALL:
9092                     case BFD_RELOC_X86_64_TLSGD:
9093                     case BFD_RELOC_X86_64_TLSLD:
9094                     case BFD_RELOC_X86_64_GOTTPOFF:
9095                     case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9096                     case BFD_RELOC_X86_64_TLSDESC_CALL:
9097                       i.has_gotpc_tls_reloc = TRUE;
9098                     default:
9099                       break;
9100                     }
9101                 }
9102               fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
9103                                   size, i.op[n].disps, pcrel,
9104                                   reloc_type);
9105               /* Check for "call/jmp *mem", "mov mem, %reg",
9106                  "test %reg, mem" and "binop mem, %reg" where binop
9107                  is one of adc, add, and, cmp, or, sbb, sub, xor
9108                  instructions without data prefix.  Always generate
9109                  R_386_GOT32X for "sym*GOT" operand in 32-bit mode.  */
9110               if (i.prefix[DATA_PREFIX] == 0
9111                   && (generate_relax_relocations
9112                       || (!object_64bit
9113                           && i.rm.mode == 0
9114                           && i.rm.regmem == 5))
9115                   && (i.rm.mode == 2
9116                       || (i.rm.mode == 0 && i.rm.regmem == 5))
9117                   && !is_any_vex_encoding(&i.tm)
9118                   && ((i.operands == 1
9119                        && i.tm.base_opcode == 0xff
9120                        && (i.rm.reg == 2 || i.rm.reg == 4))
9121                       || (i.operands == 2
9122                           && (i.tm.base_opcode == 0x8b
9123                               || i.tm.base_opcode == 0x85
9124                               || (i.tm.base_opcode & ~0x38) == 0x03))))
9125                 {
9126                   if (object_64bit)
9127                     {
9128                       fixP->fx_tcbit = i.rex != 0;
9129                       if (i.base_reg
9130                           && (i.base_reg->reg_num == RegIP))
9131                       fixP->fx_tcbit2 = 1;
9132                     }
9133                   else
9134                     fixP->fx_tcbit2 = 1;
9135                 }
9136             }
9137         }
9138     }
9139 }
9140
9141 static void
9142 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
9143 {
9144   char *p;
9145   unsigned int n;
9146
9147   for (n = 0; n < i.operands; n++)
9148     {
9149       /* Skip SAE/RC Imm operand in EVEX.  They are already handled.  */
9150       if (i.rounding && (int) n == i.rounding->operand)
9151         continue;
9152
9153       if (operand_type_check (i.types[n], imm))
9154         {
9155           if (i.op[n].imms->X_op == O_constant)
9156             {
9157               int size = imm_size (n);
9158               offsetT val;
9159
9160               val = offset_in_range (i.op[n].imms->X_add_number,
9161                                      size);
9162               p = frag_more (size);
9163               md_number_to_chars (p, val, size);
9164             }
9165           else
9166             {
9167               /* Not absolute_section.
9168                  Need a 32-bit fixup (don't support 8bit
9169                  non-absolute imms).  Try to support other
9170                  sizes ...  */
9171               enum bfd_reloc_code_real reloc_type;
9172               int size = imm_size (n);
9173               int sign;
9174
9175               if (i.types[n].bitfield.imm32s
9176                   && (i.suffix == QWORD_MNEM_SUFFIX
9177                       || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
9178                 sign = 1;
9179               else
9180                 sign = 0;
9181
9182               p = frag_more (size);
9183               reloc_type = reloc (size, 0, sign, i.reloc[n]);
9184
9185               /*   This is tough to explain.  We end up with this one if we
9186                * have operands that look like
9187                * "_GLOBAL_OFFSET_TABLE_+[.-.L284]".  The goal here is to
9188                * obtain the absolute address of the GOT, and it is strongly
9189                * preferable from a performance point of view to avoid using
9190                * a runtime relocation for this.  The actual sequence of
9191                * instructions often look something like:
9192                *
9193                *        call    .L66
9194                * .L66:
9195                *        popl    %ebx
9196                *        addl    $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
9197                *
9198                *   The call and pop essentially return the absolute address
9199                * of the label .L66 and store it in %ebx.  The linker itself
9200                * will ultimately change the first operand of the addl so
9201                * that %ebx points to the GOT, but to keep things simple, the
9202                * .o file must have this operand set so that it generates not
9203                * the absolute address of .L66, but the absolute address of
9204                * itself.  This allows the linker itself simply treat a GOTPC
9205                * relocation as asking for a pcrel offset to the GOT to be
9206                * added in, and the addend of the relocation is stored in the
9207                * operand field for the instruction itself.
9208                *
9209                *   Our job here is to fix the operand so that it would add
9210                * the correct offset so that %ebx would point to itself.  The
9211                * thing that is tricky is that .-.L66 will point to the
9212                * beginning of the instruction, so we need to further modify
9213                * the operand so that it will point to itself.  There are
9214                * other cases where you have something like:
9215                *
9216                *        .long   $_GLOBAL_OFFSET_TABLE_+[.-.L66]
9217                *
9218                * and here no correction would be required.  Internally in
9219                * the assembler we treat operands of this form as not being
9220                * pcrel since the '.' is explicitly mentioned, and I wonder
9221                * whether it would simplify matters to do it this way.  Who
9222                * knows.  In earlier versions of the PIC patches, the
9223                * pcrel_adjust field was used to store the correction, but
9224                * since the expression is not pcrel, I felt it would be
9225                * confusing to do it this way.  */
9226
9227               if ((reloc_type == BFD_RELOC_32
9228                    || reloc_type == BFD_RELOC_X86_64_32S
9229                    || reloc_type == BFD_RELOC_64)
9230                   && GOT_symbol
9231                   && GOT_symbol == i.op[n].imms->X_add_symbol
9232                   && (i.op[n].imms->X_op == O_symbol
9233                       || (i.op[n].imms->X_op == O_add
9234                           && ((symbol_get_value_expression
9235                                (i.op[n].imms->X_op_symbol)->X_op)
9236                               == O_subtract))))
9237                 {
9238                   if (!object_64bit)
9239                     reloc_type = BFD_RELOC_386_GOTPC;
9240                   else if (size == 4)
9241                     reloc_type = BFD_RELOC_X86_64_GOTPC32;
9242                   else if (size == 8)
9243                     reloc_type = BFD_RELOC_X86_64_GOTPC64;
9244                   i.has_gotpc_tls_reloc = TRUE;
9245                   i.op[n].imms->X_add_number +=
9246                     encoding_length (insn_start_frag, insn_start_off, p);
9247                 }
9248               fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9249                            i.op[n].imms, 0, reloc_type);
9250             }
9251         }
9252     }
9253 }
9254 \f
9255 /* x86_cons_fix_new is called via the expression parsing code when a
9256    reloc is needed.  We use this hook to get the correct .got reloc.  */
9257 static int cons_sign = -1;
9258
9259 void
9260 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
9261                   expressionS *exp, bfd_reloc_code_real_type r)
9262 {
9263   r = reloc (len, 0, cons_sign, r);
9264
9265 #ifdef TE_PE
9266   if (exp->X_op == O_secrel)
9267     {
9268       exp->X_op = O_symbol;
9269       r = BFD_RELOC_32_SECREL;
9270     }
9271 #endif
9272
9273   fix_new_exp (frag, off, len, exp, 0, r);
9274 }
9275
9276 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
9277    purpose of the `.dc.a' internal pseudo-op.  */
9278
9279 int
9280 x86_address_bytes (void)
9281 {
9282   if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
9283     return 4;
9284   return stdoutput->arch_info->bits_per_address / 8;
9285 }
9286
9287 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
9288     || defined (LEX_AT)
9289 # define lex_got(reloc, adjust, types) NULL
9290 #else
9291 /* Parse operands of the form
9292    <symbol>@GOTOFF+<nnn>
9293    and similar .plt or .got references.
9294
9295    If we find one, set up the correct relocation in RELOC and copy the
9296    input string, minus the `@GOTOFF' into a malloc'd buffer for
9297    parsing by the calling routine.  Return this buffer, and if ADJUST
9298    is non-null set it to the length of the string we removed from the
9299    input line.  Otherwise return NULL.  */
9300 static char *
9301 lex_got (enum bfd_reloc_code_real *rel,
9302          int *adjust,
9303          i386_operand_type *types)
9304 {
9305   /* Some of the relocations depend on the size of what field is to
9306      be relocated.  But in our callers i386_immediate and i386_displacement
9307      we don't yet know the operand size (this will be set by insn
9308      matching).  Hence we record the word32 relocation here,
9309      and adjust the reloc according to the real size in reloc().  */
9310   static const struct {
9311     const char *str;
9312     int len;
9313     const enum bfd_reloc_code_real rel[2];
9314     const i386_operand_type types64;
9315   } gotrel[] = {
9316 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9317     { STRING_COMMA_LEN ("SIZE"),      { BFD_RELOC_SIZE32,
9318                                         BFD_RELOC_SIZE32 },
9319       OPERAND_TYPE_IMM32_64 },
9320 #endif
9321     { STRING_COMMA_LEN ("PLTOFF"),   { _dummy_first_bfd_reloc_code_real,
9322                                        BFD_RELOC_X86_64_PLTOFF64 },
9323       OPERAND_TYPE_IMM64 },
9324     { STRING_COMMA_LEN ("PLT"),      { BFD_RELOC_386_PLT32,
9325                                        BFD_RELOC_X86_64_PLT32    },
9326       OPERAND_TYPE_IMM32_32S_DISP32 },
9327     { STRING_COMMA_LEN ("GOTPLT"),   { _dummy_first_bfd_reloc_code_real,
9328                                        BFD_RELOC_X86_64_GOTPLT64 },
9329       OPERAND_TYPE_IMM64_DISP64 },
9330     { STRING_COMMA_LEN ("GOTOFF"),   { BFD_RELOC_386_GOTOFF,
9331                                        BFD_RELOC_X86_64_GOTOFF64 },
9332       OPERAND_TYPE_IMM64_DISP64 },
9333     { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
9334                                        BFD_RELOC_X86_64_GOTPCREL },
9335       OPERAND_TYPE_IMM32_32S_DISP32 },
9336     { STRING_COMMA_LEN ("TLSGD"),    { BFD_RELOC_386_TLS_GD,
9337                                        BFD_RELOC_X86_64_TLSGD    },
9338       OPERAND_TYPE_IMM32_32S_DISP32 },
9339     { STRING_COMMA_LEN ("TLSLDM"),   { BFD_RELOC_386_TLS_LDM,
9340                                        _dummy_first_bfd_reloc_code_real },
9341       OPERAND_TYPE_NONE },
9342     { STRING_COMMA_LEN ("TLSLD"),    { _dummy_first_bfd_reloc_code_real,
9343                                        BFD_RELOC_X86_64_TLSLD    },
9344       OPERAND_TYPE_IMM32_32S_DISP32 },
9345     { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
9346                                        BFD_RELOC_X86_64_GOTTPOFF },
9347       OPERAND_TYPE_IMM32_32S_DISP32 },
9348     { STRING_COMMA_LEN ("TPOFF"),    { BFD_RELOC_386_TLS_LE_32,
9349                                        BFD_RELOC_X86_64_TPOFF32  },
9350       OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9351     { STRING_COMMA_LEN ("NTPOFF"),   { BFD_RELOC_386_TLS_LE,
9352                                        _dummy_first_bfd_reloc_code_real },
9353       OPERAND_TYPE_NONE },
9354     { STRING_COMMA_LEN ("DTPOFF"),   { BFD_RELOC_386_TLS_LDO_32,
9355                                        BFD_RELOC_X86_64_DTPOFF32 },
9356       OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9357     { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
9358                                        _dummy_first_bfd_reloc_code_real },
9359       OPERAND_TYPE_NONE },
9360     { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
9361                                        _dummy_first_bfd_reloc_code_real },
9362       OPERAND_TYPE_NONE },
9363     { STRING_COMMA_LEN ("GOT"),      { BFD_RELOC_386_GOT32,
9364                                        BFD_RELOC_X86_64_GOT32    },
9365       OPERAND_TYPE_IMM32_32S_64_DISP32 },
9366     { STRING_COMMA_LEN ("TLSDESC"),  { BFD_RELOC_386_TLS_GOTDESC,
9367                                        BFD_RELOC_X86_64_GOTPC32_TLSDESC },
9368       OPERAND_TYPE_IMM32_32S_DISP32 },
9369     { STRING_COMMA_LEN ("TLSCALL"),  { BFD_RELOC_386_TLS_DESC_CALL,
9370                                        BFD_RELOC_X86_64_TLSDESC_CALL },
9371       OPERAND_TYPE_IMM32_32S_DISP32 },
9372   };
9373   char *cp;
9374   unsigned int j;
9375
9376 #if defined (OBJ_MAYBE_ELF)
9377   if (!IS_ELF)
9378     return NULL;
9379 #endif
9380
9381   for (cp = input_line_pointer; *cp != '@'; cp++)
9382     if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9383       return NULL;
9384
9385   for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9386     {
9387       int len = gotrel[j].len;
9388       if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9389         {
9390           if (gotrel[j].rel[object_64bit] != 0)
9391             {
9392               int first, second;
9393               char *tmpbuf, *past_reloc;
9394
9395               *rel = gotrel[j].rel[object_64bit];
9396
9397               if (types)
9398                 {
9399                   if (flag_code != CODE_64BIT)
9400                     {
9401                       types->bitfield.imm32 = 1;
9402                       types->bitfield.disp32 = 1;
9403                     }
9404                   else
9405                     *types = gotrel[j].types64;
9406                 }
9407
9408               if (j != 0 && GOT_symbol == NULL)
9409                 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
9410
9411               /* The length of the first part of our input line.  */
9412               first = cp - input_line_pointer;
9413
9414               /* The second part goes from after the reloc token until
9415                  (and including) an end_of_line char or comma.  */
9416               past_reloc = cp + 1 + len;
9417               cp = past_reloc;
9418               while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9419                 ++cp;
9420               second = cp + 1 - past_reloc;
9421
9422               /* Allocate and copy string.  The trailing NUL shouldn't
9423                  be necessary, but be safe.  */
9424               tmpbuf = XNEWVEC (char, first + second + 2);
9425               memcpy (tmpbuf, input_line_pointer, first);
9426               if (second != 0 && *past_reloc != ' ')
9427                 /* Replace the relocation token with ' ', so that
9428                    errors like foo@GOTOFF1 will be detected.  */
9429                 tmpbuf[first++] = ' ';
9430               else
9431                 /* Increment length by 1 if the relocation token is
9432                    removed.  */
9433                 len++;
9434               if (adjust)
9435                 *adjust = len;
9436               memcpy (tmpbuf + first, past_reloc, second);
9437               tmpbuf[first + second] = '\0';
9438               return tmpbuf;
9439             }
9440
9441           as_bad (_("@%s reloc is not supported with %d-bit output format"),
9442                   gotrel[j].str, 1 << (5 + object_64bit));
9443           return NULL;
9444         }
9445     }
9446
9447   /* Might be a symbol version string.  Don't as_bad here.  */
9448   return NULL;
9449 }
9450 #endif
9451
9452 #ifdef TE_PE
9453 #ifdef lex_got
9454 #undef lex_got
9455 #endif
9456 /* Parse operands of the form
9457    <symbol>@SECREL32+<nnn>
9458
9459    If we find one, set up the correct relocation in RELOC and copy the
9460    input string, minus the `@SECREL32' into a malloc'd buffer for
9461    parsing by the calling routine.  Return this buffer, and if ADJUST
9462    is non-null set it to the length of the string we removed from the
9463    input line.  Otherwise return NULL.
9464
9465    This function is copied from the ELF version above adjusted for PE targets.  */
9466
9467 static char *
9468 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
9469          int *adjust ATTRIBUTE_UNUSED,
9470          i386_operand_type *types)
9471 {
9472   static const struct
9473   {
9474     const char *str;
9475     int len;
9476     const enum bfd_reloc_code_real rel[2];
9477     const i386_operand_type types64;
9478   }
9479   gotrel[] =
9480   {
9481     { STRING_COMMA_LEN ("SECREL32"),    { BFD_RELOC_32_SECREL,
9482                                           BFD_RELOC_32_SECREL },
9483       OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9484   };
9485
9486   char *cp;
9487   unsigned j;
9488
9489   for (cp = input_line_pointer; *cp != '@'; cp++)
9490     if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9491       return NULL;
9492
9493   for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9494     {
9495       int len = gotrel[j].len;
9496
9497       if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9498         {
9499           if (gotrel[j].rel[object_64bit] != 0)
9500             {
9501               int first, second;
9502               char *tmpbuf, *past_reloc;
9503
9504               *rel = gotrel[j].rel[object_64bit];
9505               if (adjust)
9506                 *adjust = len;
9507
9508               if (types)
9509                 {
9510                   if (flag_code != CODE_64BIT)
9511                     {
9512                       types->bitfield.imm32 = 1;
9513                       types->bitfield.disp32 = 1;
9514                     }
9515                   else
9516                     *types = gotrel[j].types64;
9517                 }
9518
9519               /* The length of the first part of our input line.  */
9520               first = cp - input_line_pointer;
9521
9522               /* The second part goes from after the reloc token until
9523                  (and including) an end_of_line char or comma.  */
9524               past_reloc = cp + 1 + len;
9525               cp = past_reloc;
9526               while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9527                 ++cp;
9528               second = cp + 1 - past_reloc;
9529
9530               /* Allocate and copy string.  The trailing NUL shouldn't
9531                  be necessary, but be safe.  */
9532               tmpbuf = XNEWVEC (char, first + second + 2);
9533               memcpy (tmpbuf, input_line_pointer, first);
9534               if (second != 0 && *past_reloc != ' ')
9535                 /* Replace the relocation token with ' ', so that
9536                    errors like foo@SECLREL321 will be detected.  */
9537                 tmpbuf[first++] = ' ';
9538               memcpy (tmpbuf + first, past_reloc, second);
9539               tmpbuf[first + second] = '\0';
9540               return tmpbuf;
9541             }
9542
9543           as_bad (_("@%s reloc is not supported with %d-bit output format"),
9544                   gotrel[j].str, 1 << (5 + object_64bit));
9545           return NULL;
9546         }
9547     }
9548
9549   /* Might be a symbol version string.  Don't as_bad here.  */
9550   return NULL;
9551 }
9552
9553 #endif /* TE_PE */
9554
9555 bfd_reloc_code_real_type
9556 x86_cons (expressionS *exp, int size)
9557 {
9558   bfd_reloc_code_real_type got_reloc = NO_RELOC;
9559
9560   intel_syntax = -intel_syntax;
9561
9562   exp->X_md = 0;
9563   if (size == 4 || (object_64bit && size == 8))
9564     {
9565       /* Handle @GOTOFF and the like in an expression.  */
9566       char *save;
9567       char *gotfree_input_line;
9568       int adjust = 0;
9569
9570       save = input_line_pointer;
9571       gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
9572       if (gotfree_input_line)
9573         input_line_pointer = gotfree_input_line;
9574
9575       expression (exp);
9576
9577       if (gotfree_input_line)
9578         {
9579           /* expression () has merrily parsed up to the end of line,
9580              or a comma - in the wrong buffer.  Transfer how far
9581              input_line_pointer has moved to the right buffer.  */
9582           input_line_pointer = (save
9583                                 + (input_line_pointer - gotfree_input_line)
9584                                 + adjust);
9585           free (gotfree_input_line);
9586           if (exp->X_op == O_constant
9587               || exp->X_op == O_absent
9588               || exp->X_op == O_illegal
9589               || exp->X_op == O_register
9590               || exp->X_op == O_big)
9591             {
9592               char c = *input_line_pointer;
9593               *input_line_pointer = 0;
9594               as_bad (_("missing or invalid expression `%s'"), save);
9595               *input_line_pointer = c;
9596             }
9597           else if ((got_reloc == BFD_RELOC_386_PLT32
9598                     || got_reloc == BFD_RELOC_X86_64_PLT32)
9599                    && exp->X_op != O_symbol)
9600             {
9601               char c = *input_line_pointer;
9602               *input_line_pointer = 0;
9603               as_bad (_("invalid PLT expression `%s'"), save);
9604               *input_line_pointer = c;
9605             }
9606         }
9607     }
9608   else
9609     expression (exp);
9610
9611   intel_syntax = -intel_syntax;
9612
9613   if (intel_syntax)
9614     i386_intel_simplify (exp);
9615
9616   return got_reloc;
9617 }
9618
9619 static void
9620 signed_cons (int size)
9621 {
9622   if (flag_code == CODE_64BIT)
9623     cons_sign = 1;
9624   cons (size);
9625   cons_sign = -1;
9626 }
9627
9628 #ifdef TE_PE
9629 static void
9630 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
9631 {
9632   expressionS exp;
9633
9634   do
9635     {
9636       expression (&exp);
9637       if (exp.X_op == O_symbol)
9638         exp.X_op = O_secrel;
9639
9640       emit_expr (&exp, 4);
9641     }
9642   while (*input_line_pointer++ == ',');
9643
9644   input_line_pointer--;
9645   demand_empty_rest_of_line ();
9646 }
9647 #endif
9648
9649 /* Handle Vector operations.  */
9650
9651 static char *
9652 check_VecOperations (char *op_string, char *op_end)
9653 {
9654   const reg_entry *mask;
9655   const char *saved;
9656   char *end_op;
9657
9658   while (*op_string
9659          && (op_end == NULL || op_string < op_end))
9660     {
9661       saved = op_string;
9662       if (*op_string == '{')
9663         {
9664           op_string++;
9665
9666           /* Check broadcasts.  */
9667           if (strncmp (op_string, "1to", 3) == 0)
9668             {
9669               int bcst_type;
9670
9671               if (i.broadcast)
9672                 goto duplicated_vec_op;
9673
9674               op_string += 3;
9675               if (*op_string == '8')
9676                 bcst_type = 8;
9677               else if (*op_string == '4')
9678                 bcst_type = 4;
9679               else if (*op_string == '2')
9680                 bcst_type = 2;
9681               else if (*op_string == '1'
9682                        && *(op_string+1) == '6')
9683                 {
9684                   bcst_type = 16;
9685                   op_string++;
9686                 }
9687               else
9688                 {
9689                   as_bad (_("Unsupported broadcast: `%s'"), saved);
9690                   return NULL;
9691                 }
9692               op_string++;
9693
9694               broadcast_op.type = bcst_type;
9695               broadcast_op.operand = this_operand;
9696               broadcast_op.bytes = 0;
9697               i.broadcast = &broadcast_op;
9698             }
9699           /* Check masking operation.  */
9700           else if ((mask = parse_register (op_string, &end_op)) != NULL)
9701             {
9702               /* k0 can't be used for write mask.  */
9703               if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
9704                 {
9705                   as_bad (_("`%s%s' can't be used for write mask"),
9706                           register_prefix, mask->reg_name);
9707                   return NULL;
9708                 }
9709
9710               if (!i.mask)
9711                 {
9712                   mask_op.mask = mask;
9713                   mask_op.zeroing = 0;
9714                   mask_op.operand = this_operand;
9715                   i.mask = &mask_op;
9716                 }
9717               else
9718                 {
9719                   if (i.mask->mask)
9720                     goto duplicated_vec_op;
9721
9722                   i.mask->mask = mask;
9723
9724                   /* Only "{z}" is allowed here.  No need to check
9725                      zeroing mask explicitly.  */
9726                   if (i.mask->operand != this_operand)
9727                     {
9728                       as_bad (_("invalid write mask `%s'"), saved);
9729                       return NULL;
9730                     }
9731                 }
9732
9733               op_string = end_op;
9734             }
9735           /* Check zeroing-flag for masking operation.  */
9736           else if (*op_string == 'z')
9737             {
9738               if (!i.mask)
9739                 {
9740                   mask_op.mask = NULL;
9741                   mask_op.zeroing = 1;
9742                   mask_op.operand = this_operand;
9743                   i.mask = &mask_op;
9744                 }
9745               else
9746                 {
9747                   if (i.mask->zeroing)
9748                     {
9749                     duplicated_vec_op:
9750                       as_bad (_("duplicated `%s'"), saved);
9751                       return NULL;
9752                     }
9753
9754                   i.mask->zeroing = 1;
9755
9756                   /* Only "{%k}" is allowed here.  No need to check mask
9757                      register explicitly.  */
9758                   if (i.mask->operand != this_operand)
9759                     {
9760                       as_bad (_("invalid zeroing-masking `%s'"),
9761                               saved);
9762                       return NULL;
9763                     }
9764                 }
9765
9766               op_string++;
9767             }
9768           else
9769             goto unknown_vec_op;
9770
9771           if (*op_string != '}')
9772             {
9773               as_bad (_("missing `}' in `%s'"), saved);
9774               return NULL;
9775             }
9776           op_string++;
9777
9778           /* Strip whitespace since the addition of pseudo prefixes
9779              changed how the scrubber treats '{'.  */
9780           if (is_space_char (*op_string))
9781             ++op_string;
9782
9783           continue;
9784         }
9785     unknown_vec_op:
9786       /* We don't know this one.  */
9787       as_bad (_("unknown vector operation: `%s'"), saved);
9788       return NULL;
9789     }
9790
9791   if (i.mask && i.mask->zeroing && !i.mask->mask)
9792     {
9793       as_bad (_("zeroing-masking only allowed with write mask"));
9794       return NULL;
9795     }
9796
9797   return op_string;
9798 }
9799
9800 static int
9801 i386_immediate (char *imm_start)
9802 {
9803   char *save_input_line_pointer;
9804   char *gotfree_input_line;
9805   segT exp_seg = 0;
9806   expressionS *exp;
9807   i386_operand_type types;
9808
9809   operand_type_set (&types, ~0);
9810
9811   if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
9812     {
9813       as_bad (_("at most %d immediate operands are allowed"),
9814               MAX_IMMEDIATE_OPERANDS);
9815       return 0;
9816     }
9817
9818   exp = &im_expressions[i.imm_operands++];
9819   i.op[this_operand].imms = exp;
9820
9821   if (is_space_char (*imm_start))
9822     ++imm_start;
9823
9824   save_input_line_pointer = input_line_pointer;
9825   input_line_pointer = imm_start;
9826
9827   gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
9828   if (gotfree_input_line)
9829     input_line_pointer = gotfree_input_line;
9830
9831   exp_seg = expression (exp);
9832
9833   SKIP_WHITESPACE ();
9834
9835   /* Handle vector operations.  */
9836   if (*input_line_pointer == '{')
9837     {
9838       input_line_pointer = check_VecOperations (input_line_pointer,
9839                                                 NULL);
9840       if (input_line_pointer == NULL)
9841         return 0;
9842     }
9843
9844   if (*input_line_pointer)
9845     as_bad (_("junk `%s' after expression"), input_line_pointer);
9846
9847   input_line_pointer = save_input_line_pointer;
9848   if (gotfree_input_line)
9849     {
9850       free (gotfree_input_line);
9851
9852       if (exp->X_op == O_constant || exp->X_op == O_register)
9853         exp->X_op = O_illegal;
9854     }
9855
9856   return i386_finalize_immediate (exp_seg, exp, types, imm_start);
9857 }
9858
9859 static int
9860 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
9861                          i386_operand_type types, const char *imm_start)
9862 {
9863   if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
9864     {
9865       if (imm_start)
9866         as_bad (_("missing or invalid immediate expression `%s'"),
9867                 imm_start);
9868       return 0;
9869     }
9870   else if (exp->X_op == O_constant)
9871     {
9872       /* Size it properly later.  */
9873       i.types[this_operand].bitfield.imm64 = 1;
9874       /* If not 64bit, sign extend val.  */
9875       if (flag_code != CODE_64BIT
9876           && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
9877         exp->X_add_number
9878           = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
9879     }
9880 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
9881   else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
9882            && exp_seg != absolute_section
9883            && exp_seg != text_section
9884            && exp_seg != data_section
9885            && exp_seg != bss_section
9886            && exp_seg != undefined_section
9887            && !bfd_is_com_section (exp_seg))
9888     {
9889       as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
9890       return 0;
9891     }
9892 #endif
9893   else if (!intel_syntax && exp_seg == reg_section)
9894     {
9895       if (imm_start)
9896         as_bad (_("illegal immediate register operand %s"), imm_start);
9897       return 0;
9898     }
9899   else
9900     {
9901       /* This is an address.  The size of the address will be
9902          determined later, depending on destination register,
9903          suffix, or the default for the section.  */
9904       i.types[this_operand].bitfield.imm8 = 1;
9905       i.types[this_operand].bitfield.imm16 = 1;
9906       i.types[this_operand].bitfield.imm32 = 1;
9907       i.types[this_operand].bitfield.imm32s = 1;
9908       i.types[this_operand].bitfield.imm64 = 1;
9909       i.types[this_operand] = operand_type_and (i.types[this_operand],
9910                                                 types);
9911     }
9912
9913   return 1;
9914 }
9915
9916 static char *
9917 i386_scale (char *scale)
9918 {
9919   offsetT val;
9920   char *save = input_line_pointer;
9921
9922   input_line_pointer = scale;
9923   val = get_absolute_expression ();
9924
9925   switch (val)
9926     {
9927     case 1:
9928       i.log2_scale_factor = 0;
9929       break;
9930     case 2:
9931       i.log2_scale_factor = 1;
9932       break;
9933     case 4:
9934       i.log2_scale_factor = 2;
9935       break;
9936     case 8:
9937       i.log2_scale_factor = 3;
9938       break;
9939     default:
9940       {
9941         char sep = *input_line_pointer;
9942
9943         *input_line_pointer = '\0';
9944         as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
9945                 scale);
9946         *input_line_pointer = sep;
9947         input_line_pointer = save;
9948         return NULL;
9949       }
9950     }
9951   if (i.log2_scale_factor != 0 && i.index_reg == 0)
9952     {
9953       as_warn (_("scale factor of %d without an index register"),
9954                1 << i.log2_scale_factor);
9955       i.log2_scale_factor = 0;
9956     }
9957   scale = input_line_pointer;
9958   input_line_pointer = save;
9959   return scale;
9960 }
9961
9962 static int
9963 i386_displacement (char *disp_start, char *disp_end)
9964 {
9965   expressionS *exp;
9966   segT exp_seg = 0;
9967   char *save_input_line_pointer;
9968   char *gotfree_input_line;
9969   int override;
9970   i386_operand_type bigdisp, types = anydisp;
9971   int ret;
9972
9973   if (i.disp_operands == MAX_MEMORY_OPERANDS)
9974     {
9975       as_bad (_("at most %d displacement operands are allowed"),
9976               MAX_MEMORY_OPERANDS);
9977       return 0;
9978     }
9979
9980   operand_type_set (&bigdisp, 0);
9981   if (i.jumpabsolute
9982       || i.types[this_operand].bitfield.baseindex
9983       || (current_templates->start->opcode_modifier.jump != JUMP
9984           && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
9985     {
9986       i386_addressing_mode ();
9987       override = (i.prefix[ADDR_PREFIX] != 0);
9988       if (flag_code == CODE_64BIT)
9989         {
9990           if (!override)
9991             {
9992               bigdisp.bitfield.disp32s = 1;
9993               bigdisp.bitfield.disp64 = 1;
9994             }
9995           else
9996             bigdisp.bitfield.disp32 = 1;
9997         }
9998       else if ((flag_code == CODE_16BIT) ^ override)
9999           bigdisp.bitfield.disp16 = 1;
10000       else
10001           bigdisp.bitfield.disp32 = 1;
10002     }
10003   else
10004     {
10005       /* For PC-relative branches, the width of the displacement may be
10006          dependent upon data size, but is never dependent upon address size.
10007          Also make sure to not unintentionally match against a non-PC-relative
10008          branch template.  */
10009       static templates aux_templates;
10010       const insn_template *t = current_templates->start;
10011       bfd_boolean has_intel64 = FALSE;
10012
10013       aux_templates.start = t;
10014       while (++t < current_templates->end)
10015         {
10016           if (t->opcode_modifier.jump
10017               != current_templates->start->opcode_modifier.jump)
10018             break;
10019           if ((t->opcode_modifier.isa64 >= INTEL64))
10020             has_intel64 = TRUE;
10021         }
10022       if (t < current_templates->end)
10023         {
10024           aux_templates.end = t;
10025           current_templates = &aux_templates;
10026         }
10027
10028       override = (i.prefix[DATA_PREFIX] != 0);
10029       if (flag_code == CODE_64BIT)
10030         {
10031           if ((override || i.suffix == WORD_MNEM_SUFFIX)
10032               && (!intel64 || !has_intel64))
10033             bigdisp.bitfield.disp16 = 1;
10034           else
10035             bigdisp.bitfield.disp32s = 1;
10036         }
10037       else
10038         {
10039           if (!override)
10040             override = (i.suffix == (flag_code != CODE_16BIT
10041                                      ? WORD_MNEM_SUFFIX
10042                                      : LONG_MNEM_SUFFIX));
10043           bigdisp.bitfield.disp32 = 1;
10044           if ((flag_code == CODE_16BIT) ^ override)
10045             {
10046               bigdisp.bitfield.disp32 = 0;
10047               bigdisp.bitfield.disp16 = 1;
10048             }
10049         }
10050     }
10051   i.types[this_operand] = operand_type_or (i.types[this_operand],
10052                                            bigdisp);
10053
10054   exp = &disp_expressions[i.disp_operands];
10055   i.op[this_operand].disps = exp;
10056   i.disp_operands++;
10057   save_input_line_pointer = input_line_pointer;
10058   input_line_pointer = disp_start;
10059   END_STRING_AND_SAVE (disp_end);
10060
10061 #ifndef GCC_ASM_O_HACK
10062 #define GCC_ASM_O_HACK 0
10063 #endif
10064 #if GCC_ASM_O_HACK
10065   END_STRING_AND_SAVE (disp_end + 1);
10066   if (i.types[this_operand].bitfield.baseIndex
10067       && displacement_string_end[-1] == '+')
10068     {
10069       /* This hack is to avoid a warning when using the "o"
10070          constraint within gcc asm statements.
10071          For instance:
10072
10073          #define _set_tssldt_desc(n,addr,limit,type) \
10074          __asm__ __volatile__ ( \
10075          "movw %w2,%0\n\t" \
10076          "movw %w1,2+%0\n\t" \
10077          "rorl $16,%1\n\t" \
10078          "movb %b1,4+%0\n\t" \
10079          "movb %4,5+%0\n\t" \
10080          "movb $0,6+%0\n\t" \
10081          "movb %h1,7+%0\n\t" \
10082          "rorl $16,%1" \
10083          : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
10084
10085          This works great except that the output assembler ends
10086          up looking a bit weird if it turns out that there is
10087          no offset.  You end up producing code that looks like:
10088
10089          #APP
10090          movw $235,(%eax)
10091          movw %dx,2+(%eax)
10092          rorl $16,%edx
10093          movb %dl,4+(%eax)
10094          movb $137,5+(%eax)
10095          movb $0,6+(%eax)
10096          movb %dh,7+(%eax)
10097          rorl $16,%edx
10098          #NO_APP
10099
10100          So here we provide the missing zero.  */
10101
10102       *displacement_string_end = '0';
10103     }
10104 #endif
10105   gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10106   if (gotfree_input_line)
10107     input_line_pointer = gotfree_input_line;
10108
10109   exp_seg = expression (exp);
10110
10111   SKIP_WHITESPACE ();
10112   if (*input_line_pointer)
10113     as_bad (_("junk `%s' after expression"), input_line_pointer);
10114 #if GCC_ASM_O_HACK
10115   RESTORE_END_STRING (disp_end + 1);
10116 #endif
10117   input_line_pointer = save_input_line_pointer;
10118   if (gotfree_input_line)
10119     {
10120       free (gotfree_input_line);
10121
10122       if (exp->X_op == O_constant || exp->X_op == O_register)
10123         exp->X_op = O_illegal;
10124     }
10125
10126   ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
10127
10128   RESTORE_END_STRING (disp_end);
10129
10130   return ret;
10131 }
10132
10133 static int
10134 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10135                             i386_operand_type types, const char *disp_start)
10136 {
10137   i386_operand_type bigdisp;
10138   int ret = 1;
10139
10140   /* We do this to make sure that the section symbol is in
10141      the symbol table.  We will ultimately change the relocation
10142      to be relative to the beginning of the section.  */
10143   if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
10144       || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
10145       || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10146     {
10147       if (exp->X_op != O_symbol)
10148         goto inv_disp;
10149
10150       if (S_IS_LOCAL (exp->X_add_symbol)
10151           && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
10152           && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
10153         section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
10154       exp->X_op = O_subtract;
10155       exp->X_op_symbol = GOT_symbol;
10156       if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
10157         i.reloc[this_operand] = BFD_RELOC_32_PCREL;
10158       else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10159         i.reloc[this_operand] = BFD_RELOC_64;
10160       else
10161         i.reloc[this_operand] = BFD_RELOC_32;
10162     }
10163
10164   else if (exp->X_op == O_absent
10165            || exp->X_op == O_illegal
10166            || exp->X_op == O_big)
10167     {
10168     inv_disp:
10169       as_bad (_("missing or invalid displacement expression `%s'"),
10170               disp_start);
10171       ret = 0;
10172     }
10173
10174   else if (flag_code == CODE_64BIT
10175            && !i.prefix[ADDR_PREFIX]
10176            && exp->X_op == O_constant)
10177     {
10178       /* Since displacement is signed extended to 64bit, don't allow
10179          disp32 and turn off disp32s if they are out of range.  */
10180       i.types[this_operand].bitfield.disp32 = 0;
10181       if (!fits_in_signed_long (exp->X_add_number))
10182         {
10183           i.types[this_operand].bitfield.disp32s = 0;
10184           if (i.types[this_operand].bitfield.baseindex)
10185             {
10186               as_bad (_("0x%lx out range of signed 32bit displacement"),
10187                       (long) exp->X_add_number);
10188               ret = 0;
10189             }
10190         }
10191     }
10192
10193 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10194   else if (exp->X_op != O_constant
10195            && OUTPUT_FLAVOR == bfd_target_aout_flavour
10196            && exp_seg != absolute_section
10197            && exp_seg != text_section
10198            && exp_seg != data_section
10199            && exp_seg != bss_section
10200            && exp_seg != undefined_section
10201            && !bfd_is_com_section (exp_seg))
10202     {
10203       as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10204       ret = 0;
10205     }
10206 #endif
10207
10208   if (current_templates->start->opcode_modifier.jump == JUMP_BYTE
10209       /* Constants get taken care of by optimize_disp().  */
10210       && exp->X_op != O_constant)
10211     i.types[this_operand].bitfield.disp8 = 1;
10212
10213   /* Check if this is a displacement only operand.  */
10214   bigdisp = i.types[this_operand];
10215   bigdisp.bitfield.disp8 = 0;
10216   bigdisp.bitfield.disp16 = 0;
10217   bigdisp.bitfield.disp32 = 0;
10218   bigdisp.bitfield.disp32s = 0;
10219   bigdisp.bitfield.disp64 = 0;
10220   if (operand_type_all_zero (&bigdisp))
10221     i.types[this_operand] = operand_type_and (i.types[this_operand],
10222                                               types);
10223
10224   return ret;
10225 }
10226
10227 /* Return the active addressing mode, taking address override and
10228    registers forming the address into consideration.  Update the
10229    address override prefix if necessary.  */
10230
10231 static enum flag_code
10232 i386_addressing_mode (void)
10233 {
10234   enum flag_code addr_mode;
10235
10236   if (i.prefix[ADDR_PREFIX])
10237     addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
10238   else
10239     {
10240       addr_mode = flag_code;
10241
10242 #if INFER_ADDR_PREFIX
10243       if (i.mem_operands == 0)
10244         {
10245           /* Infer address prefix from the first memory operand.  */
10246           const reg_entry *addr_reg = i.base_reg;
10247
10248           if (addr_reg == NULL)
10249             addr_reg = i.index_reg;
10250
10251           if (addr_reg)
10252             {
10253               if (addr_reg->reg_type.bitfield.dword)
10254                 addr_mode = CODE_32BIT;
10255               else if (flag_code != CODE_64BIT
10256                        && addr_reg->reg_type.bitfield.word)
10257                 addr_mode = CODE_16BIT;
10258
10259               if (addr_mode != flag_code)
10260                 {
10261                   i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10262                   i.prefixes += 1;
10263                   /* Change the size of any displacement too.  At most one
10264                      of Disp16 or Disp32 is set.
10265                      FIXME.  There doesn't seem to be any real need for
10266                      separate Disp16 and Disp32 flags.  The same goes for
10267                      Imm16 and Imm32.  Removing them would probably clean
10268                      up the code quite a lot.  */
10269                   if (flag_code != CODE_64BIT
10270                       && (i.types[this_operand].bitfield.disp16
10271                           || i.types[this_operand].bitfield.disp32))
10272                     i.types[this_operand]
10273                       = operand_type_xor (i.types[this_operand], disp16_32);
10274                 }
10275             }
10276         }
10277 #endif
10278     }
10279
10280   return addr_mode;
10281 }
10282
10283 /* Make sure the memory operand we've been dealt is valid.
10284    Return 1 on success, 0 on a failure.  */
10285
10286 static int
10287 i386_index_check (const char *operand_string)
10288 {
10289   const char *kind = "base/index";
10290   enum flag_code addr_mode = i386_addressing_mode ();
10291
10292   if (current_templates->start->opcode_modifier.isstring
10293       && !current_templates->start->cpu_flags.bitfield.cpupadlock
10294       && (current_templates->end[-1].opcode_modifier.isstring
10295           || i.mem_operands))
10296     {
10297       /* Memory operands of string insns are special in that they only allow
10298          a single register (rDI, rSI, or rBX) as their memory address.  */
10299       const reg_entry *expected_reg;
10300       static const char *di_si[][2] =
10301         {
10302           { "esi", "edi" },
10303           { "si", "di" },
10304           { "rsi", "rdi" }
10305         };
10306       static const char *bx[] = { "ebx", "bx", "rbx" };
10307
10308       kind = "string address";
10309
10310       if (current_templates->start->opcode_modifier.repprefixok)
10311         {
10312           int es_op = current_templates->end[-1].opcode_modifier.isstring
10313                       - IS_STRING_ES_OP0;
10314           int op = 0;
10315
10316           if (!current_templates->end[-1].operand_types[0].bitfield.baseindex
10317               || ((!i.mem_operands != !intel_syntax)
10318                   && current_templates->end[-1].operand_types[1]
10319                      .bitfield.baseindex))
10320             op = 1;
10321           expected_reg = hash_find (reg_hash, di_si[addr_mode][op == es_op]);
10322         }
10323       else
10324         expected_reg = hash_find (reg_hash, bx[addr_mode]);
10325
10326       if (i.base_reg != expected_reg
10327           || i.index_reg
10328           || operand_type_check (i.types[this_operand], disp))
10329         {
10330           /* The second memory operand must have the same size as
10331              the first one.  */
10332           if (i.mem_operands
10333               && i.base_reg
10334               && !((addr_mode == CODE_64BIT
10335                     && i.base_reg->reg_type.bitfield.qword)
10336                    || (addr_mode == CODE_32BIT
10337                        ? i.base_reg->reg_type.bitfield.dword
10338                        : i.base_reg->reg_type.bitfield.word)))
10339             goto bad_address;
10340
10341           as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
10342                    operand_string,
10343                    intel_syntax ? '[' : '(',
10344                    register_prefix,
10345                    expected_reg->reg_name,
10346                    intel_syntax ? ']' : ')');
10347           return 1;
10348         }
10349       else
10350         return 1;
10351
10352 bad_address:
10353       as_bad (_("`%s' is not a valid %s expression"),
10354               operand_string, kind);
10355       return 0;
10356     }
10357   else
10358     {
10359       if (addr_mode != CODE_16BIT)
10360         {
10361           /* 32-bit/64-bit checks.  */
10362           if ((i.base_reg
10363                && ((addr_mode == CODE_64BIT
10364                     ? !i.base_reg->reg_type.bitfield.qword
10365                     : !i.base_reg->reg_type.bitfield.dword)
10366                    || (i.index_reg && i.base_reg->reg_num == RegIP)
10367                    || i.base_reg->reg_num == RegIZ))
10368               || (i.index_reg
10369                   && !i.index_reg->reg_type.bitfield.xmmword
10370                   && !i.index_reg->reg_type.bitfield.ymmword
10371                   && !i.index_reg->reg_type.bitfield.zmmword
10372                   && ((addr_mode == CODE_64BIT
10373                        ? !i.index_reg->reg_type.bitfield.qword
10374                        : !i.index_reg->reg_type.bitfield.dword)
10375                       || !i.index_reg->reg_type.bitfield.baseindex)))
10376             goto bad_address;
10377
10378           /* bndmk, bndldx, and bndstx have special restrictions. */
10379           if (current_templates->start->base_opcode == 0xf30f1b
10380               || (current_templates->start->base_opcode & ~1) == 0x0f1a)
10381             {
10382               /* They cannot use RIP-relative addressing. */
10383               if (i.base_reg && i.base_reg->reg_num == RegIP)
10384                 {
10385                   as_bad (_("`%s' cannot be used here"), operand_string);
10386                   return 0;
10387                 }
10388
10389               /* bndldx and bndstx ignore their scale factor. */
10390               if (current_templates->start->base_opcode != 0xf30f1b
10391                   && i.log2_scale_factor)
10392                 as_warn (_("register scaling is being ignored here"));
10393             }
10394         }
10395       else
10396         {
10397           /* 16-bit checks.  */
10398           if ((i.base_reg
10399                && (!i.base_reg->reg_type.bitfield.word
10400                    || !i.base_reg->reg_type.bitfield.baseindex))
10401               || (i.index_reg
10402                   && (!i.index_reg->reg_type.bitfield.word
10403                       || !i.index_reg->reg_type.bitfield.baseindex
10404                       || !(i.base_reg
10405                            && i.base_reg->reg_num < 6
10406                            && i.index_reg->reg_num >= 6
10407                            && i.log2_scale_factor == 0))))
10408             goto bad_address;
10409         }
10410     }
10411   return 1;
10412 }
10413
10414 /* Handle vector immediates.  */
10415
10416 static int
10417 RC_SAE_immediate (const char *imm_start)
10418 {
10419   unsigned int match_found, j;
10420   const char *pstr = imm_start;
10421   expressionS *exp;
10422
10423   if (*pstr != '{')
10424     return 0;
10425
10426   pstr++;
10427   match_found = 0;
10428   for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
10429     {
10430       if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
10431         {
10432           if (!i.rounding)
10433             {
10434               rc_op.type = RC_NamesTable[j].type;
10435               rc_op.operand = this_operand;
10436               i.rounding = &rc_op;
10437             }
10438           else
10439             {
10440               as_bad (_("duplicated `%s'"), imm_start);
10441               return 0;
10442             }
10443           pstr += RC_NamesTable[j].len;
10444           match_found = 1;
10445           break;
10446         }
10447     }
10448   if (!match_found)
10449     return 0;
10450
10451   if (*pstr++ != '}')
10452     {
10453       as_bad (_("Missing '}': '%s'"), imm_start);
10454       return 0;
10455     }
10456   /* RC/SAE immediate string should contain nothing more.  */;
10457   if (*pstr != 0)
10458     {
10459       as_bad (_("Junk after '}': '%s'"), imm_start);
10460       return 0;
10461     }
10462
10463   exp = &im_expressions[i.imm_operands++];
10464   i.op[this_operand].imms = exp;
10465
10466   exp->X_op = O_constant;
10467   exp->X_add_number = 0;
10468   exp->X_add_symbol = (symbolS *) 0;
10469   exp->X_op_symbol = (symbolS *) 0;
10470
10471   i.types[this_operand].bitfield.imm8 = 1;
10472   return 1;
10473 }
10474
10475 /* Only string instructions can have a second memory operand, so
10476    reduce current_templates to just those if it contains any.  */
10477 static int
10478 maybe_adjust_templates (void)
10479 {
10480   const insn_template *t;
10481
10482   gas_assert (i.mem_operands == 1);
10483
10484   for (t = current_templates->start; t < current_templates->end; ++t)
10485     if (t->opcode_modifier.isstring)
10486       break;
10487
10488   if (t < current_templates->end)
10489     {
10490       static templates aux_templates;
10491       bfd_boolean recheck;
10492
10493       aux_templates.start = t;
10494       for (; t < current_templates->end; ++t)
10495         if (!t->opcode_modifier.isstring)
10496           break;
10497       aux_templates.end = t;
10498
10499       /* Determine whether to re-check the first memory operand.  */
10500       recheck = (aux_templates.start != current_templates->start
10501                  || t != current_templates->end);
10502
10503       current_templates = &aux_templates;
10504
10505       if (recheck)
10506         {
10507           i.mem_operands = 0;
10508           if (i.memop1_string != NULL
10509               && i386_index_check (i.memop1_string) == 0)
10510             return 0;
10511           i.mem_operands = 1;
10512         }
10513     }
10514
10515   return 1;
10516 }
10517
10518 /* Parse OPERAND_STRING into the i386_insn structure I.  Returns zero
10519    on error.  */
10520
10521 static int
10522 i386_att_operand (char *operand_string)
10523 {
10524   const reg_entry *r;
10525   char *end_op;
10526   char *op_string = operand_string;
10527
10528   if (is_space_char (*op_string))
10529     ++op_string;
10530
10531   /* We check for an absolute prefix (differentiating,
10532      for example, 'jmp pc_relative_label' from 'jmp *absolute_label'.  */
10533   if (*op_string == ABSOLUTE_PREFIX)
10534     {
10535       ++op_string;
10536       if (is_space_char (*op_string))
10537         ++op_string;
10538       i.jumpabsolute = TRUE;
10539     }
10540
10541   /* Check if operand is a register.  */
10542   if ((r = parse_register (op_string, &end_op)) != NULL)
10543     {
10544       i386_operand_type temp;
10545
10546       /* Check for a segment override by searching for ':' after a
10547          segment register.  */
10548       op_string = end_op;
10549       if (is_space_char (*op_string))
10550         ++op_string;
10551       if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
10552         {
10553           switch (r->reg_num)
10554             {
10555             case 0:
10556               i.seg[i.mem_operands] = &es;
10557               break;
10558             case 1:
10559               i.seg[i.mem_operands] = &cs;
10560               break;
10561             case 2:
10562               i.seg[i.mem_operands] = &ss;
10563               break;
10564             case 3:
10565               i.seg[i.mem_operands] = &ds;
10566               break;
10567             case 4:
10568               i.seg[i.mem_operands] = &fs;
10569               break;
10570             case 5:
10571               i.seg[i.mem_operands] = &gs;
10572               break;
10573             }
10574
10575           /* Skip the ':' and whitespace.  */
10576           ++op_string;
10577           if (is_space_char (*op_string))
10578             ++op_string;
10579
10580           if (!is_digit_char (*op_string)
10581               && !is_identifier_char (*op_string)
10582               && *op_string != '('
10583               && *op_string != ABSOLUTE_PREFIX)
10584             {
10585               as_bad (_("bad memory operand `%s'"), op_string);
10586               return 0;
10587             }
10588           /* Handle case of %es:*foo.  */
10589           if (*op_string == ABSOLUTE_PREFIX)
10590             {
10591               ++op_string;
10592               if (is_space_char (*op_string))
10593                 ++op_string;
10594               i.jumpabsolute = TRUE;
10595             }
10596           goto do_memory_reference;
10597         }
10598
10599       /* Handle vector operations.  */
10600       if (*op_string == '{')
10601         {
10602           op_string = check_VecOperations (op_string, NULL);
10603           if (op_string == NULL)
10604             return 0;
10605         }
10606
10607       if (*op_string)
10608         {
10609           as_bad (_("junk `%s' after register"), op_string);
10610           return 0;
10611         }
10612       temp = r->reg_type;
10613       temp.bitfield.baseindex = 0;
10614       i.types[this_operand] = operand_type_or (i.types[this_operand],
10615                                                temp);
10616       i.types[this_operand].bitfield.unspecified = 0;
10617       i.op[this_operand].regs = r;
10618       i.reg_operands++;
10619     }
10620   else if (*op_string == REGISTER_PREFIX)
10621     {
10622       as_bad (_("bad register name `%s'"), op_string);
10623       return 0;
10624     }
10625   else if (*op_string == IMMEDIATE_PREFIX)
10626     {
10627       ++op_string;
10628       if (i.jumpabsolute)
10629         {
10630           as_bad (_("immediate operand illegal with absolute jump"));
10631           return 0;
10632         }
10633       if (!i386_immediate (op_string))
10634         return 0;
10635     }
10636   else if (RC_SAE_immediate (operand_string))
10637     {
10638       /* If it is a RC or SAE immediate, do nothing.  */
10639       ;
10640     }
10641   else if (is_digit_char (*op_string)
10642            || is_identifier_char (*op_string)
10643            || *op_string == '"'
10644            || *op_string == '(')
10645     {
10646       /* This is a memory reference of some sort.  */
10647       char *base_string;
10648
10649       /* Start and end of displacement string expression (if found).  */
10650       char *displacement_string_start;
10651       char *displacement_string_end;
10652       char *vop_start;
10653
10654     do_memory_reference:
10655       if (i.mem_operands == 1 && !maybe_adjust_templates ())
10656         return 0;
10657       if ((i.mem_operands == 1
10658            && !current_templates->start->opcode_modifier.isstring)
10659           || i.mem_operands == 2)
10660         {
10661           as_bad (_("too many memory references for `%s'"),
10662                   current_templates->start->name);
10663           return 0;
10664         }
10665
10666       /* Check for base index form.  We detect the base index form by
10667          looking for an ')' at the end of the operand, searching
10668          for the '(' matching it, and finding a REGISTER_PREFIX or ','
10669          after the '('.  */
10670       base_string = op_string + strlen (op_string);
10671
10672       /* Handle vector operations.  */
10673       vop_start = strchr (op_string, '{');
10674       if (vop_start && vop_start < base_string)
10675         {
10676           if (check_VecOperations (vop_start, base_string) == NULL)
10677             return 0;
10678           base_string = vop_start;
10679         }
10680
10681       --base_string;
10682       if (is_space_char (*base_string))
10683         --base_string;
10684
10685       /* If we only have a displacement, set-up for it to be parsed later.  */
10686       displacement_string_start = op_string;
10687       displacement_string_end = base_string + 1;
10688
10689       if (*base_string == ')')
10690         {
10691           char *temp_string;
10692           unsigned int parens_balanced = 1;
10693           /* We've already checked that the number of left & right ()'s are
10694              equal, so this loop will not be infinite.  */
10695           do
10696             {
10697               base_string--;
10698               if (*base_string == ')')
10699                 parens_balanced++;
10700               if (*base_string == '(')
10701                 parens_balanced--;
10702             }
10703           while (parens_balanced);
10704
10705           temp_string = base_string;
10706
10707           /* Skip past '(' and whitespace.  */
10708           ++base_string;
10709           if (is_space_char (*base_string))
10710             ++base_string;
10711
10712           if (*base_string == ','
10713               || ((i.base_reg = parse_register (base_string, &end_op))
10714                   != NULL))
10715             {
10716               displacement_string_end = temp_string;
10717
10718               i.types[this_operand].bitfield.baseindex = 1;
10719
10720               if (i.base_reg)
10721                 {
10722                   base_string = end_op;
10723                   if (is_space_char (*base_string))
10724                     ++base_string;
10725                 }
10726
10727               /* There may be an index reg or scale factor here.  */
10728               if (*base_string == ',')
10729                 {
10730                   ++base_string;
10731                   if (is_space_char (*base_string))
10732                     ++base_string;
10733
10734                   if ((i.index_reg = parse_register (base_string, &end_op))
10735                       != NULL)
10736                     {
10737                       base_string = end_op;
10738                       if (is_space_char (*base_string))
10739                         ++base_string;
10740                       if (*base_string == ',')
10741                         {
10742                           ++base_string;
10743                           if (is_space_char (*base_string))
10744                             ++base_string;
10745                         }
10746                       else if (*base_string != ')')
10747                         {
10748                           as_bad (_("expecting `,' or `)' "
10749                                     "after index register in `%s'"),
10750                                   operand_string);
10751                           return 0;
10752                         }
10753                     }
10754                   else if (*base_string == REGISTER_PREFIX)
10755                     {
10756                       end_op = strchr (base_string, ',');
10757                       if (end_op)
10758                         *end_op = '\0';
10759                       as_bad (_("bad register name `%s'"), base_string);
10760                       return 0;
10761                     }
10762
10763                   /* Check for scale factor.  */
10764                   if (*base_string != ')')
10765                     {
10766                       char *end_scale = i386_scale (base_string);
10767
10768                       if (!end_scale)
10769                         return 0;
10770
10771                       base_string = end_scale;
10772                       if (is_space_char (*base_string))
10773                         ++base_string;
10774                       if (*base_string != ')')
10775                         {
10776                           as_bad (_("expecting `)' "
10777                                     "after scale factor in `%s'"),
10778                                   operand_string);
10779                           return 0;
10780                         }
10781                     }
10782                   else if (!i.index_reg)
10783                     {
10784                       as_bad (_("expecting index register or scale factor "
10785                                 "after `,'; got '%c'"),
10786                               *base_string);
10787                       return 0;
10788                     }
10789                 }
10790               else if (*base_string != ')')
10791                 {
10792                   as_bad (_("expecting `,' or `)' "
10793                             "after base register in `%s'"),
10794                           operand_string);
10795                   return 0;
10796                 }
10797             }
10798           else if (*base_string == REGISTER_PREFIX)
10799             {
10800               end_op = strchr (base_string, ',');
10801               if (end_op)
10802                 *end_op = '\0';
10803               as_bad (_("bad register name `%s'"), base_string);
10804               return 0;
10805             }
10806         }
10807
10808       /* If there's an expression beginning the operand, parse it,
10809          assuming displacement_string_start and
10810          displacement_string_end are meaningful.  */
10811       if (displacement_string_start != displacement_string_end)
10812         {
10813           if (!i386_displacement (displacement_string_start,
10814                                   displacement_string_end))
10815             return 0;
10816         }
10817
10818       /* Special case for (%dx) while doing input/output op.  */
10819       if (i.base_reg
10820           && i.base_reg->reg_type.bitfield.instance == RegD
10821           && i.base_reg->reg_type.bitfield.word
10822           && i.index_reg == 0
10823           && i.log2_scale_factor == 0
10824           && i.seg[i.mem_operands] == 0
10825           && !operand_type_check (i.types[this_operand], disp))
10826         {
10827           i.types[this_operand] = i.base_reg->reg_type;
10828           return 1;
10829         }
10830
10831       if (i386_index_check (operand_string) == 0)
10832         return 0;
10833       i.flags[this_operand] |= Operand_Mem;
10834       if (i.mem_operands == 0)
10835         i.memop1_string = xstrdup (operand_string);
10836       i.mem_operands++;
10837     }
10838   else
10839     {
10840       /* It's not a memory operand; argh!  */
10841       as_bad (_("invalid char %s beginning operand %d `%s'"),
10842               output_invalid (*op_string),
10843               this_operand + 1,
10844               op_string);
10845       return 0;
10846     }
10847   return 1;                     /* Normal return.  */
10848 }
10849 \f
10850 /* Calculate the maximum variable size (i.e., excluding fr_fix)
10851    that an rs_machine_dependent frag may reach.  */
10852
10853 unsigned int
10854 i386_frag_max_var (fragS *frag)
10855 {
10856   /* The only relaxable frags are for jumps.
10857      Unconditional jumps can grow by 4 bytes and others by 5 bytes.  */
10858   gas_assert (frag->fr_type == rs_machine_dependent);
10859   return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
10860 }
10861
10862 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10863 static int
10864 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
10865 {
10866   /* STT_GNU_IFUNC symbol must go through PLT.  */
10867   if ((symbol_get_bfdsym (fr_symbol)->flags
10868        & BSF_GNU_INDIRECT_FUNCTION) != 0)
10869     return 0;
10870
10871   if (!S_IS_EXTERNAL (fr_symbol))
10872     /* Symbol may be weak or local.  */
10873     return !S_IS_WEAK (fr_symbol);
10874
10875   /* Global symbols with non-default visibility can't be preempted. */
10876   if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
10877     return 1;
10878
10879   if (fr_var != NO_RELOC)
10880     switch ((enum bfd_reloc_code_real) fr_var)
10881       {
10882       case BFD_RELOC_386_PLT32:
10883       case BFD_RELOC_X86_64_PLT32:
10884         /* Symbol with PLT relocation may be preempted. */
10885         return 0;
10886       default:
10887         abort ();
10888       }
10889
10890   /* Global symbols with default visibility in a shared library may be
10891      preempted by another definition.  */
10892   return !shared;
10893 }
10894 #endif
10895
10896 /* Return the next non-empty frag.  */
10897
10898 static fragS *
10899 i386_next_non_empty_frag (fragS *fragP)
10900 {
10901   /* There may be a frag with a ".fill 0" when there is no room in
10902      the current frag for frag_grow in output_insn.  */
10903   for (fragP = fragP->fr_next;
10904        (fragP != NULL
10905         && fragP->fr_type == rs_fill
10906         && fragP->fr_fix == 0);
10907        fragP = fragP->fr_next)
10908     ;
10909   return fragP;
10910 }
10911
10912 /* Return the next jcc frag after BRANCH_PADDING.  */
10913
10914 static fragS *
10915 i386_next_jcc_frag (fragS *fragP)
10916 {
10917   if (!fragP)
10918     return NULL;
10919
10920   if (fragP->fr_type == rs_machine_dependent
10921       && (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
10922           == BRANCH_PADDING))
10923     {
10924       fragP = i386_next_non_empty_frag (fragP);
10925       if (fragP->fr_type != rs_machine_dependent)
10926         return NULL;
10927       if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == COND_JUMP)
10928         return fragP;
10929     }
10930
10931   return NULL;
10932 }
10933
10934 /* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags.  */
10935
10936 static void
10937 i386_classify_machine_dependent_frag (fragS *fragP)
10938 {
10939   fragS *cmp_fragP;
10940   fragS *pad_fragP;
10941   fragS *branch_fragP;
10942   fragS *next_fragP;
10943   unsigned int max_prefix_length;
10944
10945   if (fragP->tc_frag_data.classified)
10946     return;
10947
10948   /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING.  Convert
10949      FUSED_JCC_PADDING and merge BRANCH_PADDING.  */
10950   for (next_fragP = fragP;
10951        next_fragP != NULL;
10952        next_fragP = next_fragP->fr_next)
10953     {
10954       next_fragP->tc_frag_data.classified = 1;
10955       if (next_fragP->fr_type == rs_machine_dependent)
10956         switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
10957           {
10958           case BRANCH_PADDING:
10959             /* The BRANCH_PADDING frag must be followed by a branch
10960                frag.  */
10961             branch_fragP = i386_next_non_empty_frag (next_fragP);
10962             next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
10963             break;
10964           case FUSED_JCC_PADDING:
10965             /* Check if this is a fused jcc:
10966                FUSED_JCC_PADDING
10967                CMP like instruction
10968                BRANCH_PADDING
10969                COND_JUMP
10970                */
10971             cmp_fragP = i386_next_non_empty_frag (next_fragP);
10972             pad_fragP = i386_next_non_empty_frag (cmp_fragP);
10973             branch_fragP = i386_next_jcc_frag (pad_fragP);
10974             if (branch_fragP)
10975               {
10976                 /* The BRANCH_PADDING frag is merged with the
10977                    FUSED_JCC_PADDING frag.  */
10978                 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
10979                 /* CMP like instruction size.  */
10980                 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
10981                 frag_wane (pad_fragP);
10982                 /* Skip to branch_fragP.  */
10983                 next_fragP = branch_fragP;
10984               }
10985             else if (next_fragP->tc_frag_data.max_prefix_length)
10986               {
10987                 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
10988                    a fused jcc.  */
10989                 next_fragP->fr_subtype
10990                   = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
10991                 next_fragP->tc_frag_data.max_bytes
10992                   = next_fragP->tc_frag_data.max_prefix_length;
10993                 /* This will be updated in the BRANCH_PREFIX scan.  */
10994                 next_fragP->tc_frag_data.max_prefix_length = 0;
10995               }
10996             else
10997               frag_wane (next_fragP);
10998             break;
10999           }
11000     }
11001
11002   /* Stop if there is no BRANCH_PREFIX.  */
11003   if (!align_branch_prefix_size)
11004     return;
11005
11006   /* Scan for BRANCH_PREFIX.  */
11007   for (; fragP != NULL; fragP = fragP->fr_next)
11008     {
11009       if (fragP->fr_type != rs_machine_dependent
11010           || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11011               != BRANCH_PREFIX))
11012         continue;
11013
11014       /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
11015          COND_JUMP_PREFIX.  */
11016       max_prefix_length = 0;
11017       for (next_fragP = fragP;
11018            next_fragP != NULL;
11019            next_fragP = next_fragP->fr_next)
11020         {
11021           if (next_fragP->fr_type == rs_fill)
11022             /* Skip rs_fill frags.  */
11023             continue;
11024           else if (next_fragP->fr_type != rs_machine_dependent)
11025             /* Stop for all other frags.  */
11026             break;
11027
11028           /* rs_machine_dependent frags.  */
11029           if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11030               == BRANCH_PREFIX)
11031             {
11032               /* Count BRANCH_PREFIX frags.  */
11033               if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
11034                 {
11035                   max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
11036                   frag_wane (next_fragP);
11037                 }
11038               else
11039                 max_prefix_length
11040                   += next_fragP->tc_frag_data.max_bytes;
11041             }
11042           else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11043                     == BRANCH_PADDING)
11044                    || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11045                        == FUSED_JCC_PADDING))
11046             {
11047               /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING.  */
11048               fragP->tc_frag_data.u.padding_fragP = next_fragP;
11049               break;
11050             }
11051           else
11052             /* Stop for other rs_machine_dependent frags.  */
11053             break;
11054         }
11055
11056       fragP->tc_frag_data.max_prefix_length = max_prefix_length;
11057
11058       /* Skip to the next frag.  */
11059       fragP = next_fragP;
11060     }
11061 }
11062
11063 /* Compute padding size for
11064
11065         FUSED_JCC_PADDING
11066         CMP like instruction
11067         BRANCH_PADDING
11068         COND_JUMP/UNCOND_JUMP
11069
11070    or
11071
11072         BRANCH_PADDING
11073         COND_JUMP/UNCOND_JUMP
11074  */
11075
11076 static int
11077 i386_branch_padding_size (fragS *fragP, offsetT address)
11078 {
11079   unsigned int offset, size, padding_size;
11080   fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
11081
11082   /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag.  */
11083   if (!address)
11084     address = fragP->fr_address;
11085   address += fragP->fr_fix;
11086
11087   /* CMP like instrunction size.  */
11088   size = fragP->tc_frag_data.cmp_size;
11089
11090   /* The base size of the branch frag.  */
11091   size += branch_fragP->fr_fix;
11092
11093   /* Add opcode and displacement bytes for the rs_machine_dependent
11094      branch frag.  */
11095   if (branch_fragP->fr_type == rs_machine_dependent)
11096     size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
11097
11098   /* Check if branch is within boundary and doesn't end at the last
11099      byte.  */
11100   offset = address & ((1U << align_branch_power) - 1);
11101   if ((offset + size) >= (1U << align_branch_power))
11102     /* Padding needed to avoid crossing boundary.  */
11103     padding_size = (1U << align_branch_power) - offset;
11104   else
11105     /* No padding needed.  */
11106     padding_size = 0;
11107
11108   /* The return value may be saved in tc_frag_data.length which is
11109      unsigned byte.  */
11110   if (!fits_in_unsigned_byte (padding_size))
11111     abort ();
11112
11113   return padding_size;
11114 }
11115
11116 /* i386_generic_table_relax_frag()
11117
11118    Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
11119    grow/shrink padding to align branch frags.  Hand others to
11120    relax_frag().  */
11121
11122 long
11123 i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
11124 {
11125   if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11126       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11127     {
11128       long padding_size = i386_branch_padding_size (fragP, 0);
11129       long grow = padding_size - fragP->tc_frag_data.length;
11130
11131       /* When the BRANCH_PREFIX frag is used, the computed address
11132          must match the actual address and there should be no padding.  */
11133       if (fragP->tc_frag_data.padding_address
11134           && (fragP->tc_frag_data.padding_address != fragP->fr_address
11135               || padding_size))
11136         abort ();
11137
11138       /* Update the padding size.  */
11139       if (grow)
11140         fragP->tc_frag_data.length = padding_size;
11141
11142       return grow;
11143     }
11144   else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11145     {
11146       fragS *padding_fragP, *next_fragP;
11147       long padding_size, left_size, last_size;
11148
11149       padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11150       if (!padding_fragP)
11151         /* Use the padding set by the leading BRANCH_PREFIX frag.  */
11152         return (fragP->tc_frag_data.length
11153                 - fragP->tc_frag_data.last_length);
11154
11155       /* Compute the relative address of the padding frag in the very
11156         first time where the BRANCH_PREFIX frag sizes are zero.  */
11157       if (!fragP->tc_frag_data.padding_address)
11158         fragP->tc_frag_data.padding_address
11159           = padding_fragP->fr_address - (fragP->fr_address - stretch);
11160
11161       /* First update the last length from the previous interation.  */
11162       left_size = fragP->tc_frag_data.prefix_length;
11163       for (next_fragP = fragP;
11164            next_fragP != padding_fragP;
11165            next_fragP = next_fragP->fr_next)
11166         if (next_fragP->fr_type == rs_machine_dependent
11167             && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11168                 == BRANCH_PREFIX))
11169           {
11170             if (left_size)
11171               {
11172                 int max = next_fragP->tc_frag_data.max_bytes;
11173                 if (max)
11174                   {
11175                     int size;
11176                     if (max > left_size)
11177                       size = left_size;
11178                     else
11179                       size = max;
11180                     left_size -= size;
11181                     next_fragP->tc_frag_data.last_length = size;
11182                   }
11183               }
11184             else
11185               next_fragP->tc_frag_data.last_length = 0;
11186           }
11187
11188       /* Check the padding size for the padding frag.  */
11189       padding_size = i386_branch_padding_size
11190         (padding_fragP, (fragP->fr_address
11191                          + fragP->tc_frag_data.padding_address));
11192
11193       last_size = fragP->tc_frag_data.prefix_length;
11194       /* Check if there is change from the last interation.  */
11195       if (padding_size == last_size)
11196         {
11197           /* Update the expected address of the padding frag.  */
11198           padding_fragP->tc_frag_data.padding_address
11199             = (fragP->fr_address + padding_size
11200                + fragP->tc_frag_data.padding_address);
11201           return 0;
11202         }
11203
11204       if (padding_size > fragP->tc_frag_data.max_prefix_length)
11205         {
11206           /* No padding if there is no sufficient room.  Clear the
11207              expected address of the padding frag.  */
11208           padding_fragP->tc_frag_data.padding_address = 0;
11209           padding_size = 0;
11210         }
11211       else
11212         /* Store the expected address of the padding frag.  */
11213         padding_fragP->tc_frag_data.padding_address
11214           = (fragP->fr_address + padding_size
11215              + fragP->tc_frag_data.padding_address);
11216
11217       fragP->tc_frag_data.prefix_length = padding_size;
11218
11219       /* Update the length for the current interation.  */
11220       left_size = padding_size;
11221       for (next_fragP = fragP;
11222            next_fragP != padding_fragP;
11223            next_fragP = next_fragP->fr_next)
11224         if (next_fragP->fr_type == rs_machine_dependent
11225             && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11226                 == BRANCH_PREFIX))
11227           {
11228             if (left_size)
11229               {
11230                 int max = next_fragP->tc_frag_data.max_bytes;
11231                 if (max)
11232                   {
11233                     int size;
11234                     if (max > left_size)
11235                       size = left_size;
11236                     else
11237                       size = max;
11238                     left_size -= size;
11239                     next_fragP->tc_frag_data.length = size;
11240                   }
11241               }
11242             else
11243               next_fragP->tc_frag_data.length = 0;
11244           }
11245
11246       return (fragP->tc_frag_data.length
11247               - fragP->tc_frag_data.last_length);
11248     }
11249   return relax_frag (segment, fragP, stretch);
11250 }
11251
11252 /* md_estimate_size_before_relax()
11253
11254    Called just before relax() for rs_machine_dependent frags.  The x86
11255    assembler uses these frags to handle variable size jump
11256    instructions.
11257
11258    Any symbol that is now undefined will not become defined.
11259    Return the correct fr_subtype in the frag.
11260    Return the initial "guess for variable size of frag" to caller.
11261    The guess is actually the growth beyond the fixed part.  Whatever
11262    we do to grow the fixed or variable part contributes to our
11263    returned value.  */
11264
11265 int
11266 md_estimate_size_before_relax (fragS *fragP, segT segment)
11267 {
11268   if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11269       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
11270       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11271     {
11272       i386_classify_machine_dependent_frag (fragP);
11273       return fragP->tc_frag_data.length;
11274     }
11275
11276   /* We've already got fragP->fr_subtype right;  all we have to do is
11277      check for un-relaxable symbols.  On an ELF system, we can't relax
11278      an externally visible symbol, because it may be overridden by a
11279      shared library.  */
11280   if (S_GET_SEGMENT (fragP->fr_symbol) != segment
11281 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11282       || (IS_ELF
11283           && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
11284                                                 fragP->fr_var))
11285 #endif
11286 #if defined (OBJ_COFF) && defined (TE_PE)
11287       || (OUTPUT_FLAVOR == bfd_target_coff_flavour
11288           && S_IS_WEAK (fragP->fr_symbol))
11289 #endif
11290       )
11291     {
11292       /* Symbol is undefined in this segment, or we need to keep a
11293          reloc so that weak symbols can be overridden.  */
11294       int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
11295       enum bfd_reloc_code_real reloc_type;
11296       unsigned char *opcode;
11297       int old_fr_fix;
11298
11299       if (fragP->fr_var != NO_RELOC)
11300         reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
11301       else if (size == 2)
11302         reloc_type = BFD_RELOC_16_PCREL;
11303 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11304       else if (need_plt32_p (fragP->fr_symbol))
11305         reloc_type = BFD_RELOC_X86_64_PLT32;
11306 #endif
11307       else
11308         reloc_type = BFD_RELOC_32_PCREL;
11309
11310       old_fr_fix = fragP->fr_fix;
11311       opcode = (unsigned char *) fragP->fr_opcode;
11312
11313       switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
11314         {
11315         case UNCOND_JUMP:
11316           /* Make jmp (0xeb) a (d)word displacement jump.  */
11317           opcode[0] = 0xe9;
11318           fragP->fr_fix += size;
11319           fix_new (fragP, old_fr_fix, size,
11320                    fragP->fr_symbol,
11321                    fragP->fr_offset, 1,
11322                    reloc_type);
11323           break;
11324
11325         case COND_JUMP86:
11326           if (size == 2
11327               && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
11328             {
11329               /* Negate the condition, and branch past an
11330                  unconditional jump.  */
11331               opcode[0] ^= 1;
11332               opcode[1] = 3;
11333               /* Insert an unconditional jump.  */
11334               opcode[2] = 0xe9;
11335               /* We added two extra opcode bytes, and have a two byte
11336                  offset.  */
11337               fragP->fr_fix += 2 + 2;
11338               fix_new (fragP, old_fr_fix + 2, 2,
11339                        fragP->fr_symbol,
11340                        fragP->fr_offset, 1,
11341                        reloc_type);
11342               break;
11343             }
11344           /* Fall through.  */
11345
11346         case COND_JUMP:
11347           if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
11348             {
11349               fixS *fixP;
11350
11351               fragP->fr_fix += 1;
11352               fixP = fix_new (fragP, old_fr_fix, 1,
11353                               fragP->fr_symbol,
11354                               fragP->fr_offset, 1,
11355                               BFD_RELOC_8_PCREL);
11356               fixP->fx_signed = 1;
11357               break;
11358             }
11359
11360           /* This changes the byte-displacement jump 0x7N
11361              to the (d)word-displacement jump 0x0f,0x8N.  */
11362           opcode[1] = opcode[0] + 0x10;
11363           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11364           /* We've added an opcode byte.  */
11365           fragP->fr_fix += 1 + size;
11366           fix_new (fragP, old_fr_fix + 1, size,
11367                    fragP->fr_symbol,
11368                    fragP->fr_offset, 1,
11369                    reloc_type);
11370           break;
11371
11372         default:
11373           BAD_CASE (fragP->fr_subtype);
11374           break;
11375         }
11376       frag_wane (fragP);
11377       return fragP->fr_fix - old_fr_fix;
11378     }
11379
11380   /* Guess size depending on current relax state.  Initially the relax
11381      state will correspond to a short jump and we return 1, because
11382      the variable part of the frag (the branch offset) is one byte
11383      long.  However, we can relax a section more than once and in that
11384      case we must either set fr_subtype back to the unrelaxed state,
11385      or return the value for the appropriate branch.  */
11386   return md_relax_table[fragP->fr_subtype].rlx_length;
11387 }
11388
11389 /* Called after relax() is finished.
11390
11391    In:  Address of frag.
11392         fr_type == rs_machine_dependent.
11393         fr_subtype is what the address relaxed to.
11394
11395    Out: Any fixSs and constants are set up.
11396         Caller will turn frag into a ".space 0".  */
11397
11398 void
11399 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
11400                  fragS *fragP)
11401 {
11402   unsigned char *opcode;
11403   unsigned char *where_to_put_displacement = NULL;
11404   offsetT target_address;
11405   offsetT opcode_address;
11406   unsigned int extension = 0;
11407   offsetT displacement_from_opcode_start;
11408
11409   if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11410       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
11411       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11412     {
11413       /* Generate nop padding.  */
11414       unsigned int size = fragP->tc_frag_data.length;
11415       if (size)
11416         {
11417           if (size > fragP->tc_frag_data.max_bytes)
11418             abort ();
11419
11420           if (flag_debug)
11421             {
11422               const char *msg;
11423               const char *branch = "branch";
11424               const char *prefix = "";
11425               fragS *padding_fragP;
11426               if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11427                   == BRANCH_PREFIX)
11428                 {
11429                   padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11430                   switch (fragP->tc_frag_data.default_prefix)
11431                     {
11432                     default:
11433                       abort ();
11434                       break;
11435                     case CS_PREFIX_OPCODE:
11436                       prefix = " cs";
11437                       break;
11438                     case DS_PREFIX_OPCODE:
11439                       prefix = " ds";
11440                       break;
11441                     case ES_PREFIX_OPCODE:
11442                       prefix = " es";
11443                       break;
11444                     case FS_PREFIX_OPCODE:
11445                       prefix = " fs";
11446                       break;
11447                     case GS_PREFIX_OPCODE:
11448                       prefix = " gs";
11449                       break;
11450                     case SS_PREFIX_OPCODE:
11451                       prefix = " ss";
11452                       break;
11453                     }
11454                   if (padding_fragP)
11455                     msg = _("%s:%u: add %d%s at 0x%llx to align "
11456                             "%s within %d-byte boundary\n");
11457                   else
11458                     msg = _("%s:%u: add additional %d%s at 0x%llx to "
11459                             "align %s within %d-byte boundary\n");
11460                 }
11461               else
11462                 {
11463                   padding_fragP = fragP;
11464                   msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
11465                           "%s within %d-byte boundary\n");
11466                 }
11467
11468               if (padding_fragP)
11469                 switch (padding_fragP->tc_frag_data.branch_type)
11470                   {
11471                   case align_branch_jcc:
11472                     branch = "jcc";
11473                     break;
11474                   case align_branch_fused:
11475                     branch = "fused jcc";
11476                     break;
11477                   case align_branch_jmp:
11478                     branch = "jmp";
11479                     break;
11480                   case align_branch_call:
11481                     branch = "call";
11482                     break;
11483                   case align_branch_indirect:
11484                     branch = "indiret branch";
11485                     break;
11486                   case align_branch_ret:
11487                     branch = "ret";
11488                     break;
11489                   default:
11490                     break;
11491                   }
11492
11493               fprintf (stdout, msg,
11494                        fragP->fr_file, fragP->fr_line, size, prefix,
11495                        (long long) fragP->fr_address, branch,
11496                        1 << align_branch_power);
11497             }
11498           if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11499             memset (fragP->fr_opcode,
11500                     fragP->tc_frag_data.default_prefix, size);
11501           else
11502             i386_generate_nops (fragP, (char *) fragP->fr_opcode,
11503                                 size, 0);
11504           fragP->fr_fix += size;
11505         }
11506       return;
11507     }
11508
11509   opcode = (unsigned char *) fragP->fr_opcode;
11510
11511   /* Address we want to reach in file space.  */
11512   target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
11513
11514   /* Address opcode resides at in file space.  */
11515   opcode_address = fragP->fr_address + fragP->fr_fix;
11516
11517   /* Displacement from opcode start to fill into instruction.  */
11518   displacement_from_opcode_start = target_address - opcode_address;
11519
11520   if ((fragP->fr_subtype & BIG) == 0)
11521     {
11522       /* Don't have to change opcode.  */
11523       extension = 1;            /* 1 opcode + 1 displacement  */
11524       where_to_put_displacement = &opcode[1];
11525     }
11526   else
11527     {
11528       if (no_cond_jump_promotion
11529           && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
11530         as_warn_where (fragP->fr_file, fragP->fr_line,
11531                        _("long jump required"));
11532
11533       switch (fragP->fr_subtype)
11534         {
11535         case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
11536           extension = 4;                /* 1 opcode + 4 displacement  */
11537           opcode[0] = 0xe9;
11538           where_to_put_displacement = &opcode[1];
11539           break;
11540
11541         case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
11542           extension = 2;                /* 1 opcode + 2 displacement  */
11543           opcode[0] = 0xe9;
11544           where_to_put_displacement = &opcode[1];
11545           break;
11546
11547         case ENCODE_RELAX_STATE (COND_JUMP, BIG):
11548         case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
11549           extension = 5;                /* 2 opcode + 4 displacement  */
11550           opcode[1] = opcode[0] + 0x10;
11551           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11552           where_to_put_displacement = &opcode[2];
11553           break;
11554
11555         case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
11556           extension = 3;                /* 2 opcode + 2 displacement  */
11557           opcode[1] = opcode[0] + 0x10;
11558           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11559           where_to_put_displacement = &opcode[2];
11560           break;
11561
11562         case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
11563           extension = 4;
11564           opcode[0] ^= 1;
11565           opcode[1] = 3;
11566           opcode[2] = 0xe9;
11567           where_to_put_displacement = &opcode[3];
11568           break;
11569
11570         default:
11571           BAD_CASE (fragP->fr_subtype);
11572           break;
11573         }
11574     }
11575
11576   /* If size if less then four we are sure that the operand fits,
11577      but if it's 4, then it could be that the displacement is larger
11578      then -/+ 2GB.  */
11579   if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
11580       && object_64bit
11581       && ((addressT) (displacement_from_opcode_start - extension
11582                       + ((addressT) 1 << 31))
11583           > (((addressT) 2 << 31) - 1)))
11584     {
11585       as_bad_where (fragP->fr_file, fragP->fr_line,
11586                     _("jump target out of range"));
11587       /* Make us emit 0.  */
11588       displacement_from_opcode_start = extension;
11589     }
11590   /* Now put displacement after opcode.  */
11591   md_number_to_chars ((char *) where_to_put_displacement,
11592                       (valueT) (displacement_from_opcode_start - extension),
11593                       DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
11594   fragP->fr_fix += extension;
11595 }
11596 \f
11597 /* Apply a fixup (fixP) to segment data, once it has been determined
11598    by our caller that we have all the info we need to fix it up.
11599
11600    Parameter valP is the pointer to the value of the bits.
11601
11602    On the 386, immediates, displacements, and data pointers are all in
11603    the same (little-endian) format, so we don't need to care about which
11604    we are handling.  */
11605
11606 void
11607 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
11608 {
11609   char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
11610   valueT value = *valP;
11611
11612 #if !defined (TE_Mach)
11613   if (fixP->fx_pcrel)
11614     {
11615       switch (fixP->fx_r_type)
11616         {
11617         default:
11618           break;
11619
11620         case BFD_RELOC_64:
11621           fixP->fx_r_type = BFD_RELOC_64_PCREL;
11622           break;
11623         case BFD_RELOC_32:
11624         case BFD_RELOC_X86_64_32S:
11625           fixP->fx_r_type = BFD_RELOC_32_PCREL;
11626           break;
11627         case BFD_RELOC_16:
11628           fixP->fx_r_type = BFD_RELOC_16_PCREL;
11629           break;
11630         case BFD_RELOC_8:
11631           fixP->fx_r_type = BFD_RELOC_8_PCREL;
11632           break;
11633         }
11634     }
11635
11636   if (fixP->fx_addsy != NULL
11637       && (fixP->fx_r_type == BFD_RELOC_32_PCREL
11638           || fixP->fx_r_type == BFD_RELOC_64_PCREL
11639           || fixP->fx_r_type == BFD_RELOC_16_PCREL
11640           || fixP->fx_r_type == BFD_RELOC_8_PCREL)
11641       && !use_rela_relocations)
11642     {
11643       /* This is a hack.  There should be a better way to handle this.
11644          This covers for the fact that bfd_install_relocation will
11645          subtract the current location (for partial_inplace, PC relative
11646          relocations); see more below.  */
11647 #ifndef OBJ_AOUT
11648       if (IS_ELF
11649 #ifdef TE_PE
11650           || OUTPUT_FLAVOR == bfd_target_coff_flavour
11651 #endif
11652           )
11653         value += fixP->fx_where + fixP->fx_frag->fr_address;
11654 #endif
11655 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11656       if (IS_ELF)
11657         {
11658           segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
11659
11660           if ((sym_seg == seg
11661                || (symbol_section_p (fixP->fx_addsy)
11662                    && sym_seg != absolute_section))
11663               && !generic_force_reloc (fixP))
11664             {
11665               /* Yes, we add the values in twice.  This is because
11666                  bfd_install_relocation subtracts them out again.  I think
11667                  bfd_install_relocation is broken, but I don't dare change
11668                  it.  FIXME.  */
11669               value += fixP->fx_where + fixP->fx_frag->fr_address;
11670             }
11671         }
11672 #endif
11673 #if defined (OBJ_COFF) && defined (TE_PE)
11674       /* For some reason, the PE format does not store a
11675          section address offset for a PC relative symbol.  */
11676       if (S_GET_SEGMENT (fixP->fx_addsy) != seg
11677           || S_IS_WEAK (fixP->fx_addsy))
11678         value += md_pcrel_from (fixP);
11679 #endif
11680     }
11681 #if defined (OBJ_COFF) && defined (TE_PE)
11682   if (fixP->fx_addsy != NULL
11683       && S_IS_WEAK (fixP->fx_addsy)
11684       /* PR 16858: Do not modify weak function references.  */
11685       && ! fixP->fx_pcrel)
11686     {
11687 #if !defined (TE_PEP)
11688       /* For x86 PE weak function symbols are neither PC-relative
11689          nor do they set S_IS_FUNCTION.  So the only reliable way
11690          to detect them is to check the flags of their containing
11691          section.  */
11692       if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
11693           && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
11694         ;
11695       else
11696 #endif
11697       value -= S_GET_VALUE (fixP->fx_addsy);
11698     }
11699 #endif
11700
11701   /* Fix a few things - the dynamic linker expects certain values here,
11702      and we must not disappoint it.  */
11703 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11704   if (IS_ELF && fixP->fx_addsy)
11705     switch (fixP->fx_r_type)
11706       {
11707       case BFD_RELOC_386_PLT32:
11708       case BFD_RELOC_X86_64_PLT32:
11709         /* Make the jump instruction point to the address of the operand.
11710            At runtime we merely add the offset to the actual PLT entry.
11711            NB: Subtract the offset size only for jump instructions.  */
11712         if (fixP->fx_pcrel)
11713           value = -4;
11714         break;
11715
11716       case BFD_RELOC_386_TLS_GD:
11717       case BFD_RELOC_386_TLS_LDM:
11718       case BFD_RELOC_386_TLS_IE_32:
11719       case BFD_RELOC_386_TLS_IE:
11720       case BFD_RELOC_386_TLS_GOTIE:
11721       case BFD_RELOC_386_TLS_GOTDESC:
11722       case BFD_RELOC_X86_64_TLSGD:
11723       case BFD_RELOC_X86_64_TLSLD:
11724       case BFD_RELOC_X86_64_GOTTPOFF:
11725       case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
11726         value = 0; /* Fully resolved at runtime.  No addend.  */
11727         /* Fallthrough */
11728       case BFD_RELOC_386_TLS_LE:
11729       case BFD_RELOC_386_TLS_LDO_32:
11730       case BFD_RELOC_386_TLS_LE_32:
11731       case BFD_RELOC_X86_64_DTPOFF32:
11732       case BFD_RELOC_X86_64_DTPOFF64:
11733       case BFD_RELOC_X86_64_TPOFF32:
11734       case BFD_RELOC_X86_64_TPOFF64:
11735         S_SET_THREAD_LOCAL (fixP->fx_addsy);
11736         break;
11737
11738       case BFD_RELOC_386_TLS_DESC_CALL:
11739       case BFD_RELOC_X86_64_TLSDESC_CALL:
11740         value = 0; /* Fully resolved at runtime.  No addend.  */
11741         S_SET_THREAD_LOCAL (fixP->fx_addsy);
11742         fixP->fx_done = 0;
11743         return;
11744
11745       case BFD_RELOC_VTABLE_INHERIT:
11746       case BFD_RELOC_VTABLE_ENTRY:
11747         fixP->fx_done = 0;
11748         return;
11749
11750       default:
11751         break;
11752       }
11753 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)  */
11754   *valP = value;
11755 #endif /* !defined (TE_Mach)  */
11756
11757   /* Are we finished with this relocation now?  */
11758   if (fixP->fx_addsy == NULL)
11759     fixP->fx_done = 1;
11760 #if defined (OBJ_COFF) && defined (TE_PE)
11761   else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
11762     {
11763       fixP->fx_done = 0;
11764       /* Remember value for tc_gen_reloc.  */
11765       fixP->fx_addnumber = value;
11766       /* Clear out the frag for now.  */
11767       value = 0;
11768     }
11769 #endif
11770   else if (use_rela_relocations)
11771     {
11772       fixP->fx_no_overflow = 1;
11773       /* Remember value for tc_gen_reloc.  */
11774       fixP->fx_addnumber = value;
11775       value = 0;
11776     }
11777
11778   md_number_to_chars (p, value, fixP->fx_size);
11779 }
11780 \f
11781 const char *
11782 md_atof (int type, char *litP, int *sizeP)
11783 {
11784   /* This outputs the LITTLENUMs in REVERSE order;
11785      in accord with the bigendian 386.  */
11786   return ieee_md_atof (type, litP, sizeP, FALSE);
11787 }
11788 \f
11789 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
11790
11791 static char *
11792 output_invalid (int c)
11793 {
11794   if (ISPRINT (c))
11795     snprintf (output_invalid_buf, sizeof (output_invalid_buf),
11796               "'%c'", c);
11797   else
11798     snprintf (output_invalid_buf, sizeof (output_invalid_buf),
11799               "(0x%x)", (unsigned char) c);
11800   return output_invalid_buf;
11801 }
11802
11803 /* REG_STRING starts *before* REGISTER_PREFIX.  */
11804
11805 static const reg_entry *
11806 parse_real_register (char *reg_string, char **end_op)
11807 {
11808   char *s = reg_string;
11809   char *p;
11810   char reg_name_given[MAX_REG_NAME_SIZE + 1];
11811   const reg_entry *r;
11812
11813   /* Skip possible REGISTER_PREFIX and possible whitespace.  */
11814   if (*s == REGISTER_PREFIX)
11815     ++s;
11816
11817   if (is_space_char (*s))
11818     ++s;
11819
11820   p = reg_name_given;
11821   while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
11822     {
11823       if (p >= reg_name_given + MAX_REG_NAME_SIZE)
11824         return (const reg_entry *) NULL;
11825       s++;
11826     }
11827
11828   /* For naked regs, make sure that we are not dealing with an identifier.
11829      This prevents confusing an identifier like `eax_var' with register
11830      `eax'.  */
11831   if (allow_naked_reg && identifier_chars[(unsigned char) *s])
11832     return (const reg_entry *) NULL;
11833
11834   *end_op = s;
11835
11836   r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
11837
11838   /* Handle floating point regs, allowing spaces in the (i) part.  */
11839   if (r == i386_regtab /* %st is first entry of table  */)
11840     {
11841       if (!cpu_arch_flags.bitfield.cpu8087
11842           && !cpu_arch_flags.bitfield.cpu287
11843           && !cpu_arch_flags.bitfield.cpu387)
11844         return (const reg_entry *) NULL;
11845
11846       if (is_space_char (*s))
11847         ++s;
11848       if (*s == '(')
11849         {
11850           ++s;
11851           if (is_space_char (*s))
11852             ++s;
11853           if (*s >= '0' && *s <= '7')
11854             {
11855               int fpr = *s - '0';
11856               ++s;
11857               if (is_space_char (*s))
11858                 ++s;
11859               if (*s == ')')
11860                 {
11861                   *end_op = s + 1;
11862                   r = (const reg_entry *) hash_find (reg_hash, "st(0)");
11863                   know (r);
11864                   return r + fpr;
11865                 }
11866             }
11867           /* We have "%st(" then garbage.  */
11868           return (const reg_entry *) NULL;
11869         }
11870     }
11871
11872   if (r == NULL || allow_pseudo_reg)
11873     return r;
11874
11875   if (operand_type_all_zero (&r->reg_type))
11876     return (const reg_entry *) NULL;
11877
11878   if ((r->reg_type.bitfield.dword
11879        || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
11880        || r->reg_type.bitfield.class == RegCR
11881        || r->reg_type.bitfield.class == RegDR
11882        || r->reg_type.bitfield.class == RegTR)
11883       && !cpu_arch_flags.bitfield.cpui386)
11884     return (const reg_entry *) NULL;
11885
11886   if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
11887     return (const reg_entry *) NULL;
11888
11889   if (!cpu_arch_flags.bitfield.cpuavx512f)
11890     {
11891       if (r->reg_type.bitfield.zmmword
11892           || r->reg_type.bitfield.class == RegMask)
11893         return (const reg_entry *) NULL;
11894
11895       if (!cpu_arch_flags.bitfield.cpuavx)
11896         {
11897           if (r->reg_type.bitfield.ymmword)
11898             return (const reg_entry *) NULL;
11899
11900           if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
11901             return (const reg_entry *) NULL;
11902         }
11903     }
11904
11905   if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
11906     return (const reg_entry *) NULL;
11907
11908   /* Don't allow fake index register unless allow_index_reg isn't 0. */
11909   if (!allow_index_reg && r->reg_num == RegIZ)
11910     return (const reg_entry *) NULL;
11911
11912   /* Upper 16 vector registers are only available with VREX in 64bit
11913      mode, and require EVEX encoding.  */
11914   if (r->reg_flags & RegVRex)
11915     {
11916       if (!cpu_arch_flags.bitfield.cpuavx512f
11917           || flag_code != CODE_64BIT)
11918         return (const reg_entry *) NULL;
11919
11920       i.vec_encoding = vex_encoding_evex;
11921     }
11922
11923   if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
11924       && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
11925       && flag_code != CODE_64BIT)
11926     return (const reg_entry *) NULL;
11927
11928   if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
11929       && !intel_syntax)
11930     return (const reg_entry *) NULL;
11931
11932   return r;
11933 }
11934
11935 /* REG_STRING starts *before* REGISTER_PREFIX.  */
11936
11937 static const reg_entry *
11938 parse_register (char *reg_string, char **end_op)
11939 {
11940   const reg_entry *r;
11941
11942   if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
11943     r = parse_real_register (reg_string, end_op);
11944   else
11945     r = NULL;
11946   if (!r)
11947     {
11948       char *save = input_line_pointer;
11949       char c;
11950       symbolS *symbolP;
11951
11952       input_line_pointer = reg_string;
11953       c = get_symbol_name (&reg_string);
11954       symbolP = symbol_find (reg_string);
11955       if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
11956         {
11957           const expressionS *e = symbol_get_value_expression (symbolP);
11958
11959           know (e->X_op == O_register);
11960           know (e->X_add_number >= 0
11961                 && (valueT) e->X_add_number < i386_regtab_size);
11962           r = i386_regtab + e->X_add_number;
11963           if ((r->reg_flags & RegVRex))
11964             i.vec_encoding = vex_encoding_evex;
11965           *end_op = input_line_pointer;
11966         }
11967       *input_line_pointer = c;
11968       input_line_pointer = save;
11969     }
11970   return r;
11971 }
11972
11973 int
11974 i386_parse_name (char *name, expressionS *e, char *nextcharP)
11975 {
11976   const reg_entry *r;
11977   char *end = input_line_pointer;
11978
11979   *end = *nextcharP;
11980   r = parse_register (name, &input_line_pointer);
11981   if (r && end <= input_line_pointer)
11982     {
11983       *nextcharP = *input_line_pointer;
11984       *input_line_pointer = 0;
11985       e->X_op = O_register;
11986       e->X_add_number = r - i386_regtab;
11987       return 1;
11988     }
11989   input_line_pointer = end;
11990   *end = 0;
11991   return intel_syntax ? i386_intel_parse_name (name, e) : 0;
11992 }
11993
11994 void
11995 md_operand (expressionS *e)
11996 {
11997   char *end;
11998   const reg_entry *r;
11999
12000   switch (*input_line_pointer)
12001     {
12002     case REGISTER_PREFIX:
12003       r = parse_real_register (input_line_pointer, &end);
12004       if (r)
12005         {
12006           e->X_op = O_register;
12007           e->X_add_number = r - i386_regtab;
12008           input_line_pointer = end;
12009         }
12010       break;
12011
12012     case '[':
12013       gas_assert (intel_syntax);
12014       end = input_line_pointer++;
12015       expression (e);
12016       if (*input_line_pointer == ']')
12017         {
12018           ++input_line_pointer;
12019           e->X_op_symbol = make_expr_symbol (e);
12020           e->X_add_symbol = NULL;
12021           e->X_add_number = 0;
12022           e->X_op = O_index;
12023         }
12024       else
12025         {
12026           e->X_op = O_absent;
12027           input_line_pointer = end;
12028         }
12029       break;
12030     }
12031 }
12032
12033 \f
12034 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12035 const char *md_shortopts = "kVQ:sqnO::";
12036 #else
12037 const char *md_shortopts = "qnO::";
12038 #endif
12039
12040 #define OPTION_32 (OPTION_MD_BASE + 0)
12041 #define OPTION_64 (OPTION_MD_BASE + 1)
12042 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
12043 #define OPTION_MARCH (OPTION_MD_BASE + 3)
12044 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
12045 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
12046 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
12047 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
12048 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
12049 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
12050 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
12051 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
12052 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
12053 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
12054 #define OPTION_X32 (OPTION_MD_BASE + 14)
12055 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
12056 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
12057 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
12058 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
12059 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
12060 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
12061 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
12062 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
12063 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
12064 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
12065 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
12066 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
12067 #define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
12068 #define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
12069 #define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
12070 #define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
12071
12072 struct option md_longopts[] =
12073 {
12074   {"32", no_argument, NULL, OPTION_32},
12075 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12076      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12077   {"64", no_argument, NULL, OPTION_64},
12078 #endif
12079 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12080   {"x32", no_argument, NULL, OPTION_X32},
12081   {"mshared", no_argument, NULL, OPTION_MSHARED},
12082   {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
12083 #endif
12084   {"divide", no_argument, NULL, OPTION_DIVIDE},
12085   {"march", required_argument, NULL, OPTION_MARCH},
12086   {"mtune", required_argument, NULL, OPTION_MTUNE},
12087   {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
12088   {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
12089   {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
12090   {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
12091   {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
12092   {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
12093   {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
12094   {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
12095   {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
12096   {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
12097   {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
12098   {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
12099 # if defined (TE_PE) || defined (TE_PEP)
12100   {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
12101 #endif
12102   {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
12103   {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
12104   {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
12105   {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
12106   {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
12107   {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
12108   {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
12109   {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
12110   {"mamd64", no_argument, NULL, OPTION_MAMD64},
12111   {"mintel64", no_argument, NULL, OPTION_MINTEL64},
12112   {NULL, no_argument, NULL, 0}
12113 };
12114 size_t md_longopts_size = sizeof (md_longopts);
12115
12116 int
12117 md_parse_option (int c, const char *arg)
12118 {
12119   unsigned int j;
12120   char *arch, *next, *saved, *type;
12121
12122   switch (c)
12123     {
12124     case 'n':
12125       optimize_align_code = 0;
12126       break;
12127
12128     case 'q':
12129       quiet_warnings = 1;
12130       break;
12131
12132 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12133       /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
12134          should be emitted or not.  FIXME: Not implemented.  */
12135     case 'Q':
12136       if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
12137         return 0;
12138       break;
12139
12140       /* -V: SVR4 argument to print version ID.  */
12141     case 'V':
12142       print_version_id ();
12143       break;
12144
12145       /* -k: Ignore for FreeBSD compatibility.  */
12146     case 'k':
12147       break;
12148
12149     case 's':
12150       /* -s: On i386 Solaris, this tells the native assembler to use
12151          .stab instead of .stab.excl.  We always use .stab anyhow.  */
12152       break;
12153
12154     case OPTION_MSHARED:
12155       shared = 1;
12156       break;
12157
12158     case OPTION_X86_USED_NOTE:
12159       if (strcasecmp (arg, "yes") == 0)
12160         x86_used_note = 1;
12161       else if (strcasecmp (arg, "no") == 0)
12162         x86_used_note = 0;
12163       else
12164         as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
12165       break;
12166
12167
12168 #endif
12169 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12170      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12171     case OPTION_64:
12172       {
12173         const char **list, **l;
12174
12175         list = bfd_target_list ();
12176         for (l = list; *l != NULL; l++)
12177           if (CONST_STRNEQ (*l, "elf64-x86-64")
12178               || strcmp (*l, "coff-x86-64") == 0
12179               || strcmp (*l, "pe-x86-64") == 0
12180               || strcmp (*l, "pei-x86-64") == 0
12181               || strcmp (*l, "mach-o-x86-64") == 0)
12182             {
12183               default_arch = "x86_64";
12184               break;
12185             }
12186         if (*l == NULL)
12187           as_fatal (_("no compiled in support for x86_64"));
12188         free (list);
12189       }
12190       break;
12191 #endif
12192
12193 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12194     case OPTION_X32:
12195       if (IS_ELF)
12196         {
12197           const char **list, **l;
12198
12199           list = bfd_target_list ();
12200           for (l = list; *l != NULL; l++)
12201             if (CONST_STRNEQ (*l, "elf32-x86-64"))
12202               {
12203                 default_arch = "x86_64:32";
12204                 break;
12205               }
12206           if (*l == NULL)
12207             as_fatal (_("no compiled in support for 32bit x86_64"));
12208           free (list);
12209         }
12210       else
12211         as_fatal (_("32bit x86_64 is only supported for ELF"));
12212       break;
12213 #endif
12214
12215     case OPTION_32:
12216       default_arch = "i386";
12217       break;
12218
12219     case OPTION_DIVIDE:
12220 #ifdef SVR4_COMMENT_CHARS
12221       {
12222         char *n, *t;
12223         const char *s;
12224
12225         n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
12226         t = n;
12227         for (s = i386_comment_chars; *s != '\0'; s++)
12228           if (*s != '/')
12229             *t++ = *s;
12230         *t = '\0';
12231         i386_comment_chars = n;
12232       }
12233 #endif
12234       break;
12235
12236     case OPTION_MARCH:
12237       saved = xstrdup (arg);
12238       arch = saved;
12239       /* Allow -march=+nosse.  */
12240       if (*arch == '+')
12241         arch++;
12242       do
12243         {
12244           if (*arch == '.')
12245             as_fatal (_("invalid -march= option: `%s'"), arg);
12246           next = strchr (arch, '+');
12247           if (next)
12248             *next++ = '\0';
12249           for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12250             {
12251               if (strcmp (arch, cpu_arch [j].name) == 0)
12252                 {
12253                   /* Processor.  */
12254                   if (! cpu_arch[j].flags.bitfield.cpui386)
12255                     continue;
12256
12257                   cpu_arch_name = cpu_arch[j].name;
12258                   cpu_sub_arch_name = NULL;
12259                   cpu_arch_flags = cpu_arch[j].flags;
12260                   cpu_arch_isa = cpu_arch[j].type;
12261                   cpu_arch_isa_flags = cpu_arch[j].flags;
12262                   if (!cpu_arch_tune_set)
12263                     {
12264                       cpu_arch_tune = cpu_arch_isa;
12265                       cpu_arch_tune_flags = cpu_arch_isa_flags;
12266                     }
12267                   break;
12268                 }
12269               else if (*cpu_arch [j].name == '.'
12270                        && strcmp (arch, cpu_arch [j].name + 1) == 0)
12271                 {
12272                   /* ISA extension.  */
12273                   i386_cpu_flags flags;
12274
12275                   flags = cpu_flags_or (cpu_arch_flags,
12276                                         cpu_arch[j].flags);
12277
12278                   if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12279                     {
12280                       if (cpu_sub_arch_name)
12281                         {
12282                           char *name = cpu_sub_arch_name;
12283                           cpu_sub_arch_name = concat (name,
12284                                                       cpu_arch[j].name,
12285                                                       (const char *) NULL);
12286                           free (name);
12287                         }
12288                       else
12289                         cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
12290                       cpu_arch_flags = flags;
12291                       cpu_arch_isa_flags = flags;
12292                     }
12293                   else
12294                     cpu_arch_isa_flags
12295                       = cpu_flags_or (cpu_arch_isa_flags,
12296                                       cpu_arch[j].flags);
12297                   break;
12298                 }
12299             }
12300
12301           if (j >= ARRAY_SIZE (cpu_arch))
12302             {
12303               /* Disable an ISA extension.  */
12304               for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
12305                 if (strcmp (arch, cpu_noarch [j].name) == 0)
12306                   {
12307                     i386_cpu_flags flags;
12308
12309                     flags = cpu_flags_and_not (cpu_arch_flags,
12310                                                cpu_noarch[j].flags);
12311                     if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12312                       {
12313                         if (cpu_sub_arch_name)
12314                           {
12315                             char *name = cpu_sub_arch_name;
12316                             cpu_sub_arch_name = concat (arch,
12317                                                         (const char *) NULL);
12318                             free (name);
12319                           }
12320                         else
12321                           cpu_sub_arch_name = xstrdup (arch);
12322                         cpu_arch_flags = flags;
12323                         cpu_arch_isa_flags = flags;
12324                       }
12325                     break;
12326                   }
12327
12328               if (j >= ARRAY_SIZE (cpu_noarch))
12329                 j = ARRAY_SIZE (cpu_arch);
12330             }
12331
12332           if (j >= ARRAY_SIZE (cpu_arch))
12333             as_fatal (_("invalid -march= option: `%s'"), arg);
12334
12335           arch = next;
12336         }
12337       while (next != NULL);
12338       free (saved);
12339       break;
12340
12341     case OPTION_MTUNE:
12342       if (*arg == '.')
12343         as_fatal (_("invalid -mtune= option: `%s'"), arg);
12344       for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12345         {
12346           if (strcmp (arg, cpu_arch [j].name) == 0)
12347             {
12348               cpu_arch_tune_set = 1;
12349               cpu_arch_tune = cpu_arch [j].type;
12350               cpu_arch_tune_flags = cpu_arch[j].flags;
12351               break;
12352             }
12353         }
12354       if (j >= ARRAY_SIZE (cpu_arch))
12355         as_fatal (_("invalid -mtune= option: `%s'"), arg);
12356       break;
12357
12358     case OPTION_MMNEMONIC:
12359       if (strcasecmp (arg, "att") == 0)
12360         intel_mnemonic = 0;
12361       else if (strcasecmp (arg, "intel") == 0)
12362         intel_mnemonic = 1;
12363       else
12364         as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
12365       break;
12366
12367     case OPTION_MSYNTAX:
12368       if (strcasecmp (arg, "att") == 0)
12369         intel_syntax = 0;
12370       else if (strcasecmp (arg, "intel") == 0)
12371         intel_syntax = 1;
12372       else
12373         as_fatal (_("invalid -msyntax= option: `%s'"), arg);
12374       break;
12375
12376     case OPTION_MINDEX_REG:
12377       allow_index_reg = 1;
12378       break;
12379
12380     case OPTION_MNAKED_REG:
12381       allow_naked_reg = 1;
12382       break;
12383
12384     case OPTION_MSSE2AVX:
12385       sse2avx = 1;
12386       break;
12387
12388     case OPTION_MSSE_CHECK:
12389       if (strcasecmp (arg, "error") == 0)
12390         sse_check = check_error;
12391       else if (strcasecmp (arg, "warning") == 0)
12392         sse_check = check_warning;
12393       else if (strcasecmp (arg, "none") == 0)
12394         sse_check = check_none;
12395       else
12396         as_fatal (_("invalid -msse-check= option: `%s'"), arg);
12397       break;
12398
12399     case OPTION_MOPERAND_CHECK:
12400       if (strcasecmp (arg, "error") == 0)
12401         operand_check = check_error;
12402       else if (strcasecmp (arg, "warning") == 0)
12403         operand_check = check_warning;
12404       else if (strcasecmp (arg, "none") == 0)
12405         operand_check = check_none;
12406       else
12407         as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
12408       break;
12409
12410     case OPTION_MAVXSCALAR:
12411       if (strcasecmp (arg, "128") == 0)
12412         avxscalar = vex128;
12413       else if (strcasecmp (arg, "256") == 0)
12414         avxscalar = vex256;
12415       else
12416         as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
12417       break;
12418
12419     case OPTION_MVEXWIG:
12420       if (strcmp (arg, "0") == 0)
12421         vexwig = vexw0;
12422       else if (strcmp (arg, "1") == 0)
12423         vexwig = vexw1;
12424       else
12425         as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
12426       break;
12427
12428     case OPTION_MADD_BND_PREFIX:
12429       add_bnd_prefix = 1;
12430       break;
12431
12432     case OPTION_MEVEXLIG:
12433       if (strcmp (arg, "128") == 0)
12434         evexlig = evexl128;
12435       else if (strcmp (arg, "256") == 0)
12436         evexlig = evexl256;
12437       else  if (strcmp (arg, "512") == 0)
12438         evexlig = evexl512;
12439       else
12440         as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
12441       break;
12442
12443     case OPTION_MEVEXRCIG:
12444       if (strcmp (arg, "rne") == 0)
12445         evexrcig = rne;
12446       else if (strcmp (arg, "rd") == 0)
12447         evexrcig = rd;
12448       else if (strcmp (arg, "ru") == 0)
12449         evexrcig = ru;
12450       else if (strcmp (arg, "rz") == 0)
12451         evexrcig = rz;
12452       else
12453         as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
12454       break;
12455
12456     case OPTION_MEVEXWIG:
12457       if (strcmp (arg, "0") == 0)
12458         evexwig = evexw0;
12459       else if (strcmp (arg, "1") == 0)
12460         evexwig = evexw1;
12461       else
12462         as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
12463       break;
12464
12465 # if defined (TE_PE) || defined (TE_PEP)
12466     case OPTION_MBIG_OBJ:
12467       use_big_obj = 1;
12468       break;
12469 #endif
12470
12471     case OPTION_MOMIT_LOCK_PREFIX:
12472       if (strcasecmp (arg, "yes") == 0)
12473         omit_lock_prefix = 1;
12474       else if (strcasecmp (arg, "no") == 0)
12475         omit_lock_prefix = 0;
12476       else
12477         as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
12478       break;
12479
12480     case OPTION_MFENCE_AS_LOCK_ADD:
12481       if (strcasecmp (arg, "yes") == 0)
12482         avoid_fence = 1;
12483       else if (strcasecmp (arg, "no") == 0)
12484         avoid_fence = 0;
12485       else
12486         as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
12487       break;
12488
12489     case OPTION_MRELAX_RELOCATIONS:
12490       if (strcasecmp (arg, "yes") == 0)
12491         generate_relax_relocations = 1;
12492       else if (strcasecmp (arg, "no") == 0)
12493         generate_relax_relocations = 0;
12494       else
12495         as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
12496       break;
12497
12498     case OPTION_MALIGN_BRANCH_BOUNDARY:
12499       {
12500         char *end;
12501         long int align = strtoul (arg, &end, 0);
12502         if (*end == '\0')
12503           {
12504             if (align == 0)
12505               {
12506                 align_branch_power = 0;
12507                 break;
12508               }
12509             else if (align >= 16)
12510               {
12511                 int align_power;
12512                 for (align_power = 0;
12513                      (align & 1) == 0;
12514                      align >>= 1, align_power++)
12515                   continue;
12516                 /* Limit alignment power to 31.  */
12517                 if (align == 1 && align_power < 32)
12518                   {
12519                     align_branch_power = align_power;
12520                     break;
12521                   }
12522               }
12523           }
12524         as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
12525       }
12526       break;
12527
12528     case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
12529       {
12530         char *end;
12531         int align = strtoul (arg, &end, 0);
12532         /* Some processors only support 5 prefixes.  */
12533         if (*end == '\0' && align >= 0 && align < 6)
12534           {
12535             align_branch_prefix_size = align;
12536             break;
12537           }
12538         as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
12539                   arg);
12540       }
12541       break;
12542
12543     case OPTION_MALIGN_BRANCH:
12544       align_branch = 0;
12545       saved = xstrdup (arg);
12546       type = saved;
12547       do
12548         {
12549           next = strchr (type, '+');
12550           if (next)
12551             *next++ = '\0';
12552           if (strcasecmp (type, "jcc") == 0)
12553             align_branch |= align_branch_jcc_bit;
12554           else if (strcasecmp (type, "fused") == 0)
12555             align_branch |= align_branch_fused_bit;
12556           else if (strcasecmp (type, "jmp") == 0)
12557             align_branch |= align_branch_jmp_bit;
12558           else if (strcasecmp (type, "call") == 0)
12559             align_branch |= align_branch_call_bit;
12560           else if (strcasecmp (type, "ret") == 0)
12561             align_branch |= align_branch_ret_bit;
12562           else if (strcasecmp (type, "indirect") == 0)
12563             align_branch |= align_branch_indirect_bit;
12564           else
12565             as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
12566           type = next;
12567         }
12568       while (next != NULL);
12569       free (saved);
12570       break;
12571
12572     case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
12573       align_branch_power = 5;
12574       align_branch_prefix_size = 5;
12575       align_branch = (align_branch_jcc_bit
12576                       | align_branch_fused_bit
12577                       | align_branch_jmp_bit);
12578       break;
12579
12580     case OPTION_MAMD64:
12581       isa64 = amd64;
12582       break;
12583
12584     case OPTION_MINTEL64:
12585       isa64 = intel64;
12586       break;
12587
12588     case 'O':
12589       if (arg == NULL)
12590         {
12591           optimize = 1;
12592           /* Turn off -Os.  */
12593           optimize_for_space = 0;
12594         }
12595       else if (*arg == 's')
12596         {
12597           optimize_for_space = 1;
12598           /* Turn on all encoding optimizations.  */
12599           optimize = INT_MAX;
12600         }
12601       else
12602         {
12603           optimize = atoi (arg);
12604           /* Turn off -Os.  */
12605           optimize_for_space = 0;
12606         }
12607       break;
12608
12609     default:
12610       return 0;
12611     }
12612   return 1;
12613 }
12614
12615 #define MESSAGE_TEMPLATE \
12616 "                                                                                "
12617
12618 static char *
12619 output_message (FILE *stream, char *p, char *message, char *start,
12620                 int *left_p, const char *name, int len)
12621 {
12622   int size = sizeof (MESSAGE_TEMPLATE);
12623   int left = *left_p;
12624
12625   /* Reserve 2 spaces for ", " or ",\0" */
12626   left -= len + 2;
12627
12628   /* Check if there is any room.  */
12629   if (left >= 0)
12630     {
12631       if (p != start)
12632         {
12633           *p++ = ',';
12634           *p++ = ' ';
12635         }
12636       p = mempcpy (p, name, len);
12637     }
12638   else
12639     {
12640       /* Output the current message now and start a new one.  */
12641       *p++ = ',';
12642       *p = '\0';
12643       fprintf (stream, "%s\n", message);
12644       p = start;
12645       left = size - (start - message) - len - 2;
12646
12647       gas_assert (left >= 0);
12648
12649       p = mempcpy (p, name, len);
12650     }
12651
12652   *left_p = left;
12653   return p;
12654 }
12655
12656 static void
12657 show_arch (FILE *stream, int ext, int check)
12658 {
12659   static char message[] = MESSAGE_TEMPLATE;
12660   char *start = message + 27;
12661   char *p;
12662   int size = sizeof (MESSAGE_TEMPLATE);
12663   int left;
12664   const char *name;
12665   int len;
12666   unsigned int j;
12667
12668   p = start;
12669   left = size - (start - message);
12670   for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12671     {
12672       /* Should it be skipped?  */
12673       if (cpu_arch [j].skip)
12674         continue;
12675
12676       name = cpu_arch [j].name;
12677       len = cpu_arch [j].len;
12678       if (*name == '.')
12679         {
12680           /* It is an extension.  Skip if we aren't asked to show it.  */
12681           if (ext)
12682             {
12683               name++;
12684               len--;
12685             }
12686           else
12687             continue;
12688         }
12689       else if (ext)
12690         {
12691           /* It is an processor.  Skip if we show only extension.  */
12692           continue;
12693         }
12694       else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
12695         {
12696           /* It is an impossible processor - skip.  */
12697           continue;
12698         }
12699
12700       p = output_message (stream, p, message, start, &left, name, len);
12701     }
12702
12703   /* Display disabled extensions.  */
12704   if (ext)
12705     for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
12706       {
12707         name = cpu_noarch [j].name;
12708         len = cpu_noarch [j].len;
12709         p = output_message (stream, p, message, start, &left, name,
12710                             len);
12711       }
12712
12713   *p = '\0';
12714   fprintf (stream, "%s\n", message);
12715 }
12716
12717 void
12718 md_show_usage (FILE *stream)
12719 {
12720 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12721   fprintf (stream, _("\
12722   -Qy, -Qn                ignored\n\
12723   -V                      print assembler version number\n\
12724   -k                      ignored\n"));
12725 #endif
12726   fprintf (stream, _("\
12727   -n                      Do not optimize code alignment\n\
12728   -q                      quieten some warnings\n"));
12729 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12730   fprintf (stream, _("\
12731   -s                      ignored\n"));
12732 #endif
12733 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12734                       || defined (TE_PE) || defined (TE_PEP))
12735   fprintf (stream, _("\
12736   --32/--64/--x32         generate 32bit/64bit/x32 code\n"));
12737 #endif
12738 #ifdef SVR4_COMMENT_CHARS
12739   fprintf (stream, _("\
12740   --divide                do not treat `/' as a comment character\n"));
12741 #else
12742   fprintf (stream, _("\
12743   --divide                ignored\n"));
12744 #endif
12745   fprintf (stream, _("\
12746   -march=CPU[,+EXTENSION...]\n\
12747                           generate code for CPU and EXTENSION, CPU is one of:\n"));
12748   show_arch (stream, 0, 1);
12749   fprintf (stream, _("\
12750                           EXTENSION is combination of:\n"));
12751   show_arch (stream, 1, 0);
12752   fprintf (stream, _("\
12753   -mtune=CPU              optimize for CPU, CPU is one of:\n"));
12754   show_arch (stream, 0, 0);
12755   fprintf (stream, _("\
12756   -msse2avx               encode SSE instructions with VEX prefix\n"));
12757   fprintf (stream, _("\
12758   -msse-check=[none|error|warning] (default: warning)\n\
12759                           check SSE instructions\n"));
12760   fprintf (stream, _("\
12761   -moperand-check=[none|error|warning] (default: warning)\n\
12762                           check operand combinations for validity\n"));
12763   fprintf (stream, _("\
12764   -mavxscalar=[128|256] (default: 128)\n\
12765                           encode scalar AVX instructions with specific vector\n\
12766                            length\n"));
12767   fprintf (stream, _("\
12768   -mvexwig=[0|1] (default: 0)\n\
12769                           encode VEX instructions with specific VEX.W value\n\
12770                            for VEX.W bit ignored instructions\n"));
12771   fprintf (stream, _("\
12772   -mevexlig=[128|256|512] (default: 128)\n\
12773                           encode scalar EVEX instructions with specific vector\n\
12774                            length\n"));
12775   fprintf (stream, _("\
12776   -mevexwig=[0|1] (default: 0)\n\
12777                           encode EVEX instructions with specific EVEX.W value\n\
12778                            for EVEX.W bit ignored instructions\n"));
12779   fprintf (stream, _("\
12780   -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
12781                           encode EVEX instructions with specific EVEX.RC value\n\
12782                            for SAE-only ignored instructions\n"));
12783   fprintf (stream, _("\
12784   -mmnemonic=[att|intel] "));
12785   if (SYSV386_COMPAT)
12786     fprintf (stream, _("(default: att)\n"));
12787   else
12788     fprintf (stream, _("(default: intel)\n"));
12789   fprintf (stream, _("\
12790                           use AT&T/Intel mnemonic\n"));
12791   fprintf (stream, _("\
12792   -msyntax=[att|intel] (default: att)\n\
12793                           use AT&T/Intel syntax\n"));
12794   fprintf (stream, _("\
12795   -mindex-reg             support pseudo index registers\n"));
12796   fprintf (stream, _("\
12797   -mnaked-reg             don't require `%%' prefix for registers\n"));
12798   fprintf (stream, _("\
12799   -madd-bnd-prefix        add BND prefix for all valid branches\n"));
12800 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12801   fprintf (stream, _("\
12802   -mshared                disable branch optimization for shared code\n"));
12803   fprintf (stream, _("\
12804   -mx86-used-note=[no|yes] "));
12805   if (DEFAULT_X86_USED_NOTE)
12806     fprintf (stream, _("(default: yes)\n"));
12807   else
12808     fprintf (stream, _("(default: no)\n"));
12809   fprintf (stream, _("\
12810                           generate x86 used ISA and feature properties\n"));
12811 #endif
12812 #if defined (TE_PE) || defined (TE_PEP)
12813   fprintf (stream, _("\
12814   -mbig-obj               generate big object files\n"));
12815 #endif
12816   fprintf (stream, _("\
12817   -momit-lock-prefix=[no|yes] (default: no)\n\
12818                           strip all lock prefixes\n"));
12819   fprintf (stream, _("\
12820   -mfence-as-lock-add=[no|yes] (default: no)\n\
12821                           encode lfence, mfence and sfence as\n\
12822                            lock addl $0x0, (%%{re}sp)\n"));
12823   fprintf (stream, _("\
12824   -mrelax-relocations=[no|yes] "));
12825   if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
12826     fprintf (stream, _("(default: yes)\n"));
12827   else
12828     fprintf (stream, _("(default: no)\n"));
12829   fprintf (stream, _("\
12830                           generate relax relocations\n"));
12831   fprintf (stream, _("\
12832   -malign-branch-boundary=NUM (default: 0)\n\
12833                           align branches within NUM byte boundary\n"));
12834   fprintf (stream, _("\
12835   -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
12836                           TYPE is combination of jcc, fused, jmp, call, ret,\n\
12837                            indirect\n\
12838                           specify types of branches to align\n"));
12839   fprintf (stream, _("\
12840   -malign-branch-prefix-size=NUM (default: 5)\n\
12841                           align branches with NUM prefixes per instruction\n"));
12842   fprintf (stream, _("\
12843   -mbranches-within-32B-boundaries\n\
12844                           align branches within 32 byte boundary\n"));
12845   fprintf (stream, _("\
12846   -mamd64                 accept only AMD64 ISA [default]\n"));
12847   fprintf (stream, _("\
12848   -mintel64               accept only Intel64 ISA\n"));
12849 }
12850
12851 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
12852      || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12853      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12854
12855 /* Pick the target format to use.  */
12856
12857 const char *
12858 i386_target_format (void)
12859 {
12860   if (!strncmp (default_arch, "x86_64", 6))
12861     {
12862       update_code_flag (CODE_64BIT, 1);
12863       if (default_arch[6] == '\0')
12864         x86_elf_abi = X86_64_ABI;
12865       else
12866         x86_elf_abi = X86_64_X32_ABI;
12867     }
12868   else if (!strcmp (default_arch, "i386"))
12869     update_code_flag (CODE_32BIT, 1);
12870   else if (!strcmp (default_arch, "iamcu"))
12871     {
12872       update_code_flag (CODE_32BIT, 1);
12873       if (cpu_arch_isa == PROCESSOR_UNKNOWN)
12874         {
12875           static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
12876           cpu_arch_name = "iamcu";
12877           cpu_sub_arch_name = NULL;
12878           cpu_arch_flags = iamcu_flags;
12879           cpu_arch_isa = PROCESSOR_IAMCU;
12880           cpu_arch_isa_flags = iamcu_flags;
12881           if (!cpu_arch_tune_set)
12882             {
12883               cpu_arch_tune = cpu_arch_isa;
12884               cpu_arch_tune_flags = cpu_arch_isa_flags;
12885             }
12886         }
12887       else if (cpu_arch_isa != PROCESSOR_IAMCU)
12888         as_fatal (_("Intel MCU doesn't support `%s' architecture"),
12889                   cpu_arch_name);
12890     }
12891   else
12892     as_fatal (_("unknown architecture"));
12893
12894   if (cpu_flags_all_zero (&cpu_arch_isa_flags))
12895     cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
12896   if (cpu_flags_all_zero (&cpu_arch_tune_flags))
12897     cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
12898
12899   switch (OUTPUT_FLAVOR)
12900     {
12901 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
12902     case bfd_target_aout_flavour:
12903       return AOUT_TARGET_FORMAT;
12904 #endif
12905 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
12906 # if defined (TE_PE) || defined (TE_PEP)
12907     case bfd_target_coff_flavour:
12908       if (flag_code == CODE_64BIT)
12909         return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
12910       else
12911         return "pe-i386";
12912 # elif defined (TE_GO32)
12913     case bfd_target_coff_flavour:
12914       return "coff-go32";
12915 # else
12916     case bfd_target_coff_flavour:
12917       return "coff-i386";
12918 # endif
12919 #endif
12920 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
12921     case bfd_target_elf_flavour:
12922       {
12923         const char *format;
12924
12925         switch (x86_elf_abi)
12926           {
12927           default:
12928             format = ELF_TARGET_FORMAT;
12929 #ifndef TE_SOLARIS
12930             tls_get_addr = "___tls_get_addr";
12931 #endif
12932             break;
12933           case X86_64_ABI:
12934             use_rela_relocations = 1;
12935             object_64bit = 1;
12936 #ifndef TE_SOLARIS
12937             tls_get_addr = "__tls_get_addr";
12938 #endif
12939             format = ELF_TARGET_FORMAT64;
12940             break;
12941           case X86_64_X32_ABI:
12942             use_rela_relocations = 1;
12943             object_64bit = 1;
12944 #ifndef TE_SOLARIS
12945             tls_get_addr = "__tls_get_addr";
12946 #endif
12947             disallow_64bit_reloc = 1;
12948             format = ELF_TARGET_FORMAT32;
12949             break;
12950           }
12951         if (cpu_arch_isa == PROCESSOR_L1OM)
12952           {
12953             if (x86_elf_abi != X86_64_ABI)
12954               as_fatal (_("Intel L1OM is 64bit only"));
12955             return ELF_TARGET_L1OM_FORMAT;
12956           }
12957         else if (cpu_arch_isa == PROCESSOR_K1OM)
12958           {
12959             if (x86_elf_abi != X86_64_ABI)
12960               as_fatal (_("Intel K1OM is 64bit only"));
12961             return ELF_TARGET_K1OM_FORMAT;
12962           }
12963         else if (cpu_arch_isa == PROCESSOR_IAMCU)
12964           {
12965             if (x86_elf_abi != I386_ABI)
12966               as_fatal (_("Intel MCU is 32bit only"));
12967             return ELF_TARGET_IAMCU_FORMAT;
12968           }
12969         else
12970           return format;
12971       }
12972 #endif
12973 #if defined (OBJ_MACH_O)
12974     case bfd_target_mach_o_flavour:
12975       if (flag_code == CODE_64BIT)
12976         {
12977           use_rela_relocations = 1;
12978           object_64bit = 1;
12979           return "mach-o-x86-64";
12980         }
12981       else
12982         return "mach-o-i386";
12983 #endif
12984     default:
12985       abort ();
12986       return NULL;
12987     }
12988 }
12989
12990 #endif /* OBJ_MAYBE_ more than one  */
12991 \f
12992 symbolS *
12993 md_undefined_symbol (char *name)
12994 {
12995   if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
12996       && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
12997       && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
12998       && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
12999     {
13000       if (!GOT_symbol)
13001         {
13002           if (symbol_find (name))
13003             as_bad (_("GOT already in symbol table"));
13004           GOT_symbol = symbol_new (name, undefined_section,
13005                                    (valueT) 0, &zero_address_frag);
13006         };
13007       return GOT_symbol;
13008     }
13009   return 0;
13010 }
13011
13012 /* Round up a section size to the appropriate boundary.  */
13013
13014 valueT
13015 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
13016 {
13017 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
13018   if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
13019     {
13020       /* For a.out, force the section size to be aligned.  If we don't do
13021          this, BFD will align it for us, but it will not write out the
13022          final bytes of the section.  This may be a bug in BFD, but it is
13023          easier to fix it here since that is how the other a.out targets
13024          work.  */
13025       int align;
13026
13027       align = bfd_section_alignment (segment);
13028       size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
13029     }
13030 #endif
13031
13032   return size;
13033 }
13034
13035 /* On the i386, PC-relative offsets are relative to the start of the
13036    next instruction.  That is, the address of the offset, plus its
13037    size, since the offset is always the last part of the insn.  */
13038
13039 long
13040 md_pcrel_from (fixS *fixP)
13041 {
13042   return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
13043 }
13044
13045 #ifndef I386COFF
13046
13047 static void
13048 s_bss (int ignore ATTRIBUTE_UNUSED)
13049 {
13050   int temp;
13051
13052 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13053   if (IS_ELF)
13054     obj_elf_section_change_hook ();
13055 #endif
13056   temp = get_absolute_expression ();
13057   subseg_set (bss_section, (subsegT) temp);
13058   demand_empty_rest_of_line ();
13059 }
13060
13061 #endif
13062
13063 /* Remember constant directive.  */
13064
13065 void
13066 i386_cons_align (int ignore ATTRIBUTE_UNUSED)
13067 {
13068   if (last_insn.kind != last_insn_directive
13069       && (bfd_section_flags (now_seg) & SEC_CODE))
13070     {
13071       last_insn.seg = now_seg;
13072       last_insn.kind = last_insn_directive;
13073       last_insn.name = "constant directive";
13074       last_insn.file = as_where (&last_insn.line);
13075     }
13076 }
13077
13078 void
13079 i386_validate_fix (fixS *fixp)
13080 {
13081   if (fixp->fx_subsy)
13082     {
13083       if (fixp->fx_subsy == GOT_symbol)
13084         {
13085           if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
13086             {
13087               if (!object_64bit)
13088                 abort ();
13089 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13090               if (fixp->fx_tcbit2)
13091                 fixp->fx_r_type = (fixp->fx_tcbit
13092                                    ? BFD_RELOC_X86_64_REX_GOTPCRELX
13093                                    : BFD_RELOC_X86_64_GOTPCRELX);
13094               else
13095 #endif
13096                 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
13097             }
13098           else
13099             {
13100               if (!object_64bit)
13101                 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
13102               else
13103                 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
13104             }
13105           fixp->fx_subsy = 0;
13106         }
13107     }
13108 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13109   else if (!object_64bit)
13110     {
13111       if (fixp->fx_r_type == BFD_RELOC_386_GOT32
13112           && fixp->fx_tcbit2)
13113         fixp->fx_r_type = BFD_RELOC_386_GOT32X;
13114     }
13115 #endif
13116 }
13117
13118 arelent *
13119 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
13120 {
13121   arelent *rel;
13122   bfd_reloc_code_real_type code;
13123
13124   switch (fixp->fx_r_type)
13125     {
13126 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13127     case BFD_RELOC_SIZE32:
13128     case BFD_RELOC_SIZE64:
13129       if (S_IS_DEFINED (fixp->fx_addsy)
13130           && !S_IS_EXTERNAL (fixp->fx_addsy))
13131         {
13132           /* Resolve size relocation against local symbol to size of
13133              the symbol plus addend.  */
13134           valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
13135           if (fixp->fx_r_type == BFD_RELOC_SIZE32
13136               && !fits_in_unsigned_long (value))
13137             as_bad_where (fixp->fx_file, fixp->fx_line,
13138                           _("symbol size computation overflow"));
13139           fixp->fx_addsy = NULL;
13140           fixp->fx_subsy = NULL;
13141           md_apply_fix (fixp, (valueT *) &value, NULL);
13142           return NULL;
13143         }
13144 #endif
13145       /* Fall through.  */
13146
13147     case BFD_RELOC_X86_64_PLT32:
13148     case BFD_RELOC_X86_64_GOT32:
13149     case BFD_RELOC_X86_64_GOTPCREL:
13150     case BFD_RELOC_X86_64_GOTPCRELX:
13151     case BFD_RELOC_X86_64_REX_GOTPCRELX:
13152     case BFD_RELOC_386_PLT32:
13153     case BFD_RELOC_386_GOT32:
13154     case BFD_RELOC_386_GOT32X:
13155     case BFD_RELOC_386_GOTOFF:
13156     case BFD_RELOC_386_GOTPC:
13157     case BFD_RELOC_386_TLS_GD:
13158     case BFD_RELOC_386_TLS_LDM:
13159     case BFD_RELOC_386_TLS_LDO_32:
13160     case BFD_RELOC_386_TLS_IE_32:
13161     case BFD_RELOC_386_TLS_IE:
13162     case BFD_RELOC_386_TLS_GOTIE:
13163     case BFD_RELOC_386_TLS_LE_32:
13164     case BFD_RELOC_386_TLS_LE:
13165     case BFD_RELOC_386_TLS_GOTDESC:
13166     case BFD_RELOC_386_TLS_DESC_CALL:
13167     case BFD_RELOC_X86_64_TLSGD:
13168     case BFD_RELOC_X86_64_TLSLD:
13169     case BFD_RELOC_X86_64_DTPOFF32:
13170     case BFD_RELOC_X86_64_DTPOFF64:
13171     case BFD_RELOC_X86_64_GOTTPOFF:
13172     case BFD_RELOC_X86_64_TPOFF32:
13173     case BFD_RELOC_X86_64_TPOFF64:
13174     case BFD_RELOC_X86_64_GOTOFF64:
13175     case BFD_RELOC_X86_64_GOTPC32:
13176     case BFD_RELOC_X86_64_GOT64:
13177     case BFD_RELOC_X86_64_GOTPCREL64:
13178     case BFD_RELOC_X86_64_GOTPC64:
13179     case BFD_RELOC_X86_64_GOTPLT64:
13180     case BFD_RELOC_X86_64_PLTOFF64:
13181     case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13182     case BFD_RELOC_X86_64_TLSDESC_CALL:
13183     case BFD_RELOC_RVA:
13184     case BFD_RELOC_VTABLE_ENTRY:
13185     case BFD_RELOC_VTABLE_INHERIT:
13186 #ifdef TE_PE
13187     case BFD_RELOC_32_SECREL:
13188 #endif
13189       code = fixp->fx_r_type;
13190       break;
13191     case BFD_RELOC_X86_64_32S:
13192       if (!fixp->fx_pcrel)
13193         {
13194           /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32.  */
13195           code = fixp->fx_r_type;
13196           break;
13197         }
13198       /* Fall through.  */
13199     default:
13200       if (fixp->fx_pcrel)
13201         {
13202           switch (fixp->fx_size)
13203             {
13204             default:
13205               as_bad_where (fixp->fx_file, fixp->fx_line,
13206                             _("can not do %d byte pc-relative relocation"),
13207                             fixp->fx_size);
13208               code = BFD_RELOC_32_PCREL;
13209               break;
13210             case 1: code = BFD_RELOC_8_PCREL;  break;
13211             case 2: code = BFD_RELOC_16_PCREL; break;
13212             case 4: code = BFD_RELOC_32_PCREL; break;
13213 #ifdef BFD64
13214             case 8: code = BFD_RELOC_64_PCREL; break;
13215 #endif
13216             }
13217         }
13218       else
13219         {
13220           switch (fixp->fx_size)
13221             {
13222             default:
13223               as_bad_where (fixp->fx_file, fixp->fx_line,
13224                             _("can not do %d byte relocation"),
13225                             fixp->fx_size);
13226               code = BFD_RELOC_32;
13227               break;
13228             case 1: code = BFD_RELOC_8;  break;
13229             case 2: code = BFD_RELOC_16; break;
13230             case 4: code = BFD_RELOC_32; break;
13231 #ifdef BFD64
13232             case 8: code = BFD_RELOC_64; break;
13233 #endif
13234             }
13235         }
13236       break;
13237     }
13238
13239   if ((code == BFD_RELOC_32
13240        || code == BFD_RELOC_32_PCREL
13241        || code == BFD_RELOC_X86_64_32S)
13242       && GOT_symbol
13243       && fixp->fx_addsy == GOT_symbol)
13244     {
13245       if (!object_64bit)
13246         code = BFD_RELOC_386_GOTPC;
13247       else
13248         code = BFD_RELOC_X86_64_GOTPC32;
13249     }
13250   if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
13251       && GOT_symbol
13252       && fixp->fx_addsy == GOT_symbol)
13253     {
13254       code = BFD_RELOC_X86_64_GOTPC64;
13255     }
13256
13257   rel = XNEW (arelent);
13258   rel->sym_ptr_ptr = XNEW (asymbol *);
13259   *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
13260
13261   rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
13262
13263   if (!use_rela_relocations)
13264     {
13265       /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
13266          vtable entry to be used in the relocation's section offset.  */
13267       if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
13268         rel->address = fixp->fx_offset;
13269 #if defined (OBJ_COFF) && defined (TE_PE)
13270       else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
13271         rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
13272       else
13273 #endif
13274       rel->addend = 0;
13275     }
13276   /* Use the rela in 64bit mode.  */
13277   else
13278     {
13279       if (disallow_64bit_reloc)
13280         switch (code)
13281           {
13282           case BFD_RELOC_X86_64_DTPOFF64:
13283           case BFD_RELOC_X86_64_TPOFF64:
13284           case BFD_RELOC_64_PCREL:
13285           case BFD_RELOC_X86_64_GOTOFF64:
13286           case BFD_RELOC_X86_64_GOT64:
13287           case BFD_RELOC_X86_64_GOTPCREL64:
13288           case BFD_RELOC_X86_64_GOTPC64:
13289           case BFD_RELOC_X86_64_GOTPLT64:
13290           case BFD_RELOC_X86_64_PLTOFF64:
13291             as_bad_where (fixp->fx_file, fixp->fx_line,
13292                           _("cannot represent relocation type %s in x32 mode"),
13293                           bfd_get_reloc_code_name (code));
13294             break;
13295           default:
13296             break;
13297           }
13298
13299       if (!fixp->fx_pcrel)
13300         rel->addend = fixp->fx_offset;
13301       else
13302         switch (code)
13303           {
13304           case BFD_RELOC_X86_64_PLT32:
13305           case BFD_RELOC_X86_64_GOT32:
13306           case BFD_RELOC_X86_64_GOTPCREL:
13307           case BFD_RELOC_X86_64_GOTPCRELX:
13308           case BFD_RELOC_X86_64_REX_GOTPCRELX:
13309           case BFD_RELOC_X86_64_TLSGD:
13310           case BFD_RELOC_X86_64_TLSLD:
13311           case BFD_RELOC_X86_64_GOTTPOFF:
13312           case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13313           case BFD_RELOC_X86_64_TLSDESC_CALL:
13314             rel->addend = fixp->fx_offset - fixp->fx_size;
13315             break;
13316           default:
13317             rel->addend = (section->vma
13318                            - fixp->fx_size
13319                            + fixp->fx_addnumber
13320                            + md_pcrel_from (fixp));
13321             break;
13322           }
13323     }
13324
13325   rel->howto = bfd_reloc_type_lookup (stdoutput, code);
13326   if (rel->howto == NULL)
13327     {
13328       as_bad_where (fixp->fx_file, fixp->fx_line,
13329                     _("cannot represent relocation type %s"),
13330                     bfd_get_reloc_code_name (code));
13331       /* Set howto to a garbage value so that we can keep going.  */
13332       rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
13333       gas_assert (rel->howto != NULL);
13334     }
13335
13336   return rel;
13337 }
13338
13339 #include "tc-i386-intel.c"
13340
13341 void
13342 tc_x86_parse_to_dw2regnum (expressionS *exp)
13343 {
13344   int saved_naked_reg;
13345   char saved_register_dot;
13346
13347   saved_naked_reg = allow_naked_reg;
13348   allow_naked_reg = 1;
13349   saved_register_dot = register_chars['.'];
13350   register_chars['.'] = '.';
13351   allow_pseudo_reg = 1;
13352   expression_and_evaluate (exp);
13353   allow_pseudo_reg = 0;
13354   register_chars['.'] = saved_register_dot;
13355   allow_naked_reg = saved_naked_reg;
13356
13357   if (exp->X_op == O_register && exp->X_add_number >= 0)
13358     {
13359       if ((addressT) exp->X_add_number < i386_regtab_size)
13360         {
13361           exp->X_op = O_constant;
13362           exp->X_add_number = i386_regtab[exp->X_add_number]
13363                               .dw2_regnum[flag_code >> 1];
13364         }
13365       else
13366         exp->X_op = O_illegal;
13367     }
13368 }
13369
13370 void
13371 tc_x86_frame_initial_instructions (void)
13372 {
13373   static unsigned int sp_regno[2];
13374
13375   if (!sp_regno[flag_code >> 1])
13376     {
13377       char *saved_input = input_line_pointer;
13378       char sp[][4] = {"esp", "rsp"};
13379       expressionS exp;
13380
13381       input_line_pointer = sp[flag_code >> 1];
13382       tc_x86_parse_to_dw2regnum (&exp);
13383       gas_assert (exp.X_op == O_constant);
13384       sp_regno[flag_code >> 1] = exp.X_add_number;
13385       input_line_pointer = saved_input;
13386     }
13387
13388   cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
13389   cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
13390 }
13391
13392 int
13393 x86_dwarf2_addr_size (void)
13394 {
13395 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
13396   if (x86_elf_abi == X86_64_X32_ABI)
13397     return 4;
13398 #endif
13399   return bfd_arch_bits_per_address (stdoutput) / 8;
13400 }
13401
13402 int
13403 i386_elf_section_type (const char *str, size_t len)
13404 {
13405   if (flag_code == CODE_64BIT
13406       && len == sizeof ("unwind") - 1
13407       && strncmp (str, "unwind", 6) == 0)
13408     return SHT_X86_64_UNWIND;
13409
13410   return -1;
13411 }
13412
13413 #ifdef TE_SOLARIS
13414 void
13415 i386_solaris_fix_up_eh_frame (segT sec)
13416 {
13417   if (flag_code == CODE_64BIT)
13418     elf_section_type (sec) = SHT_X86_64_UNWIND;
13419 }
13420 #endif
13421
13422 #ifdef TE_PE
13423 void
13424 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
13425 {
13426   expressionS exp;
13427
13428   exp.X_op = O_secrel;
13429   exp.X_add_symbol = symbol;
13430   exp.X_add_number = 0;
13431   emit_expr (&exp, size);
13432 }
13433 #endif
13434
13435 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13436 /* For ELF on x86-64, add support for SHF_X86_64_LARGE.  */
13437
13438 bfd_vma
13439 x86_64_section_letter (int letter, const char **ptr_msg)
13440 {
13441   if (flag_code == CODE_64BIT)
13442     {
13443       if (letter == 'l')
13444         return SHF_X86_64_LARGE;
13445
13446       *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
13447     }
13448   else
13449     *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
13450   return -1;
13451 }
13452
13453 bfd_vma
13454 x86_64_section_word (char *str, size_t len)
13455 {
13456   if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
13457     return SHF_X86_64_LARGE;
13458
13459   return -1;
13460 }
13461
13462 static void
13463 handle_large_common (int small ATTRIBUTE_UNUSED)
13464 {
13465   if (flag_code != CODE_64BIT)
13466     {
13467       s_comm_internal (0, elf_common_parse);
13468       as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
13469     }
13470   else
13471     {
13472       static segT lbss_section;
13473       asection *saved_com_section_ptr = elf_com_section_ptr;
13474       asection *saved_bss_section = bss_section;
13475
13476       if (lbss_section == NULL)
13477         {
13478           flagword applicable;
13479           segT seg = now_seg;
13480           subsegT subseg = now_subseg;
13481
13482           /* The .lbss section is for local .largecomm symbols.  */
13483           lbss_section = subseg_new (".lbss", 0);
13484           applicable = bfd_applicable_section_flags (stdoutput);
13485           bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
13486           seg_info (lbss_section)->bss = 1;
13487
13488           subseg_set (seg, subseg);
13489         }
13490
13491       elf_com_section_ptr = &_bfd_elf_large_com_section;
13492       bss_section = lbss_section;
13493
13494       s_comm_internal (0, elf_common_parse);
13495
13496       elf_com_section_ptr = saved_com_section_ptr;
13497       bss_section = saved_bss_section;
13498     }
13499 }
13500 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */