gas/config/tc-i386.c

   1 /* tc-i386.c -- Assemble code for the Intel 80386
   2    Copyright (C) 1989-2020 Free Software Foundation, Inc.
   3
   4    This file is part of GAS, the GNU Assembler.
   5
   6    GAS is free software; you can redistribute it and/or modify
   7    it under the terms of the GNU General Public License as published by
   8    the Free Software Foundation; either version 3, or (at your option)
   9    any later version.
  10
  11    GAS is distributed in the hope that it will be useful,
  12    but WITHOUT ANY WARRANTY; without even the implied warranty of
  13    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  14    GNU General Public License for more details.
  15
  16    You should have received a copy of the GNU General Public License
  17    along with GAS; see the file COPYING.  If not, write to the Free
  18    Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
  19    02110-1301, USA.  */
  20
  21 /* Intel 80386 machine specific gas.
  22    Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
  23    x86_64 support by Jan Hubicka (jh@suse.cz)
  24    VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
  25    Bugs & suggestions are completely welcome.  This is free software.
  26    Please help us make it better.  */
  27
  28 #include "as.h"
  29 #include "safe-ctype.h"
  30 #include "subsegs.h"
  31 #include "dwarf2dbg.h"
  32 #include "dw2gencfi.h"
  33 #include "elf/x86-64.h"
  34 #include "opcodes/i386-init.h"
  35
  36 #ifdef HAVE_LIMITS_H
  37 #include <limits.h>
  38 #else
  39 #ifdef HAVE_SYS_PARAM_H
  40 #include <sys/param.h>
  41 #endif
  42 #ifndef INT_MAX
  43 #define INT_MAX (int) (((unsigned) (-1)) >> 1)
  44 #endif
  45 #endif
  46
  47 #ifndef REGISTER_WARNINGS
  48 #define REGISTER_WARNINGS 1
  49 #endif
  50
  51 #ifndef INFER_ADDR_PREFIX
  52 #define INFER_ADDR_PREFIX 1
  53 #endif
  54
  55 #ifndef DEFAULT_ARCH
  56 #define DEFAULT_ARCH "i386"
  57 #endif
  58
  59 #ifndef INLINE
  60 #if __GNUC__ >= 2
  61 #define INLINE __inline__
  62 #else
  63 #define INLINE
  64 #endif
  65 #endif
  66
  67 /* Prefixes will be emitted in the order defined below.
  68    WAIT_PREFIX must be the first prefix since FWAIT is really is an
  69    instruction, and so must come before any prefixes.
  70    The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
  71    REP_PREFIX/HLE_PREFIX, LOCK_PREFIX.  */
  72 #define WAIT_PREFIX     0
  73 #define SEG_PREFIX      1
  74 #define ADDR_PREFIX     2
  75 #define DATA_PREFIX     3
  76 #define REP_PREFIX      4
  77 #define HLE_PREFIX      REP_PREFIX
  78 #define BND_PREFIX      REP_PREFIX
  79 #define LOCK_PREFIX     5
  80 #define REX_PREFIX      6       /* must come last.  */
  81 #define MAX_PREFIXES    7       /* max prefixes per opcode */
  82
  83 /* we define the syntax here (modulo base,index,scale syntax) */
  84 #define REGISTER_PREFIX '%'
  85 #define IMMEDIATE_PREFIX '$'
  86 #define ABSOLUTE_PREFIX '*'
  87
  88 /* these are the instruction mnemonic suffixes in AT&T syntax or
  89    memory operand size in Intel syntax.  */
  90 #define WORD_MNEM_SUFFIX  'w'
  91 #define BYTE_MNEM_SUFFIX  'b'
  92 #define SHORT_MNEM_SUFFIX 's'
  93 #define LONG_MNEM_SUFFIX  'l'
  94 #define QWORD_MNEM_SUFFIX  'q'
  95 /* Intel Syntax.  Use a non-ascii letter since since it never appears
  96    in instructions.  */
  97 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
  98
  99 #define END_OF_INSN '\0'
 100
 101 /* This matches the C -> StaticRounding alias in the opcode table.  */
 102 #define commutative staticrounding
 103
 104 /*
 105   'templates' is for grouping together 'template' structures for opcodes
 106   of the same name.  This is only used for storing the insns in the grand
 107   ole hash table of insns.
 108   The templates themselves start at START and range up to (but not including)
 109   END.
 110   */
 111 typedef struct
 112 {
 113   const insn_template *start;
 114   const insn_template *end;
 115 }
 116 templates;
 117
 118 /* 386 operand encoding bytes:  see 386 book for details of this.  */
 119 typedef struct
 120 {
 121   unsigned int regmem;  /* codes register or memory operand */
 122   unsigned int reg;     /* codes register operand (or extended opcode) */
 123   unsigned int mode;    /* how to interpret regmem & reg */
 124 }
 125 modrm_byte;
 126
 127 /* x86-64 extension prefix.  */
 128 typedef int rex_byte;
 129
 130 /* 386 opcode byte to code indirect addressing.  */
 131 typedef struct
 132 {
 133   unsigned base;
 134   unsigned index;
 135   unsigned scale;
 136 }
 137 sib_byte;
 138
 139 /* x86 arch names, types and features */
 140 typedef struct
 141 {
 142   const char *name;             /* arch name */
 143   unsigned int len;             /* arch string length */
 144   enum processor_type type;     /* arch type */
 145   i386_cpu_flags flags;         /* cpu feature flags */
 146   unsigned int skip;            /* show_arch should skip this. */
 147 }
 148 arch_entry;
 149
 150 /* Used to turn off indicated flags.  */
 151 typedef struct
 152 {
 153   const char *name;             /* arch name */
 154   unsigned int len;             /* arch string length */
 155   i386_cpu_flags flags;         /* cpu feature flags */
 156 }
 157 noarch_entry;
 158
 159 static void update_code_flag (int, int);
 160 static void set_code_flag (int);
 161 static void set_16bit_gcc_code_flag (int);
 162 static void set_intel_syntax (int);
 163 static void set_intel_mnemonic (int);
 164 static void set_allow_index_reg (int);
 165 static void set_check (int);
 166 static void set_cpu_arch (int);
 167 #ifdef TE_PE
 168 static void pe_directive_secrel (int);
 169 #endif
 170 static void signed_cons (int);
 171 static char *output_invalid (int c);
 172 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
 173                                     const char *);
 174 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
 175                                        const char *);
 176 static int i386_att_operand (char *);
 177 static int i386_intel_operand (char *, int);
 178 static int i386_intel_simplify (expressionS *);
 179 static int i386_intel_parse_name (const char *, expressionS *);
 180 static const reg_entry *parse_register (char *, char **);
 181 static char *parse_insn (char *, char *);
 182 static char *parse_operands (char *, const char *);
 183 static void swap_operands (void);
 184 static void swap_2_operands (int, int);
 185 static enum flag_code i386_addressing_mode (void);
 186 static void optimize_imm (void);
 187 static void optimize_disp (void);
 188 static const insn_template *match_template (char);
 189 static int check_string (void);
 190 static int process_suffix (void);
 191 static int check_byte_reg (void);
 192 static int check_long_reg (void);
 193 static int check_qword_reg (void);
 194 static int check_word_reg (void);
 195 static int finalize_imm (void);
 196 static int process_operands (void);
 197 static const seg_entry *build_modrm_byte (void);
 198 static void output_insn (void);
 199 static void output_imm (fragS *, offsetT);
 200 static void output_disp (fragS *, offsetT);
 201 #ifndef I386COFF
 202 static void s_bss (int);
 203 #endif
 204 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
 205 static void handle_large_common (int small ATTRIBUTE_UNUSED);
 206
 207 /* GNU_PROPERTY_X86_ISA_1_USED.  */
 208 static unsigned int x86_isa_1_used;
 209 /* GNU_PROPERTY_X86_FEATURE_2_USED.  */
 210 static unsigned int x86_feature_2_used;
 211 /* Generate x86 used ISA and feature properties.  */
 212 static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
 213 #endif
 214
 215 static const char *default_arch = DEFAULT_ARCH;
 216
 217 /* This struct describes rounding control and SAE in the instruction.  */
 218 struct RC_Operation
 219 {
 220   enum rc_type
 221     {
 222       rne = 0,
 223       rd,
 224       ru,
 225       rz,
 226       saeonly
 227     } type;
 228   int operand;
 229 };
 230
 231 static struct RC_Operation rc_op;
 232
 233 /* The struct describes masking, applied to OPERAND in the instruction.
 234    MASK is a pointer to the corresponding mask register.  ZEROING tells
 235    whether merging or zeroing mask is used.  */
 236 struct Mask_Operation
 237 {
 238   const reg_entry *mask;
 239   unsigned int zeroing;
 240   /* The operand where this operation is associated.  */
 241   int operand;
 242 };
 243
 244 static struct Mask_Operation mask_op;
 245
 246 /* The struct describes broadcasting, applied to OPERAND.  FACTOR is
 247    broadcast factor.  */
 248 struct Broadcast_Operation
 249 {
 250   /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}.  */
 251   int type;
 252
 253   /* Index of broadcasted operand.  */
 254   int operand;
 255
 256   /* Number of bytes to broadcast.  */
 257   int bytes;
 258 };
 259
 260 static struct Broadcast_Operation broadcast_op;
 261
 262 /* VEX prefix.  */
 263 typedef struct
 264 {
 265   /* VEX prefix is either 2 byte or 3 byte.  EVEX is 4 byte.  */
 266   unsigned char bytes[4];
 267   unsigned int length;
 268   /* Destination or source register specifier.  */
 269   const reg_entry *register_specifier;
 270 } vex_prefix;
 271
 272 /* 'md_assemble ()' gathers together information and puts it into a
 273    i386_insn.  */
 274
 275 union i386_op
 276   {
 277     expressionS *disps;
 278     expressionS *imms;
 279     const reg_entry *regs;
 280   };
 281
 282 enum i386_error
 283   {
 284     operand_size_mismatch,
 285     operand_type_mismatch,
 286     register_type_mismatch,
 287     number_of_operands_mismatch,
 288     invalid_instruction_suffix,
 289     bad_imm4,
 290     unsupported_with_intel_mnemonic,
 291     unsupported_syntax,
 292     unsupported,
 293     invalid_vsib_address,
 294     invalid_vector_register_set,
 295     unsupported_vector_index_register,
 296     unsupported_broadcast,
 297     broadcast_needed,
 298     unsupported_masking,
 299     mask_not_on_destination,
 300     no_default_mask,
 301     unsupported_rc_sae,
 302     rc_sae_operand_not_last_imm,
 303     invalid_register_operand,
 304   };
 305
 306 struct _i386_insn
 307   {
 308     /* TM holds the template for the insn were currently assembling.  */
 309     insn_template tm;
 310
 311     /* SUFFIX holds the instruction size suffix for byte, word, dword
 312        or qword, if given.  */
 313     char suffix;
 314
 315     /* OPERANDS gives the number of given operands.  */
 316     unsigned int operands;
 317
 318     /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
 319        of given register, displacement, memory operands and immediate
 320        operands.  */
 321     unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
 322
 323     /* TYPES [i] is the type (see above #defines) which tells us how to
 324        use OP[i] for the corresponding operand.  */
 325     i386_operand_type types[MAX_OPERANDS];
 326
 327     /* Displacement expression, immediate expression, or register for each
 328        operand.  */
 329     union i386_op op[MAX_OPERANDS];
 330
 331     /* Flags for operands.  */
 332     unsigned int flags[MAX_OPERANDS];
 333 #define Operand_PCrel 1
 334 #define Operand_Mem   2
 335
 336     /* Relocation type for operand */
 337     enum bfd_reloc_code_real reloc[MAX_OPERANDS];
 338
 339     /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
 340        the base index byte below.  */
 341     const reg_entry *base_reg;
 342     const reg_entry *index_reg;
 343     unsigned int log2_scale_factor;
 344
 345     /* SEG gives the seg_entries of this insn.  They are zero unless
 346        explicit segment overrides are given.  */
 347     const seg_entry *seg[2];
 348
 349     /* Copied first memory operand string, for re-checking.  */
 350     char *memop1_string;
 351
 352     /* PREFIX holds all the given prefix opcodes (usually null).
 353        PREFIXES is the number of prefix opcodes.  */
 354     unsigned int prefixes;
 355     unsigned char prefix[MAX_PREFIXES];
 356
 357     /* The operand to a branch insn indicates an absolute branch.  */
 358     bfd_boolean jumpabsolute;
 359
 360     /* Has MMX register operands.  */
 361     bfd_boolean has_regmmx;
 362
 363     /* Has XMM register operands.  */
 364     bfd_boolean has_regxmm;
 365
 366     /* Has YMM register operands.  */
 367     bfd_boolean has_regymm;
 368
 369     /* Has ZMM register operands.  */
 370     bfd_boolean has_regzmm;
 371
 372     /* Has GOTPC or TLS relocation.  */
 373     bfd_boolean has_gotpc_tls_reloc;
 374
 375     /* RM and SIB are the modrm byte and the sib byte where the
 376        addressing modes of this insn are encoded.  */
 377     modrm_byte rm;
 378     rex_byte rex;
 379     rex_byte vrex;
 380     sib_byte sib;
 381     vex_prefix vex;
 382
 383     /* Masking attributes.  */
 384     struct Mask_Operation *mask;
 385
 386     /* Rounding control and SAE attributes.  */
 387     struct RC_Operation *rounding;
 388
 389     /* Broadcasting attributes.  */
 390     struct Broadcast_Operation *broadcast;
 391
 392     /* Compressed disp8*N attribute.  */
 393     unsigned int memshift;
 394
 395     /* Prefer load or store in encoding.  */
 396     enum
 397       {
 398         dir_encoding_default = 0,
 399         dir_encoding_load,
 400         dir_encoding_store,
 401         dir_encoding_swap
 402       } dir_encoding;
 403
 404     /* Prefer 8bit or 32bit displacement in encoding.  */
 405     enum
 406       {
 407         disp_encoding_default = 0,
 408         disp_encoding_8bit,
 409         disp_encoding_32bit
 410       } disp_encoding;
 411
 412     /* Prefer the REX byte in encoding.  */
 413     bfd_boolean rex_encoding;
 414
 415     /* Disable instruction size optimization.  */
 416     bfd_boolean no_optimize;
 417
 418     /* How to encode vector instructions.  */
 419     enum
 420       {
 421         vex_encoding_default = 0,
 422         vex_encoding_vex,
 423         vex_encoding_vex3,
 424         vex_encoding_evex
 425       } vec_encoding;
 426
 427     /* REP prefix.  */
 428     const char *rep_prefix;
 429
 430     /* HLE prefix.  */
 431     const char *hle_prefix;
 432
 433     /* Have BND prefix.  */
 434     const char *bnd_prefix;
 435
 436     /* Have NOTRACK prefix.  */
 437     const char *notrack_prefix;
 438
 439     /* Error message.  */
 440     enum i386_error error;
 441   };
 442
 443 typedef struct _i386_insn i386_insn;
 444
 445 /* Link RC type with corresponding string, that'll be looked for in
 446    asm.  */
 447 struct RC_name
 448 {
 449   enum rc_type type;
 450   const char *name;
 451   unsigned int len;
 452 };
 453
 454 static const struct RC_name RC_NamesTable[] =
 455 {
 456   {  rne, STRING_COMMA_LEN ("rn-sae") },
 457   {  rd,  STRING_COMMA_LEN ("rd-sae") },
 458   {  ru,  STRING_COMMA_LEN ("ru-sae") },
 459   {  rz,  STRING_COMMA_LEN ("rz-sae") },
 460   {  saeonly,  STRING_COMMA_LEN ("sae") },
 461 };
 462
 463 /* List of chars besides those in app.c:symbol_chars that can start an
 464    operand.  Used to prevent the scrubber eating vital white-space.  */
 465 const char extra_symbol_chars[] = "*%-([{}"
 466 #ifdef LEX_AT
 467         "@"
 468 #endif
 469 #ifdef LEX_QM
 470         "?"
 471 #endif
 472         ;
 473
 474 #if (defined (TE_I386AIX)                               \
 475      || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
 476          && !defined (TE_GNU)                           \
 477          && !defined (TE_LINUX)                         \
 478          && !defined (TE_NACL)                          \
 479          && !defined (TE_FreeBSD)                       \
 480          && !defined (TE_DragonFly)                     \
 481          && !defined (TE_NetBSD)))
 482 /* This array holds the chars that always start a comment.  If the
 483    pre-processor is disabled, these aren't very useful.  The option
 484    --divide will remove '/' from this list.  */
 485 const char *i386_comment_chars = "#/";
 486 #define SVR4_COMMENT_CHARS 1
 487 #define PREFIX_SEPARATOR '\\'
 488
 489 #else
 490 const char *i386_comment_chars = "#";
 491 #define PREFIX_SEPARATOR '/'
 492 #endif
 493
 494 /* This array holds the chars that only start a comment at the beginning of
 495    a line.  If the line seems to have the form '# 123 filename'
 496    .line and .file directives will appear in the pre-processed output.
 497    Note that input_file.c hand checks for '#' at the beginning of the
 498    first line of the input file.  This is because the compiler outputs
 499    #NO_APP at the beginning of its output.
 500    Also note that comments started like this one will always work if
 501    '/' isn't otherwise defined.  */
 502 const char line_comment_chars[] = "#/";
 503
 504 const char line_separator_chars[] = ";";
 505
 506 /* Chars that can be used to separate mant from exp in floating point
 507    nums.  */
 508 const char EXP_CHARS[] = "eE";
 509
 510 /* Chars that mean this number is a floating point constant
 511    As in 0f12.456
 512    or    0d1.2345e12.  */
 513 const char FLT_CHARS[] = "fFdDxX";
 514
 515 /* Tables for lexical analysis.  */
 516 static char mnemonic_chars[256];
 517 static char register_chars[256];
 518 static char operand_chars[256];
 519 static char identifier_chars[256];
 520 static char digit_chars[256];
 521
 522 /* Lexical macros.  */
 523 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
 524 #define is_operand_char(x) (operand_chars[(unsigned char) x])
 525 #define is_register_char(x) (register_chars[(unsigned char) x])
 526 #define is_space_char(x) ((x) == ' ')
 527 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
 528 #define is_digit_char(x) (digit_chars[(unsigned char) x])
 529
 530 /* All non-digit non-letter characters that may occur in an operand.  */
 531 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
 532
 533 /* md_assemble() always leaves the strings it's passed unaltered.  To
 534    effect this we maintain a stack of saved characters that we've smashed
 535    with '\0's (indicating end of strings for various sub-fields of the
 536    assembler instruction).  */
 537 static char save_stack[32];
 538 static char *save_stack_p;
 539 #define END_STRING_AND_SAVE(s) \
 540         do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
 541 #define RESTORE_END_STRING(s) \
 542         do { *(s) = *--save_stack_p; } while (0)
 543
 544 /* The instruction we're assembling.  */
 545 static i386_insn i;
 546
 547 /* Possible templates for current insn.  */
 548 static const templates *current_templates;
 549
 550 /* Per instruction expressionS buffers: max displacements & immediates.  */
 551 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
 552 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
 553
 554 /* Current operand we are working on.  */
 555 static int this_operand = -1;
 556
 557 /* We support four different modes.  FLAG_CODE variable is used to distinguish
 558    these.  */
 559
 560 enum flag_code {
 561         CODE_32BIT,
 562         CODE_16BIT,
 563         CODE_64BIT };
 564
 565 static enum flag_code flag_code;
 566 static unsigned int object_64bit;
 567 static unsigned int disallow_64bit_reloc;
 568 static int use_rela_relocations = 0;
 569 /* __tls_get_addr/___tls_get_addr symbol for TLS.  */
 570 static const char *tls_get_addr;
 571
 572 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
 573      || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
 574      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
 575
 576 /* The ELF ABI to use.  */
 577 enum x86_elf_abi
 578 {
 579   I386_ABI,
 580   X86_64_ABI,
 581   X86_64_X32_ABI
 582 };
 583
 584 static enum x86_elf_abi x86_elf_abi = I386_ABI;
 585 #endif
 586
 587 #if defined (TE_PE) || defined (TE_PEP)
 588 /* Use big object file format.  */
 589 static int use_big_obj = 0;
 590 #endif
 591
 592 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
 593 /* 1 if generating code for a shared library.  */
 594 static int shared = 0;
 595 #endif
 596
 597 /* 1 for intel syntax,
 598    0 if att syntax.  */
 599 static int intel_syntax = 0;
 600
 601 /* 1 for Intel64 ISA,
 602    0 if AMD64 ISA.  */
 603 static int intel64;
 604
 605 /* 1 for intel mnemonic,
 606    0 if att mnemonic.  */
 607 static int intel_mnemonic = !SYSV386_COMPAT;
 608
 609 /* 1 if pseudo registers are permitted.  */
 610 static int allow_pseudo_reg = 0;
 611
 612 /* 1 if register prefix % not required.  */
 613 static int allow_naked_reg = 0;
 614
 615 /* 1 if the assembler should add BND prefix for all control-transferring
 616    instructions supporting it, even if this prefix wasn't specified
 617    explicitly.  */
 618 static int add_bnd_prefix = 0;
 619
 620 /* 1 if pseudo index register, eiz/riz, is allowed .  */
 621 static int allow_index_reg = 0;
 622
 623 /* 1 if the assembler should ignore LOCK prefix, even if it was
 624    specified explicitly.  */
 625 static int omit_lock_prefix = 0;
 626
 627 /* 1 if the assembler should encode lfence, mfence, and sfence as
 628    "lock addl $0, (%{re}sp)".  */
 629 static int avoid_fence = 0;
 630
 631 /* Type of the previous instruction.  */
 632 static struct
 633   {
 634     segT seg;
 635     const char *file;
 636     const char *name;
 637     unsigned int line;
 638     enum last_insn_kind
 639       {
 640         last_insn_other = 0,
 641         last_insn_directive,
 642         last_insn_prefix
 643       } kind;
 644   } last_insn;
 645
 646 /* 1 if the assembler should generate relax relocations.  */
 647
 648 static int generate_relax_relocations
 649   = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
 650
 651 static enum check_kind
 652   {
 653     check_none = 0,
 654     check_warning,
 655     check_error
 656   }
 657 sse_check, operand_check = check_warning;
 658
 659 /* Non-zero if branches should be aligned within power of 2 boundary.  */
 660 static int align_branch_power = 0;
 661
 662 /* Types of branches to align.  */
 663 enum align_branch_kind
 664   {
 665     align_branch_none = 0,
 666     align_branch_jcc = 1,
 667     align_branch_fused = 2,
 668     align_branch_jmp = 3,
 669     align_branch_call = 4,
 670     align_branch_indirect = 5,
 671     align_branch_ret = 6
 672   };
 673
 674 /* Type bits of branches to align.  */
 675 enum align_branch_bit
 676   {
 677     align_branch_jcc_bit = 1 << align_branch_jcc,
 678     align_branch_fused_bit = 1 << align_branch_fused,
 679     align_branch_jmp_bit = 1 << align_branch_jmp,
 680     align_branch_call_bit = 1 << align_branch_call,
 681     align_branch_indirect_bit = 1 << align_branch_indirect,
 682     align_branch_ret_bit = 1 << align_branch_ret
 683   };
 684
 685 static unsigned int align_branch = (align_branch_jcc_bit
 686                                     | align_branch_fused_bit
 687                                     | align_branch_jmp_bit);
 688
 689 /* The maximum padding size for fused jcc.  CMP like instruction can
 690    be 9 bytes and jcc can be 6 bytes.  Leave room just in case for
 691    prefixes.   */
 692 #define MAX_FUSED_JCC_PADDING_SIZE 20
 693
 694 /* The maximum number of prefixes added for an instruction.  */
 695 static unsigned int align_branch_prefix_size = 5;
 696
 697 /* Optimization:
 698    1. Clear the REX_W bit with register operand if possible.
 699    2. Above plus use 128bit vector instruction to clear the full vector
 700       register.
 701  */
 702 static int optimize = 0;
 703
 704 /* Optimization:
 705    1. Clear the REX_W bit with register operand if possible.
 706    2. Above plus use 128bit vector instruction to clear the full vector
 707       register.
 708    3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
 709       "testb $imm7,%r8".
 710  */
 711 static int optimize_for_space = 0;
 712
 713 /* Register prefix used for error message.  */
 714 static const char *register_prefix = "%";
 715
 716 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
 717    leave, push, and pop instructions so that gcc has the same stack
 718    frame as in 32 bit mode.  */
 719 static char stackop_size = '\0';
 720
 721 /* Non-zero to optimize code alignment.  */
 722 int optimize_align_code = 1;
 723
 724 /* Non-zero to quieten some warnings.  */
 725 static int quiet_warnings = 0;
 726
 727 /* CPU name.  */
 728 static const char *cpu_arch_name = NULL;
 729 static char *cpu_sub_arch_name = NULL;
 730
 731 /* CPU feature flags.  */
 732 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
 733
 734 /* If we have selected a cpu we are generating instructions for.  */
 735 static int cpu_arch_tune_set = 0;
 736
 737 /* Cpu we are generating instructions for.  */
 738 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
 739
 740 /* CPU feature flags of cpu we are generating instructions for.  */
 741 static i386_cpu_flags cpu_arch_tune_flags;
 742
 743 /* CPU instruction set architecture used.  */
 744 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
 745
 746 /* CPU feature flags of instruction set architecture used.  */
 747 i386_cpu_flags cpu_arch_isa_flags;
 748
 749 /* If set, conditional jumps are not automatically promoted to handle
 750    larger than a byte offset.  */
 751 static unsigned int no_cond_jump_promotion = 0;
 752
 753 /* Encode SSE instructions with VEX prefix.  */
 754 static unsigned int sse2avx;
 755
 756 /* Encode scalar AVX instructions with specific vector length.  */
 757 static enum
 758   {
 759     vex128 = 0,
 760     vex256
 761   } avxscalar;
 762
 763 /* Encode VEX WIG instructions with specific vex.w.  */
 764 static enum
 765   {
 766     vexw0 = 0,
 767     vexw1
 768   } vexwig;
 769
 770 /* Encode scalar EVEX LIG instructions with specific vector length.  */
 771 static enum
 772   {
 773     evexl128 = 0,
 774     evexl256,
 775     evexl512
 776   } evexlig;
 777
 778 /* Encode EVEX WIG instructions with specific evex.w.  */
 779 static enum
 780   {
 781     evexw0 = 0,
 782     evexw1
 783   } evexwig;
 784
 785 /* Value to encode in EVEX RC bits, for SAE-only instructions.  */
 786 static enum rc_type evexrcig = rne;
 787
 788 /* Pre-defined "_GLOBAL_OFFSET_TABLE_".  */
 789 static symbolS *GOT_symbol;
 790
 791 /* The dwarf2 return column, adjusted for 32 or 64 bit.  */
 792 unsigned int x86_dwarf2_return_column;
 793
 794 /* The dwarf2 data alignment, adjusted for 32 or 64 bit.  */
 795 int x86_cie_data_alignment;
 796
 797 /* Interface to relax_segment.
 798    There are 3 major relax states for 386 jump insns because the
 799    different types of jumps add different sizes to frags when we're
 800    figuring out what sort of jump to choose to reach a given label.
 801
 802    BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
 803    branches which are handled by md_estimate_size_before_relax() and
 804    i386_generic_table_relax_frag().  */
 805
 806 /* Types.  */
 807 #define UNCOND_JUMP 0
 808 #define COND_JUMP 1
 809 #define COND_JUMP86 2
 810 #define BRANCH_PADDING 3
 811 #define BRANCH_PREFIX 4
 812 #define FUSED_JCC_PADDING 5
 813
 814 /* Sizes.  */
 815 #define CODE16  1
 816 #define SMALL   0
 817 #define SMALL16 (SMALL | CODE16)
 818 #define BIG     2
 819 #define BIG16   (BIG | CODE16)
 820
 821 #ifndef INLINE
 822 #ifdef __GNUC__
 823 #define INLINE __inline__
 824 #else
 825 #define INLINE
 826 #endif
 827 #endif
 828
 829 #define ENCODE_RELAX_STATE(type, size) \
 830   ((relax_substateT) (((type) << 2) | (size)))
 831 #define TYPE_FROM_RELAX_STATE(s) \
 832   ((s) >> 2)
 833 #define DISP_SIZE_FROM_RELAX_STATE(s) \
 834     ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
 835
 836 /* This table is used by relax_frag to promote short jumps to long
 837    ones where necessary.  SMALL (short) jumps may be promoted to BIG
 838    (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long).  We
 839    don't allow a short jump in a 32 bit code segment to be promoted to
 840    a 16 bit offset jump because it's slower (requires data size
 841    prefix), and doesn't work, unless the destination is in the bottom
 842    64k of the code segment (The top 16 bits of eip are zeroed).  */
 843
 844 const relax_typeS md_relax_table[] =
 845 {
 846   /* The fields are:
 847      1) most positive reach of this state,
 848      2) most negative reach of this state,
 849      3) how many bytes this mode will have in the variable part of the frag
 850      4) which index into the table to try if we can't fit into this one.  */
 851
 852   /* UNCOND_JUMP states.  */
 853   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
 854   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
 855   /* dword jmp adds 4 bytes to frag:
 856      0 extra opcode bytes, 4 displacement bytes.  */
 857   {0, 0, 4, 0},
 858   /* word jmp adds 2 byte2 to frag:
 859      0 extra opcode bytes, 2 displacement bytes.  */
 860   {0, 0, 2, 0},
 861
 862   /* COND_JUMP states.  */
 863   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
 864   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
 865   /* dword conditionals adds 5 bytes to frag:
 866      1 extra opcode byte, 4 displacement bytes.  */
 867   {0, 0, 5, 0},
 868   /* word conditionals add 3 bytes to frag:
 869      1 extra opcode byte, 2 displacement bytes.  */
 870   {0, 0, 3, 0},
 871
 872   /* COND_JUMP86 states.  */
 873   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
 874   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
 875   /* dword conditionals adds 5 bytes to frag:
 876      1 extra opcode byte, 4 displacement bytes.  */
 877   {0, 0, 5, 0},
 878   /* word conditionals add 4 bytes to frag:
 879      1 displacement byte and a 3 byte long branch insn.  */
 880   {0, 0, 4, 0}
 881 };
 882
 883 static const arch_entry cpu_arch[] =
 884 {
 885   /* Do not replace the first two entries - i386_target_format()
 886      relies on them being there in this order.  */
 887   { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
 888     CPU_GENERIC32_FLAGS, 0 },
 889   { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
 890     CPU_GENERIC64_FLAGS, 0 },
 891   { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
 892     CPU_NONE_FLAGS, 0 },
 893   { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
 894     CPU_I186_FLAGS, 0 },
 895   { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
 896     CPU_I286_FLAGS, 0 },
 897   { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
 898     CPU_I386_FLAGS, 0 },
 899   { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
 900     CPU_I486_FLAGS, 0 },
 901   { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
 902     CPU_I586_FLAGS, 0 },
 903   { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
 904     CPU_I686_FLAGS, 0 },
 905   { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
 906     CPU_I586_FLAGS, 0 },
 907   { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
 908     CPU_PENTIUMPRO_FLAGS, 0 },
 909   { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
 910     CPU_P2_FLAGS, 0 },
 911   { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
 912     CPU_P3_FLAGS, 0 },
 913   { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
 914     CPU_P4_FLAGS, 0 },
 915   { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
 916     CPU_CORE_FLAGS, 0 },
 917   { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
 918     CPU_NOCONA_FLAGS, 0 },
 919   { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
 920     CPU_CORE_FLAGS, 1 },
 921   { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
 922     CPU_CORE_FLAGS, 0 },
 923   { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
 924     CPU_CORE2_FLAGS, 1 },
 925   { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
 926     CPU_CORE2_FLAGS, 0 },
 927   { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
 928     CPU_COREI7_FLAGS, 0 },
 929   { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
 930     CPU_L1OM_FLAGS, 0 },
 931   { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
 932     CPU_K1OM_FLAGS, 0 },
 933   { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
 934     CPU_IAMCU_FLAGS, 0 },
 935   { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
 936     CPU_K6_FLAGS, 0 },
 937   { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
 938     CPU_K6_2_FLAGS, 0 },
 939   { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
 940     CPU_ATHLON_FLAGS, 0 },
 941   { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
 942     CPU_K8_FLAGS, 1 },
 943   { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
 944     CPU_K8_FLAGS, 0 },
 945   { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
 946     CPU_K8_FLAGS, 0 },
 947   { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
 948     CPU_AMDFAM10_FLAGS, 0 },
 949   { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
 950     CPU_BDVER1_FLAGS, 0 },
 951   { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
 952     CPU_BDVER2_FLAGS, 0 },
 953   { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
 954     CPU_BDVER3_FLAGS, 0 },
 955   { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
 956     CPU_BDVER4_FLAGS, 0 },
 957   { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
 958     CPU_ZNVER1_FLAGS, 0 },
 959   { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
 960     CPU_ZNVER2_FLAGS, 0 },
 961   { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
 962     CPU_BTVER1_FLAGS, 0 },
 963   { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
 964     CPU_BTVER2_FLAGS, 0 },
 965   { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
 966     CPU_8087_FLAGS, 0 },
 967   { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
 968     CPU_287_FLAGS, 0 },
 969   { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
 970     CPU_387_FLAGS, 0 },
 971   { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
 972     CPU_687_FLAGS, 0 },
 973   { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
 974     CPU_CMOV_FLAGS, 0 },
 975   { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
 976     CPU_FXSR_FLAGS, 0 },
 977   { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
 978     CPU_MMX_FLAGS, 0 },
 979   { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
 980     CPU_SSE_FLAGS, 0 },
 981   { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
 982     CPU_SSE2_FLAGS, 0 },
 983   { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
 984     CPU_SSE3_FLAGS, 0 },
 985   { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
 986     CPU_SSSE3_FLAGS, 0 },
 987   { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
 988     CPU_SSE4_1_FLAGS, 0 },
 989   { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
 990     CPU_SSE4_2_FLAGS, 0 },
 991   { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
 992     CPU_SSE4_2_FLAGS, 0 },
 993   { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
 994     CPU_AVX_FLAGS, 0 },
 995   { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
 996     CPU_AVX2_FLAGS, 0 },
 997   { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
 998     CPU_AVX512F_FLAGS, 0 },
 999   { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
1000     CPU_AVX512CD_FLAGS, 0 },
1001   { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
1002     CPU_AVX512ER_FLAGS, 0 },
1003   { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
1004     CPU_AVX512PF_FLAGS, 0 },
1005   { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
1006     CPU_AVX512DQ_FLAGS, 0 },
1007   { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
1008     CPU_AVX512BW_FLAGS, 0 },
1009   { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
1010     CPU_AVX512VL_FLAGS, 0 },
1011   { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
1012     CPU_VMX_FLAGS, 0 },
1013   { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
1014     CPU_VMFUNC_FLAGS, 0 },
1015   { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
1016     CPU_SMX_FLAGS, 0 },
1017   { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
1018     CPU_XSAVE_FLAGS, 0 },
1019   { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
1020     CPU_XSAVEOPT_FLAGS, 0 },
1021   { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
1022     CPU_XSAVEC_FLAGS, 0 },
1023   { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
1024     CPU_XSAVES_FLAGS, 0 },
1025   { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
1026     CPU_AES_FLAGS, 0 },
1027   { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
1028     CPU_PCLMUL_FLAGS, 0 },
1029   { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
1030     CPU_PCLMUL_FLAGS, 1 },
1031   { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
1032     CPU_FSGSBASE_FLAGS, 0 },
1033   { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
1034     CPU_RDRND_FLAGS, 0 },
1035   { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
1036     CPU_F16C_FLAGS, 0 },
1037   { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
1038     CPU_BMI2_FLAGS, 0 },
1039   { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
1040     CPU_FMA_FLAGS, 0 },
1041   { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
1042     CPU_FMA4_FLAGS, 0 },
1043   { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
1044     CPU_XOP_FLAGS, 0 },
1045   { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
1046     CPU_LWP_FLAGS, 0 },
1047   { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
1048     CPU_MOVBE_FLAGS, 0 },
1049   { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
1050     CPU_CX16_FLAGS, 0 },
1051   { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
1052     CPU_EPT_FLAGS, 0 },
1053   { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
1054     CPU_LZCNT_FLAGS, 0 },
1055   { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
1056     CPU_HLE_FLAGS, 0 },
1057   { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
1058     CPU_RTM_FLAGS, 0 },
1059   { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
1060     CPU_INVPCID_FLAGS, 0 },
1061   { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
1062     CPU_CLFLUSH_FLAGS, 0 },
1063   { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
1064     CPU_NOP_FLAGS, 0 },
1065   { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
1066     CPU_SYSCALL_FLAGS, 0 },
1067   { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
1068     CPU_RDTSCP_FLAGS, 0 },
1069   { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
1070     CPU_3DNOW_FLAGS, 0 },
1071   { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
1072     CPU_3DNOWA_FLAGS, 0 },
1073   { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
1074     CPU_PADLOCK_FLAGS, 0 },
1075   { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
1076     CPU_SVME_FLAGS, 1 },
1077   { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
1078     CPU_SVME_FLAGS, 0 },
1079   { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1080     CPU_SSE4A_FLAGS, 0 },
1081   { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
1082     CPU_ABM_FLAGS, 0 },
1083   { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
1084     CPU_BMI_FLAGS, 0 },
1085   { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
1086     CPU_TBM_FLAGS, 0 },
1087   { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
1088     CPU_ADX_FLAGS, 0 },
1089   { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
1090     CPU_RDSEED_FLAGS, 0 },
1091   { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
1092     CPU_PRFCHW_FLAGS, 0 },
1093   { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
1094     CPU_SMAP_FLAGS, 0 },
1095   { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
1096     CPU_MPX_FLAGS, 0 },
1097   { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
1098     CPU_SHA_FLAGS, 0 },
1099   { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
1100     CPU_CLFLUSHOPT_FLAGS, 0 },
1101   { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
1102     CPU_PREFETCHWT1_FLAGS, 0 },
1103   { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
1104     CPU_SE1_FLAGS, 0 },
1105   { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
1106     CPU_CLWB_FLAGS, 0 },
1107   { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
1108     CPU_AVX512IFMA_FLAGS, 0 },
1109   { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
1110     CPU_AVX512VBMI_FLAGS, 0 },
1111   { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1112     CPU_AVX512_4FMAPS_FLAGS, 0 },
1113   { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1114     CPU_AVX512_4VNNIW_FLAGS, 0 },
1115   { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1116     CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
1117   { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1118     CPU_AVX512_VBMI2_FLAGS, 0 },
1119   { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1120     CPU_AVX512_VNNI_FLAGS, 0 },
1121   { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1122     CPU_AVX512_BITALG_FLAGS, 0 },
1123   { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
1124     CPU_CLZERO_FLAGS, 0 },
1125   { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
1126     CPU_MWAITX_FLAGS, 0 },
1127   { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
1128     CPU_OSPKE_FLAGS, 0 },
1129   { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
1130     CPU_RDPID_FLAGS, 0 },
1131   { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1132     CPU_PTWRITE_FLAGS, 0 },
1133   { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1134     CPU_IBT_FLAGS, 0 },
1135   { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1136     CPU_SHSTK_FLAGS, 0 },
1137   { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1138     CPU_GFNI_FLAGS, 0 },
1139   { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1140     CPU_VAES_FLAGS, 0 },
1141   { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1142     CPU_VPCLMULQDQ_FLAGS, 0 },
1143   { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1144     CPU_WBNOINVD_FLAGS, 0 },
1145   { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1146     CPU_PCONFIG_FLAGS, 0 },
1147   { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1148     CPU_WAITPKG_FLAGS, 0 },
1149   { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1150     CPU_CLDEMOTE_FLAGS, 0 },
1151   { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1152     CPU_MOVDIRI_FLAGS, 0 },
1153   { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1154     CPU_MOVDIR64B_FLAGS, 0 },
1155   { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1156     CPU_AVX512_BF16_FLAGS, 0 },
1157   { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
1158     CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
1159   { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
1160     CPU_ENQCMD_FLAGS, 0 },
1161   { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
1162     CPU_RDPRU_FLAGS, 0 },
1163   { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
1164     CPU_MCOMMIT_FLAGS, 0 },
1165 };
1166
1167 static const noarch_entry cpu_noarch[] =
1168 {
1169   { STRING_COMMA_LEN ("no87"),  CPU_ANY_X87_FLAGS },
1170   { STRING_COMMA_LEN ("no287"),  CPU_ANY_287_FLAGS },
1171   { STRING_COMMA_LEN ("no387"),  CPU_ANY_387_FLAGS },
1172   { STRING_COMMA_LEN ("no687"),  CPU_ANY_687_FLAGS },
1173   { STRING_COMMA_LEN ("nocmov"),  CPU_ANY_CMOV_FLAGS },
1174   { STRING_COMMA_LEN ("nofxsr"),  CPU_ANY_FXSR_FLAGS },
1175   { STRING_COMMA_LEN ("nommx"),  CPU_ANY_MMX_FLAGS },
1176   { STRING_COMMA_LEN ("nosse"),  CPU_ANY_SSE_FLAGS },
1177   { STRING_COMMA_LEN ("nosse2"),  CPU_ANY_SSE2_FLAGS },
1178   { STRING_COMMA_LEN ("nosse3"),  CPU_ANY_SSE3_FLAGS },
1179   { STRING_COMMA_LEN ("nossse3"),  CPU_ANY_SSSE3_FLAGS },
1180   { STRING_COMMA_LEN ("nosse4.1"),  CPU_ANY_SSE4_1_FLAGS },
1181   { STRING_COMMA_LEN ("nosse4.2"),  CPU_ANY_SSE4_2_FLAGS },
1182   { STRING_COMMA_LEN ("nosse4"),  CPU_ANY_SSE4_1_FLAGS },
1183   { STRING_COMMA_LEN ("noavx"),  CPU_ANY_AVX_FLAGS },
1184   { STRING_COMMA_LEN ("noavx2"),  CPU_ANY_AVX2_FLAGS },
1185   { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1186   { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1187   { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1188   { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1189   { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1190   { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1191   { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1192   { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1193   { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
1194   { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
1195   { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
1196   { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
1197   { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
1198   { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
1199   { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
1200   { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1201   { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
1202   { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1203   { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
1204   { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
1205   { STRING_COMMA_LEN ("noavx512_vp2intersect"), CPU_ANY_SHSTK_FLAGS },
1206   { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
1207 };
1208
1209 #ifdef I386COFF
1210 /* Like s_lcomm_internal in gas/read.c but the alignment string
1211    is allowed to be optional.  */
1212
1213 static symbolS *
1214 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1215 {
1216   addressT align = 0;
1217
1218   SKIP_WHITESPACE ();
1219
1220   if (needs_align
1221       && *input_line_pointer == ',')
1222     {
1223       align = parse_align (needs_align - 1);
1224
1225       if (align == (addressT) -1)
1226         return NULL;
1227     }
1228   else
1229     {
1230       if (size >= 8)
1231         align = 3;
1232       else if (size >= 4)
1233         align = 2;
1234       else if (size >= 2)
1235         align = 1;
1236       else
1237         align = 0;
1238     }
1239
1240   bss_alloc (symbolP, size, align);
1241   return symbolP;
1242 }
1243
1244 static void
1245 pe_lcomm (int needs_align)
1246 {
1247   s_comm_internal (needs_align * 2, pe_lcomm_internal);
1248 }
1249 #endif
1250
1251 const pseudo_typeS md_pseudo_table[] =
1252 {
1253 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1254   {"align", s_align_bytes, 0},
1255 #else
1256   {"align", s_align_ptwo, 0},
1257 #endif
1258   {"arch", set_cpu_arch, 0},
1259 #ifndef I386COFF
1260   {"bss", s_bss, 0},
1261 #else
1262   {"lcomm", pe_lcomm, 1},
1263 #endif
1264   {"ffloat", float_cons, 'f'},
1265   {"dfloat", float_cons, 'd'},
1266   {"tfloat", float_cons, 'x'},
1267   {"value", cons, 2},
1268   {"slong", signed_cons, 4},
1269   {"noopt", s_ignore, 0},
1270   {"optim", s_ignore, 0},
1271   {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1272   {"code16", set_code_flag, CODE_16BIT},
1273   {"code32", set_code_flag, CODE_32BIT},
1274 #ifdef BFD64
1275   {"code64", set_code_flag, CODE_64BIT},
1276 #endif
1277   {"intel_syntax", set_intel_syntax, 1},
1278   {"att_syntax", set_intel_syntax, 0},
1279   {"intel_mnemonic", set_intel_mnemonic, 1},
1280   {"att_mnemonic", set_intel_mnemonic, 0},
1281   {"allow_index_reg", set_allow_index_reg, 1},
1282   {"disallow_index_reg", set_allow_index_reg, 0},
1283   {"sse_check", set_check, 0},
1284   {"operand_check", set_check, 1},
1285 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1286   {"largecomm", handle_large_common, 0},
1287 #else
1288   {"file", dwarf2_directive_file, 0},
1289   {"loc", dwarf2_directive_loc, 0},
1290   {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1291 #endif
1292 #ifdef TE_PE
1293   {"secrel32", pe_directive_secrel, 0},
1294 #endif
1295   {0, 0, 0}
1296 };
1297
1298 /* For interface with expression ().  */
1299 extern char *input_line_pointer;
1300
1301 /* Hash table for instruction mnemonic lookup.  */
1302 static struct hash_control *op_hash;
1303
1304 /* Hash table for register lookup.  */
1305 static struct hash_control *reg_hash;
1306 \f
1307   /* Various efficient no-op patterns for aligning code labels.
1308      Note: Don't try to assemble the instructions in the comments.
1309      0L and 0w are not legal.  */
1310 static const unsigned char f32_1[] =
1311   {0x90};                               /* nop                  */
1312 static const unsigned char f32_2[] =
1313   {0x66,0x90};                          /* xchg %ax,%ax         */
1314 static const unsigned char f32_3[] =
1315   {0x8d,0x76,0x00};                     /* leal 0(%esi),%esi    */
1316 static const unsigned char f32_4[] =
1317   {0x8d,0x74,0x26,0x00};                /* leal 0(%esi,1),%esi  */
1318 static const unsigned char f32_6[] =
1319   {0x8d,0xb6,0x00,0x00,0x00,0x00};      /* leal 0L(%esi),%esi   */
1320 static const unsigned char f32_7[] =
1321   {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1322 static const unsigned char f16_3[] =
1323   {0x8d,0x74,0x00};                     /* lea 0(%si),%si       */
1324 static const unsigned char f16_4[] =
1325   {0x8d,0xb4,0x00,0x00};                /* lea 0W(%si),%si      */
1326 static const unsigned char jump_disp8[] =
1327   {0xeb};                               /* jmp disp8           */
1328 static const unsigned char jump32_disp32[] =
1329   {0xe9};                               /* jmp disp32          */
1330 static const unsigned char jump16_disp32[] =
1331   {0x66,0xe9};                          /* jmp disp32          */
1332 /* 32-bit NOPs patterns.  */
1333 static const unsigned char *const f32_patt[] = {
1334   f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
1335 };
1336 /* 16-bit NOPs patterns.  */
1337 static const unsigned char *const f16_patt[] = {
1338   f32_1, f32_2, f16_3, f16_4
1339 };
1340 /* nopl (%[re]ax) */
1341 static const unsigned char alt_3[] =
1342   {0x0f,0x1f,0x00};
1343 /* nopl 0(%[re]ax) */
1344 static const unsigned char alt_4[] =
1345   {0x0f,0x1f,0x40,0x00};
1346 /* nopl 0(%[re]ax,%[re]ax,1) */
1347 static const unsigned char alt_5[] =
1348   {0x0f,0x1f,0x44,0x00,0x00};
1349 /* nopw 0(%[re]ax,%[re]ax,1) */
1350 static const unsigned char alt_6[] =
1351   {0x66,0x0f,0x1f,0x44,0x00,0x00};
1352 /* nopl 0L(%[re]ax) */
1353 static const unsigned char alt_7[] =
1354   {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1355 /* nopl 0L(%[re]ax,%[re]ax,1) */
1356 static const unsigned char alt_8[] =
1357   {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1358 /* nopw 0L(%[re]ax,%[re]ax,1) */
1359 static const unsigned char alt_9[] =
1360   {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1361 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1362 static const unsigned char alt_10[] =
1363   {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1364 /* data16 nopw %cs:0L(%eax,%eax,1) */
1365 static const unsigned char alt_11[] =
1366   {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1367 /* 32-bit and 64-bit NOPs patterns.  */
1368 static const unsigned char *const alt_patt[] = {
1369   f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1370   alt_9, alt_10, alt_11
1371 };
1372
1373 /* Genenerate COUNT bytes of NOPs to WHERE from PATT with the maximum
1374    size of a single NOP instruction MAX_SINGLE_NOP_SIZE.  */
1375
1376 static void
1377 i386_output_nops (char *where, const unsigned char *const *patt,
1378                   int count, int max_single_nop_size)
1379
1380 {
1381   /* Place the longer NOP first.  */
1382   int last;
1383   int offset;
1384   const unsigned char *nops;
1385
1386   if (max_single_nop_size < 1)
1387     {
1388       as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1389                 max_single_nop_size);
1390       return;
1391     }
1392
1393   nops = patt[max_single_nop_size - 1];
1394
1395   /* Use the smaller one if the requsted one isn't available.  */
1396   if (nops == NULL)
1397     {
1398       max_single_nop_size--;
1399       nops = patt[max_single_nop_size - 1];
1400     }
1401
1402   last = count % max_single_nop_size;
1403
1404   count -= last;
1405   for (offset = 0; offset < count; offset += max_single_nop_size)
1406     memcpy (where + offset, nops, max_single_nop_size);
1407
1408   if (last)
1409     {
1410       nops = patt[last - 1];
1411       if (nops == NULL)
1412         {
1413           /* Use the smaller one plus one-byte NOP if the needed one
1414              isn't available.  */
1415           last--;
1416           nops = patt[last - 1];
1417           memcpy (where + offset, nops, last);
1418           where[offset + last] = *patt[0];
1419         }
1420       else
1421         memcpy (where + offset, nops, last);
1422     }
1423 }
1424
1425 static INLINE int
1426 fits_in_imm7 (offsetT num)
1427 {
1428   return (num & 0x7f) == num;
1429 }
1430
1431 static INLINE int
1432 fits_in_imm31 (offsetT num)
1433 {
1434   return (num & 0x7fffffff) == num;
1435 }
1436
1437 /* Genenerate COUNT bytes of NOPs to WHERE with the maximum size of a
1438    single NOP instruction LIMIT.  */
1439
1440 void
1441 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1442 {
1443   const unsigned char *const *patt = NULL;
1444   int max_single_nop_size;
1445   /* Maximum number of NOPs before switching to jump over NOPs.  */
1446   int max_number_of_nops;
1447
1448   switch (fragP->fr_type)
1449     {
1450     case rs_fill_nop:
1451     case rs_align_code:
1452       break;
1453     case rs_machine_dependent:
1454       /* Allow NOP padding for jumps and calls.  */
1455       if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
1456           || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
1457         break;
1458       /* Fall through.  */
1459     default:
1460       return;
1461     }
1462
1463   /* We need to decide which NOP sequence to use for 32bit and
1464      64bit. When -mtune= is used:
1465
1466      1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1467      PROCESSOR_GENERIC32, f32_patt will be used.
1468      2. For the rest, alt_patt will be used.
1469
1470      When -mtune= isn't used, alt_patt will be used if
1471      cpu_arch_isa_flags has CpuNop.  Otherwise, f32_patt will
1472      be used.
1473
1474      When -march= or .arch is used, we can't use anything beyond
1475      cpu_arch_isa_flags.   */
1476
1477   if (flag_code == CODE_16BIT)
1478     {
1479       patt = f16_patt;
1480       max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1481       /* Limit number of NOPs to 2 in 16-bit mode.  */
1482       max_number_of_nops = 2;
1483     }
1484   else
1485     {
1486       if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1487         {
1488           /* PROCESSOR_UNKNOWN means that all ISAs may be used.  */
1489           switch (cpu_arch_tune)
1490             {
1491             case PROCESSOR_UNKNOWN:
1492               /* We use cpu_arch_isa_flags to check if we SHOULD
1493                  optimize with nops.  */
1494               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1495                 patt = alt_patt;
1496               else
1497                 patt = f32_patt;
1498               break;
1499             case PROCESSOR_PENTIUM4:
1500             case PROCESSOR_NOCONA:
1501             case PROCESSOR_CORE:
1502             case PROCESSOR_CORE2:
1503             case PROCESSOR_COREI7:
1504             case PROCESSOR_L1OM:
1505             case PROCESSOR_K1OM:
1506             case PROCESSOR_GENERIC64:
1507             case PROCESSOR_K6:
1508             case PROCESSOR_ATHLON:
1509             case PROCESSOR_K8:
1510             case PROCESSOR_AMDFAM10:
1511             case PROCESSOR_BD:
1512             case PROCESSOR_ZNVER:
1513             case PROCESSOR_BT:
1514               patt = alt_patt;
1515               break;
1516             case PROCESSOR_I386:
1517             case PROCESSOR_I486:
1518             case PROCESSOR_PENTIUM:
1519             case PROCESSOR_PENTIUMPRO:
1520             case PROCESSOR_IAMCU:
1521             case PROCESSOR_GENERIC32:
1522               patt = f32_patt;
1523               break;
1524             }
1525         }
1526       else
1527         {
1528           switch (fragP->tc_frag_data.tune)
1529             {
1530             case PROCESSOR_UNKNOWN:
1531               /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1532                  PROCESSOR_UNKNOWN.  */
1533               abort ();
1534               break;
1535
1536             case PROCESSOR_I386:
1537             case PROCESSOR_I486:
1538             case PROCESSOR_PENTIUM:
1539             case PROCESSOR_IAMCU:
1540             case PROCESSOR_K6:
1541             case PROCESSOR_ATHLON:
1542             case PROCESSOR_K8:
1543             case PROCESSOR_AMDFAM10:
1544             case PROCESSOR_BD:
1545             case PROCESSOR_ZNVER:
1546             case PROCESSOR_BT:
1547             case PROCESSOR_GENERIC32:
1548               /* We use cpu_arch_isa_flags to check if we CAN optimize
1549                  with nops.  */
1550               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1551                 patt = alt_patt;
1552               else
1553                 patt = f32_patt;
1554               break;
1555             case PROCESSOR_PENTIUMPRO:
1556             case PROCESSOR_PENTIUM4:
1557             case PROCESSOR_NOCONA:
1558             case PROCESSOR_CORE:
1559             case PROCESSOR_CORE2:
1560             case PROCESSOR_COREI7:
1561             case PROCESSOR_L1OM:
1562             case PROCESSOR_K1OM:
1563               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1564                 patt = alt_patt;
1565               else
1566                 patt = f32_patt;
1567               break;
1568             case PROCESSOR_GENERIC64:
1569               patt = alt_patt;
1570               break;
1571             }
1572         }
1573
1574       if (patt == f32_patt)
1575         {
1576           max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1577           /* Limit number of NOPs to 2 for older processors.  */
1578           max_number_of_nops = 2;
1579         }
1580       else
1581         {
1582           max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1583           /* Limit number of NOPs to 7 for newer processors.  */
1584           max_number_of_nops = 7;
1585         }
1586     }
1587
1588   if (limit == 0)
1589     limit = max_single_nop_size;
1590
1591   if (fragP->fr_type == rs_fill_nop)
1592     {
1593       /* Output NOPs for .nop directive.  */
1594       if (limit > max_single_nop_size)
1595         {
1596           as_bad_where (fragP->fr_file, fragP->fr_line,
1597                         _("invalid single nop size: %d "
1598                           "(expect within [0, %d])"),
1599                         limit, max_single_nop_size);
1600           return;
1601         }
1602     }
1603   else if (fragP->fr_type != rs_machine_dependent)
1604     fragP->fr_var = count;
1605
1606   if ((count / max_single_nop_size) > max_number_of_nops)
1607     {
1608       /* Generate jump over NOPs.  */
1609       offsetT disp = count - 2;
1610       if (fits_in_imm7 (disp))
1611         {
1612           /* Use "jmp disp8" if possible.  */
1613           count = disp;
1614           where[0] = jump_disp8[0];
1615           where[1] = count;
1616           where += 2;
1617         }
1618       else
1619         {
1620           unsigned int size_of_jump;
1621
1622           if (flag_code == CODE_16BIT)
1623             {
1624               where[0] = jump16_disp32[0];
1625               where[1] = jump16_disp32[1];
1626               size_of_jump = 2;
1627             }
1628           else
1629             {
1630               where[0] = jump32_disp32[0];
1631               size_of_jump = 1;
1632             }
1633
1634           count -= size_of_jump + 4;
1635           if (!fits_in_imm31 (count))
1636             {
1637               as_bad_where (fragP->fr_file, fragP->fr_line,
1638                             _("jump over nop padding out of range"));
1639               return;
1640             }
1641
1642           md_number_to_chars (where + size_of_jump, count, 4);
1643           where += size_of_jump + 4;
1644         }
1645     }
1646
1647   /* Generate multiple NOPs.  */
1648   i386_output_nops (where, patt, count, limit);
1649 }
1650
1651 static INLINE int
1652 operand_type_all_zero (const union i386_operand_type *x)
1653 {
1654   switch (ARRAY_SIZE(x->array))
1655     {
1656     case 3:
1657       if (x->array[2])
1658         return 0;
1659       /* Fall through.  */
1660     case 2:
1661       if (x->array[1])
1662         return 0;
1663       /* Fall through.  */
1664     case 1:
1665       return !x->array[0];
1666     default:
1667       abort ();
1668     }
1669 }
1670
1671 static INLINE void
1672 operand_type_set (union i386_operand_type *x, unsigned int v)
1673 {
1674   switch (ARRAY_SIZE(x->array))
1675     {
1676     case 3:
1677       x->array[2] = v;
1678       /* Fall through.  */
1679     case 2:
1680       x->array[1] = v;
1681       /* Fall through.  */
1682     case 1:
1683       x->array[0] = v;
1684       /* Fall through.  */
1685       break;
1686     default:
1687       abort ();
1688     }
1689
1690   x->bitfield.class = ClassNone;
1691   x->bitfield.instance = InstanceNone;
1692 }
1693
1694 static INLINE int
1695 operand_type_equal (const union i386_operand_type *x,
1696                     const union i386_operand_type *y)
1697 {
1698   switch (ARRAY_SIZE(x->array))
1699     {
1700     case 3:
1701       if (x->array[2] != y->array[2])
1702         return 0;
1703       /* Fall through.  */
1704     case 2:
1705       if (x->array[1] != y->array[1])
1706         return 0;
1707       /* Fall through.  */
1708     case 1:
1709       return x->array[0] == y->array[0];
1710       break;
1711     default:
1712       abort ();
1713     }
1714 }
1715
1716 static INLINE int
1717 cpu_flags_all_zero (const union i386_cpu_flags *x)
1718 {
1719   switch (ARRAY_SIZE(x->array))
1720     {
1721     case 4:
1722       if (x->array[3])
1723         return 0;
1724       /* Fall through.  */
1725     case 3:
1726       if (x->array[2])
1727         return 0;
1728       /* Fall through.  */
1729     case 2:
1730       if (x->array[1])
1731         return 0;
1732       /* Fall through.  */
1733     case 1:
1734       return !x->array[0];
1735     default:
1736       abort ();
1737     }
1738 }
1739
1740 static INLINE int
1741 cpu_flags_equal (const union i386_cpu_flags *x,
1742                  const union i386_cpu_flags *y)
1743 {
1744   switch (ARRAY_SIZE(x->array))
1745     {
1746     case 4:
1747       if (x->array[3] != y->array[3])
1748         return 0;
1749       /* Fall through.  */
1750     case 3:
1751       if (x->array[2] != y->array[2])
1752         return 0;
1753       /* Fall through.  */
1754     case 2:
1755       if (x->array[1] != y->array[1])
1756         return 0;
1757       /* Fall through.  */
1758     case 1:
1759       return x->array[0] == y->array[0];
1760       break;
1761     default:
1762       abort ();
1763     }
1764 }
1765
1766 static INLINE int
1767 cpu_flags_check_cpu64 (i386_cpu_flags f)
1768 {
1769   return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1770            || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1771 }
1772
1773 static INLINE i386_cpu_flags
1774 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1775 {
1776   switch (ARRAY_SIZE (x.array))
1777     {
1778     case 4:
1779       x.array [3] &= y.array [3];
1780       /* Fall through.  */
1781     case 3:
1782       x.array [2] &= y.array [2];
1783       /* Fall through.  */
1784     case 2:
1785       x.array [1] &= y.array [1];
1786       /* Fall through.  */
1787     case 1:
1788       x.array [0] &= y.array [0];
1789       break;
1790     default:
1791       abort ();
1792     }
1793   return x;
1794 }
1795
1796 static INLINE i386_cpu_flags
1797 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1798 {
1799   switch (ARRAY_SIZE (x.array))
1800     {
1801     case 4:
1802       x.array [3] |= y.array [3];
1803       /* Fall through.  */
1804     case 3:
1805       x.array [2] |= y.array [2];
1806       /* Fall through.  */
1807     case 2:
1808       x.array [1] |= y.array [1];
1809       /* Fall through.  */
1810     case 1:
1811       x.array [0] |= y.array [0];
1812       break;
1813     default:
1814       abort ();
1815     }
1816   return x;
1817 }
1818
1819 static INLINE i386_cpu_flags
1820 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1821 {
1822   switch (ARRAY_SIZE (x.array))
1823     {
1824     case 4:
1825       x.array [3] &= ~y.array [3];
1826       /* Fall through.  */
1827     case 3:
1828       x.array [2] &= ~y.array [2];
1829       /* Fall through.  */
1830     case 2:
1831       x.array [1] &= ~y.array [1];
1832       /* Fall through.  */
1833     case 1:
1834       x.array [0] &= ~y.array [0];
1835       break;
1836     default:
1837       abort ();
1838     }
1839   return x;
1840 }
1841
1842 #define CPU_FLAGS_ARCH_MATCH            0x1
1843 #define CPU_FLAGS_64BIT_MATCH           0x2
1844
1845 #define CPU_FLAGS_PERFECT_MATCH \
1846   (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1847
1848 /* Return CPU flags match bits. */
1849
1850 static int
1851 cpu_flags_match (const insn_template *t)
1852 {
1853   i386_cpu_flags x = t->cpu_flags;
1854   int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1855
1856   x.bitfield.cpu64 = 0;
1857   x.bitfield.cpuno64 = 0;
1858
1859   if (cpu_flags_all_zero (&x))
1860     {
1861       /* This instruction is available on all archs.  */
1862       match |= CPU_FLAGS_ARCH_MATCH;
1863     }
1864   else
1865     {
1866       /* This instruction is available only on some archs.  */
1867       i386_cpu_flags cpu = cpu_arch_flags;
1868
1869       /* AVX512VL is no standalone feature - match it and then strip it.  */
1870       if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1871         return match;
1872       x.bitfield.cpuavx512vl = 0;
1873
1874       cpu = cpu_flags_and (x, cpu);
1875       if (!cpu_flags_all_zero (&cpu))
1876         {
1877           if (x.bitfield.cpuavx)
1878             {
1879               /* We need to check a few extra flags with AVX.  */
1880               if (cpu.bitfield.cpuavx
1881                   && (!t->opcode_modifier.sse2avx || sse2avx)
1882                   && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1883                   && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1884                   && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1885                 match |= CPU_FLAGS_ARCH_MATCH;
1886             }
1887           else if (x.bitfield.cpuavx512f)
1888             {
1889               /* We need to check a few extra flags with AVX512F.  */
1890               if (cpu.bitfield.cpuavx512f
1891                   && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1892                   && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1893                   && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1894                 match |= CPU_FLAGS_ARCH_MATCH;
1895             }
1896           else
1897             match |= CPU_FLAGS_ARCH_MATCH;
1898         }
1899     }
1900   return match;
1901 }
1902
1903 static INLINE i386_operand_type
1904 operand_type_and (i386_operand_type x, i386_operand_type y)
1905 {
1906   if (x.bitfield.class != y.bitfield.class)
1907     x.bitfield.class = ClassNone;
1908   if (x.bitfield.instance != y.bitfield.instance)
1909     x.bitfield.instance = InstanceNone;
1910
1911   switch (ARRAY_SIZE (x.array))
1912     {
1913     case 3:
1914       x.array [2] &= y.array [2];
1915       /* Fall through.  */
1916     case 2:
1917       x.array [1] &= y.array [1];
1918       /* Fall through.  */
1919     case 1:
1920       x.array [0] &= y.array [0];
1921       break;
1922     default:
1923       abort ();
1924     }
1925   return x;
1926 }
1927
1928 static INLINE i386_operand_type
1929 operand_type_and_not (i386_operand_type x, i386_operand_type y)
1930 {
1931   gas_assert (y.bitfield.class == ClassNone);
1932   gas_assert (y.bitfield.instance == InstanceNone);
1933
1934   switch (ARRAY_SIZE (x.array))
1935     {
1936     case 3:
1937       x.array [2] &= ~y.array [2];
1938       /* Fall through.  */
1939     case 2:
1940       x.array [1] &= ~y.array [1];
1941       /* Fall through.  */
1942     case 1:
1943       x.array [0] &= ~y.array [0];
1944       break;
1945     default:
1946       abort ();
1947     }
1948   return x;
1949 }
1950
1951 static INLINE i386_operand_type
1952 operand_type_or (i386_operand_type x, i386_operand_type y)
1953 {
1954   gas_assert (x.bitfield.class == ClassNone ||
1955               y.bitfield.class == ClassNone ||
1956               x.bitfield.class == y.bitfield.class);
1957   gas_assert (x.bitfield.instance == InstanceNone ||
1958               y.bitfield.instance == InstanceNone ||
1959               x.bitfield.instance == y.bitfield.instance);
1960
1961   switch (ARRAY_SIZE (x.array))
1962     {
1963     case 3:
1964       x.array [2] |= y.array [2];
1965       /* Fall through.  */
1966     case 2:
1967       x.array [1] |= y.array [1];
1968       /* Fall through.  */
1969     case 1:
1970       x.array [0] |= y.array [0];
1971       break;
1972     default:
1973       abort ();
1974     }
1975   return x;
1976 }
1977
1978 static INLINE i386_operand_type
1979 operand_type_xor (i386_operand_type x, i386_operand_type y)
1980 {
1981   gas_assert (y.bitfield.class == ClassNone);
1982   gas_assert (y.bitfield.instance == InstanceNone);
1983
1984   switch (ARRAY_SIZE (x.array))
1985     {
1986     case 3:
1987       x.array [2] ^= y.array [2];
1988       /* Fall through.  */
1989     case 2:
1990       x.array [1] ^= y.array [1];
1991       /* Fall through.  */
1992     case 1:
1993       x.array [0] ^= y.array [0];
1994       break;
1995     default:
1996       abort ();
1997     }
1998   return x;
1999 }
2000
2001 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
2002 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
2003 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
2004 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
2005 static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
2006 static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
2007 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
2008 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
2009 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
2010 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
2011 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
2012 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
2013 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
2014 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
2015 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
2016 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
2017 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
2018
2019 enum operand_type
2020 {
2021   reg,
2022   imm,
2023   disp,
2024   anymem
2025 };
2026
2027 static INLINE int
2028 operand_type_check (i386_operand_type t, enum operand_type c)
2029 {
2030   switch (c)
2031     {
2032     case reg:
2033       return t.bitfield.class == Reg;
2034
2035     case imm:
2036       return (t.bitfield.imm8
2037               || t.bitfield.imm8s
2038               || t.bitfield.imm16
2039               || t.bitfield.imm32
2040               || t.bitfield.imm32s
2041               || t.bitfield.imm64);
2042
2043     case disp:
2044       return (t.bitfield.disp8
2045               || t.bitfield.disp16
2046               || t.bitfield.disp32
2047               || t.bitfield.disp32s
2048               || t.bitfield.disp64);
2049
2050     case anymem:
2051       return (t.bitfield.disp8
2052               || t.bitfield.disp16
2053               || t.bitfield.disp32
2054               || t.bitfield.disp32s
2055               || t.bitfield.disp64
2056               || t.bitfield.baseindex);
2057
2058     default:
2059       abort ();
2060     }
2061
2062   return 0;
2063 }
2064
2065 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2066    between operand GIVEN and opeand WANTED for instruction template T.  */
2067
2068 static INLINE int
2069 match_operand_size (const insn_template *t, unsigned int wanted,
2070                     unsigned int given)
2071 {
2072   return !((i.types[given].bitfield.byte
2073             && !t->operand_types[wanted].bitfield.byte)
2074            || (i.types[given].bitfield.word
2075                && !t->operand_types[wanted].bitfield.word)
2076            || (i.types[given].bitfield.dword
2077                && !t->operand_types[wanted].bitfield.dword)
2078            || (i.types[given].bitfield.qword
2079                && !t->operand_types[wanted].bitfield.qword)
2080            || (i.types[given].bitfield.tbyte
2081                && !t->operand_types[wanted].bitfield.tbyte));
2082 }
2083
2084 /* Return 1 if there is no conflict in SIMD register between operand
2085    GIVEN and opeand WANTED for instruction template T.  */
2086
2087 static INLINE int
2088 match_simd_size (const insn_template *t, unsigned int wanted,
2089                  unsigned int given)
2090 {
2091   return !((i.types[given].bitfield.xmmword
2092             && !t->operand_types[wanted].bitfield.xmmword)
2093            || (i.types[given].bitfield.ymmword
2094                && !t->operand_types[wanted].bitfield.ymmword)
2095            || (i.types[given].bitfield.zmmword
2096                && !t->operand_types[wanted].bitfield.zmmword));
2097 }
2098
2099 /* Return 1 if there is no conflict in any size between operand GIVEN
2100    and opeand WANTED for instruction template T.  */
2101
2102 static INLINE int
2103 match_mem_size (const insn_template *t, unsigned int wanted,
2104                 unsigned int given)
2105 {
2106   return (match_operand_size (t, wanted, given)
2107           && !((i.types[given].bitfield.unspecified
2108                 && !i.broadcast
2109                 && !t->operand_types[wanted].bitfield.unspecified)
2110                || (i.types[given].bitfield.fword
2111                    && !t->operand_types[wanted].bitfield.fword)
2112                /* For scalar opcode templates to allow register and memory
2113                   operands at the same time, some special casing is needed
2114                   here.  Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2115                   down-conversion vpmov*.  */
2116                || ((t->operand_types[wanted].bitfield.class == RegSIMD
2117                     && !t->opcode_modifier.broadcast
2118                     && (t->operand_types[wanted].bitfield.byte
2119                         || t->operand_types[wanted].bitfield.word
2120                         || t->operand_types[wanted].bitfield.dword
2121                         || t->operand_types[wanted].bitfield.qword))
2122                    ? (i.types[given].bitfield.xmmword
2123                       || i.types[given].bitfield.ymmword
2124                       || i.types[given].bitfield.zmmword)
2125                    : !match_simd_size(t, wanted, given))));
2126 }
2127
2128 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2129    operands for instruction template T, and it has MATCH_REVERSE set if there
2130    is no size conflict on any operands for the template with operands reversed
2131    (and the template allows for reversing in the first place).  */
2132
2133 #define MATCH_STRAIGHT 1
2134 #define MATCH_REVERSE  2
2135
2136 static INLINE unsigned int
2137 operand_size_match (const insn_template *t)
2138 {
2139   unsigned int j, match = MATCH_STRAIGHT;
2140
2141   /* Don't check non-absolute jump instructions.  */
2142   if (t->opcode_modifier.jump
2143       && t->opcode_modifier.jump != JUMP_ABSOLUTE)
2144     return match;
2145
2146   /* Check memory and accumulator operand size.  */
2147   for (j = 0; j < i.operands; j++)
2148     {
2149       if (i.types[j].bitfield.class != Reg
2150           && i.types[j].bitfield.class != RegSIMD
2151           && t->opcode_modifier.anysize)
2152         continue;
2153
2154       if (t->operand_types[j].bitfield.class == Reg
2155           && !match_operand_size (t, j, j))
2156         {
2157           match = 0;
2158           break;
2159         }
2160
2161       if (t->operand_types[j].bitfield.class == RegSIMD
2162           && !match_simd_size (t, j, j))
2163         {
2164           match = 0;
2165           break;
2166         }
2167
2168       if (t->operand_types[j].bitfield.instance == Accum
2169           && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2170         {
2171           match = 0;
2172           break;
2173         }
2174
2175       if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2176         {
2177           match = 0;
2178           break;
2179         }
2180     }
2181
2182   if (!t->opcode_modifier.d)
2183     {
2184 mismatch:
2185       if (!match)
2186         i.error = operand_size_mismatch;
2187       return match;
2188     }
2189
2190   /* Check reverse.  */
2191   gas_assert (i.operands >= 2 && i.operands <= 3);
2192
2193   for (j = 0; j < i.operands; j++)
2194     {
2195       unsigned int given = i.operands - j - 1;
2196
2197       if (t->operand_types[j].bitfield.class == Reg
2198           && !match_operand_size (t, j, given))
2199         goto mismatch;
2200
2201       if (t->operand_types[j].bitfield.class == RegSIMD
2202           && !match_simd_size (t, j, given))
2203         goto mismatch;
2204
2205       if (t->operand_types[j].bitfield.instance == Accum
2206           && (!match_operand_size (t, j, given)
2207               || !match_simd_size (t, j, given)))
2208         goto mismatch;
2209
2210       if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2211         goto mismatch;
2212     }
2213
2214   return match | MATCH_REVERSE;
2215 }
2216
2217 static INLINE int
2218 operand_type_match (i386_operand_type overlap,
2219                     i386_operand_type given)
2220 {
2221   i386_operand_type temp = overlap;
2222
2223   temp.bitfield.unspecified = 0;
2224   temp.bitfield.byte = 0;
2225   temp.bitfield.word = 0;
2226   temp.bitfield.dword = 0;
2227   temp.bitfield.fword = 0;
2228   temp.bitfield.qword = 0;
2229   temp.bitfield.tbyte = 0;
2230   temp.bitfield.xmmword = 0;
2231   temp.bitfield.ymmword = 0;
2232   temp.bitfield.zmmword = 0;
2233   if (operand_type_all_zero (&temp))
2234     goto mismatch;
2235
2236   if (given.bitfield.baseindex == overlap.bitfield.baseindex)
2237     return 1;
2238
2239 mismatch:
2240   i.error = operand_type_mismatch;
2241   return 0;
2242 }
2243
2244 /* If given types g0 and g1 are registers they must be of the same type
2245    unless the expected operand type register overlap is null.
2246    Memory operand size of certain SIMD instructions is also being checked
2247    here.  */
2248
2249 static INLINE int
2250 operand_type_register_match (i386_operand_type g0,
2251                              i386_operand_type t0,
2252                              i386_operand_type g1,
2253                              i386_operand_type t1)
2254 {
2255   if (g0.bitfield.class != Reg
2256       && g0.bitfield.class != RegSIMD
2257       && (!operand_type_check (g0, anymem)
2258           || g0.bitfield.unspecified
2259           || t0.bitfield.class != RegSIMD))
2260     return 1;
2261
2262   if (g1.bitfield.class != Reg
2263       && g1.bitfield.class != RegSIMD
2264       && (!operand_type_check (g1, anymem)
2265           || g1.bitfield.unspecified
2266           || t1.bitfield.class != RegSIMD))
2267     return 1;
2268
2269   if (g0.bitfield.byte == g1.bitfield.byte
2270       && g0.bitfield.word == g1.bitfield.word
2271       && g0.bitfield.dword == g1.bitfield.dword
2272       && g0.bitfield.qword == g1.bitfield.qword
2273       && g0.bitfield.xmmword == g1.bitfield.xmmword
2274       && g0.bitfield.ymmword == g1.bitfield.ymmword
2275       && g0.bitfield.zmmword == g1.bitfield.zmmword)
2276     return 1;
2277
2278   if (!(t0.bitfield.byte & t1.bitfield.byte)
2279       && !(t0.bitfield.word & t1.bitfield.word)
2280       && !(t0.bitfield.dword & t1.bitfield.dword)
2281       && !(t0.bitfield.qword & t1.bitfield.qword)
2282       && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2283       && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2284       && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2285     return 1;
2286
2287   i.error = register_type_mismatch;
2288
2289   return 0;
2290 }
2291
2292 static INLINE unsigned int
2293 register_number (const reg_entry *r)
2294 {
2295   unsigned int nr = r->reg_num;
2296
2297   if (r->reg_flags & RegRex)
2298     nr += 8;
2299
2300   if (r->reg_flags & RegVRex)
2301     nr += 16;
2302
2303   return nr;
2304 }
2305
2306 static INLINE unsigned int
2307 mode_from_disp_size (i386_operand_type t)
2308 {
2309   if (t.bitfield.disp8)
2310     return 1;
2311   else if (t.bitfield.disp16
2312            || t.bitfield.disp32
2313            || t.bitfield.disp32s)
2314     return 2;
2315   else
2316     return 0;
2317 }
2318
2319 static INLINE int
2320 fits_in_signed_byte (addressT num)
2321 {
2322   return num + 0x80 <= 0xff;
2323 }
2324
2325 static INLINE int
2326 fits_in_unsigned_byte (addressT num)
2327 {
2328   return num <= 0xff;
2329 }
2330
2331 static INLINE int
2332 fits_in_unsigned_word (addressT num)
2333 {
2334   return num <= 0xffff;
2335 }
2336
2337 static INLINE int
2338 fits_in_signed_word (addressT num)
2339 {
2340   return num + 0x8000 <= 0xffff;
2341 }
2342
2343 static INLINE int
2344 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2345 {
2346 #ifndef BFD64
2347   return 1;
2348 #else
2349   return num + 0x80000000 <= 0xffffffff;
2350 #endif
2351 }                               /* fits_in_signed_long() */
2352
2353 static INLINE int
2354 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2355 {
2356 #ifndef BFD64
2357   return 1;
2358 #else
2359   return num <= 0xffffffff;
2360 #endif
2361 }                               /* fits_in_unsigned_long() */
2362
2363 static INLINE int
2364 fits_in_disp8 (offsetT num)
2365 {
2366   int shift = i.memshift;
2367   unsigned int mask;
2368
2369   if (shift == -1)
2370     abort ();
2371
2372   mask = (1 << shift) - 1;
2373
2374   /* Return 0 if NUM isn't properly aligned.  */
2375   if ((num & mask))
2376     return 0;
2377
2378   /* Check if NUM will fit in 8bit after shift.  */
2379   return fits_in_signed_byte (num >> shift);
2380 }
2381
2382 static INLINE int
2383 fits_in_imm4 (offsetT num)
2384 {
2385   return (num & 0xf) == num;
2386 }
2387
2388 static i386_operand_type
2389 smallest_imm_type (offsetT num)
2390 {
2391   i386_operand_type t;
2392
2393   operand_type_set (&t, 0);
2394   t.bitfield.imm64 = 1;
2395
2396   if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2397     {
2398       /* This code is disabled on the 486 because all the Imm1 forms
2399          in the opcode table are slower on the i486.  They're the
2400          versions with the implicitly specified single-position
2401          displacement, which has another syntax if you really want to
2402          use that form.  */
2403       t.bitfield.imm1 = 1;
2404       t.bitfield.imm8 = 1;
2405       t.bitfield.imm8s = 1;
2406       t.bitfield.imm16 = 1;
2407       t.bitfield.imm32 = 1;
2408       t.bitfield.imm32s = 1;
2409     }
2410   else if (fits_in_signed_byte (num))
2411     {
2412       t.bitfield.imm8 = 1;
2413       t.bitfield.imm8s = 1;
2414       t.bitfield.imm16 = 1;
2415       t.bitfield.imm32 = 1;
2416       t.bitfield.imm32s = 1;
2417     }
2418   else if (fits_in_unsigned_byte (num))
2419     {
2420       t.bitfield.imm8 = 1;
2421       t.bitfield.imm16 = 1;
2422       t.bitfield.imm32 = 1;
2423       t.bitfield.imm32s = 1;
2424     }
2425   else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2426     {
2427       t.bitfield.imm16 = 1;
2428       t.bitfield.imm32 = 1;
2429       t.bitfield.imm32s = 1;
2430     }
2431   else if (fits_in_signed_long (num))
2432     {
2433       t.bitfield.imm32 = 1;
2434       t.bitfield.imm32s = 1;
2435     }
2436   else if (fits_in_unsigned_long (num))
2437     t.bitfield.imm32 = 1;
2438
2439   return t;
2440 }
2441
2442 static offsetT
2443 offset_in_range (offsetT val, int size)
2444 {
2445   addressT mask;
2446
2447   switch (size)
2448     {
2449     case 1: mask = ((addressT) 1 <<  8) - 1; break;
2450     case 2: mask = ((addressT) 1 << 16) - 1; break;
2451     case 4: mask = ((addressT) 2 << 31) - 1; break;
2452 #ifdef BFD64
2453     case 8: mask = ((addressT) 2 << 63) - 1; break;
2454 #endif
2455     default: abort ();
2456     }
2457
2458 #ifdef BFD64
2459   /* If BFD64, sign extend val for 32bit address mode.  */
2460   if (flag_code != CODE_64BIT
2461       || i.prefix[ADDR_PREFIX])
2462     if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2463       val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2464 #endif
2465
2466   if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2467     {
2468       char buf1[40], buf2[40];
2469
2470       sprint_value (buf1, val);
2471       sprint_value (buf2, val & mask);
2472       as_warn (_("%s shortened to %s"), buf1, buf2);
2473     }
2474   return val & mask;
2475 }
2476
2477 enum PREFIX_GROUP
2478 {
2479   PREFIX_EXIST = 0,
2480   PREFIX_LOCK,
2481   PREFIX_REP,
2482   PREFIX_DS,
2483   PREFIX_OTHER
2484 };
2485
2486 /* Returns
2487    a. PREFIX_EXIST if attempting to add a prefix where one from the
2488    same class already exists.
2489    b. PREFIX_LOCK if lock prefix is added.
2490    c. PREFIX_REP if rep/repne prefix is added.
2491    d. PREFIX_DS if ds prefix is added.
2492    e. PREFIX_OTHER if other prefix is added.
2493  */
2494
2495 static enum PREFIX_GROUP
2496 add_prefix (unsigned int prefix)
2497 {
2498   enum PREFIX_GROUP ret = PREFIX_OTHER;
2499   unsigned int q;
2500
2501   if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2502       && flag_code == CODE_64BIT)
2503     {
2504       if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2505           || (i.prefix[REX_PREFIX] & prefix & REX_R)
2506           || (i.prefix[REX_PREFIX] & prefix & REX_X)
2507           || (i.prefix[REX_PREFIX] & prefix & REX_B))
2508         ret = PREFIX_EXIST;
2509       q = REX_PREFIX;
2510     }
2511   else
2512     {
2513       switch (prefix)
2514         {
2515         default:
2516           abort ();
2517
2518         case DS_PREFIX_OPCODE:
2519           ret = PREFIX_DS;
2520           /* Fall through.  */
2521         case CS_PREFIX_OPCODE:
2522         case ES_PREFIX_OPCODE:
2523         case FS_PREFIX_OPCODE:
2524         case GS_PREFIX_OPCODE:
2525         case SS_PREFIX_OPCODE:
2526           q = SEG_PREFIX;
2527           break;
2528
2529         case REPNE_PREFIX_OPCODE:
2530         case REPE_PREFIX_OPCODE:
2531           q = REP_PREFIX;
2532           ret = PREFIX_REP;
2533           break;
2534
2535         case LOCK_PREFIX_OPCODE:
2536           q = LOCK_PREFIX;
2537           ret = PREFIX_LOCK;
2538           break;
2539
2540         case FWAIT_OPCODE:
2541           q = WAIT_PREFIX;
2542           break;
2543
2544         case ADDR_PREFIX_OPCODE:
2545           q = ADDR_PREFIX;
2546           break;
2547
2548         case DATA_PREFIX_OPCODE:
2549           q = DATA_PREFIX;
2550           break;
2551         }
2552       if (i.prefix[q] != 0)
2553         ret = PREFIX_EXIST;
2554     }
2555
2556   if (ret)
2557     {
2558       if (!i.prefix[q])
2559         ++i.prefixes;
2560       i.prefix[q] |= prefix;
2561     }
2562   else
2563     as_bad (_("same type of prefix used twice"));
2564
2565   return ret;
2566 }
2567
2568 static void
2569 update_code_flag (int value, int check)
2570 {
2571   PRINTF_LIKE ((*as_error));
2572
2573   flag_code = (enum flag_code) value;
2574   if (flag_code == CODE_64BIT)
2575     {
2576       cpu_arch_flags.bitfield.cpu64 = 1;
2577       cpu_arch_flags.bitfield.cpuno64 = 0;
2578     }
2579   else
2580     {
2581       cpu_arch_flags.bitfield.cpu64 = 0;
2582       cpu_arch_flags.bitfield.cpuno64 = 1;
2583     }
2584   if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
2585     {
2586       if (check)
2587         as_error = as_fatal;
2588       else
2589         as_error = as_bad;
2590       (*as_error) (_("64bit mode not supported on `%s'."),
2591                    cpu_arch_name ? cpu_arch_name : default_arch);
2592     }
2593   if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2594     {
2595       if (check)
2596         as_error = as_fatal;
2597       else
2598         as_error = as_bad;
2599       (*as_error) (_("32bit mode not supported on `%s'."),
2600                    cpu_arch_name ? cpu_arch_name : default_arch);
2601     }
2602   stackop_size = '\0';
2603 }
2604
2605 static void
2606 set_code_flag (int value)
2607 {
2608   update_code_flag (value, 0);
2609 }
2610
2611 static void
2612 set_16bit_gcc_code_flag (int new_code_flag)
2613 {
2614   flag_code = (enum flag_code) new_code_flag;
2615   if (flag_code != CODE_16BIT)
2616     abort ();
2617   cpu_arch_flags.bitfield.cpu64 = 0;
2618   cpu_arch_flags.bitfield.cpuno64 = 1;
2619   stackop_size = LONG_MNEM_SUFFIX;
2620 }
2621
2622 static void
2623 set_intel_syntax (int syntax_flag)
2624 {
2625   /* Find out if register prefixing is specified.  */
2626   int ask_naked_reg = 0;
2627
2628   SKIP_WHITESPACE ();
2629   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2630     {
2631       char *string;
2632       int e = get_symbol_name (&string);
2633
2634       if (strcmp (string, "prefix") == 0)
2635         ask_naked_reg = 1;
2636       else if (strcmp (string, "noprefix") == 0)
2637         ask_naked_reg = -1;
2638       else
2639         as_bad (_("bad argument to syntax directive."));
2640       (void) restore_line_pointer (e);
2641     }
2642   demand_empty_rest_of_line ();
2643
2644   intel_syntax = syntax_flag;
2645
2646   if (ask_naked_reg == 0)
2647     allow_naked_reg = (intel_syntax
2648                        && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2649   else
2650     allow_naked_reg = (ask_naked_reg < 0);
2651
2652   expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2653
2654   identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2655   identifier_chars['$'] = intel_syntax ? '$' : 0;
2656   register_prefix = allow_naked_reg ? "" : "%";
2657 }
2658
2659 static void
2660 set_intel_mnemonic (int mnemonic_flag)
2661 {
2662   intel_mnemonic = mnemonic_flag;
2663 }
2664
2665 static void
2666 set_allow_index_reg (int flag)
2667 {
2668   allow_index_reg = flag;
2669 }
2670
2671 static void
2672 set_check (int what)
2673 {
2674   enum check_kind *kind;
2675   const char *str;
2676
2677   if (what)
2678     {
2679       kind = &operand_check;
2680       str = "operand";
2681     }
2682   else
2683     {
2684       kind = &sse_check;
2685       str = "sse";
2686     }
2687
2688   SKIP_WHITESPACE ();
2689
2690   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2691     {
2692       char *string;
2693       int e = get_symbol_name (&string);
2694
2695       if (strcmp (string, "none") == 0)
2696         *kind = check_none;
2697       else if (strcmp (string, "warning") == 0)
2698         *kind = check_warning;
2699       else if (strcmp (string, "error") == 0)
2700         *kind = check_error;
2701       else
2702         as_bad (_("bad argument to %s_check directive."), str);
2703       (void) restore_line_pointer (e);
2704     }
2705   else
2706     as_bad (_("missing argument for %s_check directive"), str);
2707
2708   demand_empty_rest_of_line ();
2709 }
2710
2711 static void
2712 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2713                            i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2714 {
2715 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2716   static const char *arch;
2717
2718   /* Intel LIOM is only supported on ELF.  */
2719   if (!IS_ELF)
2720     return;
2721
2722   if (!arch)
2723     {
2724       /* Use cpu_arch_name if it is set in md_parse_option.  Otherwise
2725          use default_arch.  */
2726       arch = cpu_arch_name;
2727       if (!arch)
2728         arch = default_arch;
2729     }
2730
2731   /* If we are targeting Intel MCU, we must enable it.  */
2732   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2733       || new_flag.bitfield.cpuiamcu)
2734     return;
2735
2736   /* If we are targeting Intel L1OM, we must enable it.  */
2737   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2738       || new_flag.bitfield.cpul1om)
2739     return;
2740
2741   /* If we are targeting Intel K1OM, we must enable it.  */
2742   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2743       || new_flag.bitfield.cpuk1om)
2744     return;
2745
2746   as_bad (_("`%s' is not supported on `%s'"), name, arch);
2747 #endif
2748 }
2749
2750 static void
2751 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2752 {
2753   SKIP_WHITESPACE ();
2754
2755   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2756     {
2757       char *string;
2758       int e = get_symbol_name (&string);
2759       unsigned int j;
2760       i386_cpu_flags flags;
2761
2762       for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2763         {
2764           if (strcmp (string, cpu_arch[j].name) == 0)
2765             {
2766               check_cpu_arch_compatible (string, cpu_arch[j].flags);
2767
2768               if (*string != '.')
2769                 {
2770                   cpu_arch_name = cpu_arch[j].name;
2771                   cpu_sub_arch_name = NULL;
2772                   cpu_arch_flags = cpu_arch[j].flags;
2773                   if (flag_code == CODE_64BIT)
2774                     {
2775                       cpu_arch_flags.bitfield.cpu64 = 1;
2776                       cpu_arch_flags.bitfield.cpuno64 = 0;
2777                     }
2778                   else
2779                     {
2780                       cpu_arch_flags.bitfield.cpu64 = 0;
2781                       cpu_arch_flags.bitfield.cpuno64 = 1;
2782                     }
2783                   cpu_arch_isa = cpu_arch[j].type;
2784                   cpu_arch_isa_flags = cpu_arch[j].flags;
2785                   if (!cpu_arch_tune_set)
2786                     {
2787                       cpu_arch_tune = cpu_arch_isa;
2788                       cpu_arch_tune_flags = cpu_arch_isa_flags;
2789                     }
2790                   break;
2791                 }
2792
2793               flags = cpu_flags_or (cpu_arch_flags,
2794                                     cpu_arch[j].flags);
2795
2796               if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2797                 {
2798                   if (cpu_sub_arch_name)
2799                     {
2800                       char *name = cpu_sub_arch_name;
2801                       cpu_sub_arch_name = concat (name,
2802                                                   cpu_arch[j].name,
2803                                                   (const char *) NULL);
2804                       free (name);
2805                     }
2806                   else
2807                     cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2808                   cpu_arch_flags = flags;
2809                   cpu_arch_isa_flags = flags;
2810                 }
2811               else
2812                 cpu_arch_isa_flags
2813                   = cpu_flags_or (cpu_arch_isa_flags,
2814                                   cpu_arch[j].flags);
2815               (void) restore_line_pointer (e);
2816               demand_empty_rest_of_line ();
2817               return;
2818             }
2819         }
2820
2821       if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2822         {
2823           /* Disable an ISA extension.  */
2824           for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2825             if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2826               {
2827                 flags = cpu_flags_and_not (cpu_arch_flags,
2828                                            cpu_noarch[j].flags);
2829                 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2830                   {
2831                     if (cpu_sub_arch_name)
2832                       {
2833                         char *name = cpu_sub_arch_name;
2834                         cpu_sub_arch_name = concat (name, string,
2835                                                     (const char *) NULL);
2836                         free (name);
2837                       }
2838                     else
2839                       cpu_sub_arch_name = xstrdup (string);
2840                     cpu_arch_flags = flags;
2841                     cpu_arch_isa_flags = flags;
2842                   }
2843                 (void) restore_line_pointer (e);
2844                 demand_empty_rest_of_line ();
2845                 return;
2846               }
2847
2848           j = ARRAY_SIZE (cpu_arch);
2849         }
2850
2851       if (j >= ARRAY_SIZE (cpu_arch))
2852         as_bad (_("no such architecture: `%s'"), string);
2853
2854       *input_line_pointer = e;
2855     }
2856   else
2857     as_bad (_("missing cpu architecture"));
2858
2859   no_cond_jump_promotion = 0;
2860   if (*input_line_pointer == ','
2861       && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2862     {
2863       char *string;
2864       char e;
2865
2866       ++input_line_pointer;
2867       e = get_symbol_name (&string);
2868
2869       if (strcmp (string, "nojumps") == 0)
2870         no_cond_jump_promotion = 1;
2871       else if (strcmp (string, "jumps") == 0)
2872         ;
2873       else
2874         as_bad (_("no such architecture modifier: `%s'"), string);
2875
2876       (void) restore_line_pointer (e);
2877     }
2878
2879   demand_empty_rest_of_line ();
2880 }
2881
2882 enum bfd_architecture
2883 i386_arch (void)
2884 {
2885   if (cpu_arch_isa == PROCESSOR_L1OM)
2886     {
2887       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2888           || flag_code != CODE_64BIT)
2889         as_fatal (_("Intel L1OM is 64bit ELF only"));
2890       return bfd_arch_l1om;
2891     }
2892   else if (cpu_arch_isa == PROCESSOR_K1OM)
2893     {
2894       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2895           || flag_code != CODE_64BIT)
2896         as_fatal (_("Intel K1OM is 64bit ELF only"));
2897       return bfd_arch_k1om;
2898     }
2899   else if (cpu_arch_isa == PROCESSOR_IAMCU)
2900     {
2901       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2902           || flag_code == CODE_64BIT)
2903         as_fatal (_("Intel MCU is 32bit ELF only"));
2904       return bfd_arch_iamcu;
2905     }
2906   else
2907     return bfd_arch_i386;
2908 }
2909
2910 unsigned long
2911 i386_mach (void)
2912 {
2913   if (!strncmp (default_arch, "x86_64", 6))
2914     {
2915       if (cpu_arch_isa == PROCESSOR_L1OM)
2916         {
2917           if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2918               || default_arch[6] != '\0')
2919             as_fatal (_("Intel L1OM is 64bit ELF only"));
2920           return bfd_mach_l1om;
2921         }
2922       else if (cpu_arch_isa == PROCESSOR_K1OM)
2923         {
2924           if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2925               || default_arch[6] != '\0')
2926             as_fatal (_("Intel K1OM is 64bit ELF only"));
2927           return bfd_mach_k1om;
2928         }
2929       else if (default_arch[6] == '\0')
2930         return bfd_mach_x86_64;
2931       else
2932         return bfd_mach_x64_32;
2933     }
2934   else if (!strcmp (default_arch, "i386")
2935            || !strcmp (default_arch, "iamcu"))
2936     {
2937       if (cpu_arch_isa == PROCESSOR_IAMCU)
2938         {
2939           if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
2940             as_fatal (_("Intel MCU is 32bit ELF only"));
2941           return bfd_mach_i386_iamcu;
2942         }
2943       else
2944         return bfd_mach_i386_i386;
2945     }
2946   else
2947     as_fatal (_("unknown architecture"));
2948 }
2949 \f
2950 void
2951 md_begin (void)
2952 {
2953   const char *hash_err;
2954
2955   /* Support pseudo prefixes like {disp32}.  */
2956   lex_type ['{'] = LEX_BEGIN_NAME;
2957
2958   /* Initialize op_hash hash table.  */
2959   op_hash = hash_new ();
2960
2961   {
2962     const insn_template *optab;
2963     templates *core_optab;
2964
2965     /* Setup for loop.  */
2966     optab = i386_optab;
2967     core_optab = XNEW (templates);
2968     core_optab->start = optab;
2969
2970     while (1)
2971       {
2972         ++optab;
2973         if (optab->name == NULL
2974             || strcmp (optab->name, (optab - 1)->name) != 0)
2975           {
2976             /* different name --> ship out current template list;
2977                add to hash table; & begin anew.  */
2978             core_optab->end = optab;
2979             hash_err = hash_insert (op_hash,
2980                                     (optab - 1)->name,
2981                                     (void *) core_optab);
2982             if (hash_err)
2983               {
2984                 as_fatal (_("can't hash %s: %s"),
2985                           (optab - 1)->name,
2986                           hash_err);
2987               }
2988             if (optab->name == NULL)
2989               break;
2990             core_optab = XNEW (templates);
2991             core_optab->start = optab;
2992           }
2993       }
2994   }
2995
2996   /* Initialize reg_hash hash table.  */
2997   reg_hash = hash_new ();
2998   {
2999     const reg_entry *regtab;
3000     unsigned int regtab_size = i386_regtab_size;
3001
3002     for (regtab = i386_regtab; regtab_size--; regtab++)
3003       {
3004         hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
3005         if (hash_err)
3006           as_fatal (_("can't hash %s: %s"),
3007                     regtab->reg_name,
3008                     hash_err);
3009       }
3010   }
3011
3012   /* Fill in lexical tables:  mnemonic_chars, operand_chars.  */
3013   {
3014     int c;
3015     char *p;
3016
3017     for (c = 0; c < 256; c++)
3018       {
3019         if (ISDIGIT (c))
3020           {
3021             digit_chars[c] = c;
3022             mnemonic_chars[c] = c;
3023             register_chars[c] = c;
3024             operand_chars[c] = c;
3025           }
3026         else if (ISLOWER (c))
3027           {
3028             mnemonic_chars[c] = c;
3029             register_chars[c] = c;
3030             operand_chars[c] = c;
3031           }
3032         else if (ISUPPER (c))
3033           {
3034             mnemonic_chars[c] = TOLOWER (c);
3035             register_chars[c] = mnemonic_chars[c];
3036             operand_chars[c] = c;
3037           }
3038         else if (c == '{' || c == '}')
3039           {
3040             mnemonic_chars[c] = c;
3041             operand_chars[c] = c;
3042           }
3043
3044         if (ISALPHA (c) || ISDIGIT (c))
3045           identifier_chars[c] = c;
3046         else if (c >= 128)
3047           {
3048             identifier_chars[c] = c;
3049             operand_chars[c] = c;
3050           }
3051       }
3052
3053 #ifdef LEX_AT
3054     identifier_chars['@'] = '@';
3055 #endif
3056 #ifdef LEX_QM
3057     identifier_chars['?'] = '?';
3058     operand_chars['?'] = '?';
3059 #endif
3060     digit_chars['-'] = '-';
3061     mnemonic_chars['_'] = '_';
3062     mnemonic_chars['-'] = '-';
3063     mnemonic_chars['.'] = '.';
3064     identifier_chars['_'] = '_';
3065     identifier_chars['.'] = '.';
3066
3067     for (p = operand_special_chars; *p != '\0'; p++)
3068       operand_chars[(unsigned char) *p] = *p;
3069   }
3070
3071   if (flag_code == CODE_64BIT)
3072     {
3073 #if defined (OBJ_COFF) && defined (TE_PE)
3074       x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3075                                   ? 32 : 16);
3076 #else
3077       x86_dwarf2_return_column = 16;
3078 #endif
3079       x86_cie_data_alignment = -8;
3080     }
3081   else
3082     {
3083       x86_dwarf2_return_column = 8;
3084       x86_cie_data_alignment = -4;
3085     }
3086
3087   /* NB: FUSED_JCC_PADDING frag must have sufficient room so that it
3088      can be turned into BRANCH_PREFIX frag.  */
3089   if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3090     abort ();
3091 }
3092
3093 void
3094 i386_print_statistics (FILE *file)
3095 {
3096   hash_print_statistics (file, "i386 opcode", op_hash);
3097   hash_print_statistics (file, "i386 register", reg_hash);
3098 }
3099 \f
3100 #ifdef DEBUG386
3101
3102 /* Debugging routines for md_assemble.  */
3103 static void pte (insn_template *);
3104 static void pt (i386_operand_type);
3105 static void pe (expressionS *);
3106 static void ps (symbolS *);
3107
3108 static void
3109 pi (const char *line, i386_insn *x)
3110 {
3111   unsigned int j;
3112
3113   fprintf (stdout, "%s: template ", line);
3114   pte (&x->tm);
3115   fprintf (stdout, "  address: base %s  index %s  scale %x\n",
3116            x->base_reg ? x->base_reg->reg_name : "none",
3117            x->index_reg ? x->index_reg->reg_name : "none",
3118            x->log2_scale_factor);
3119   fprintf (stdout, "  modrm:  mode %x  reg %x  reg/mem %x\n",
3120            x->rm.mode, x->rm.reg, x->rm.regmem);
3121   fprintf (stdout, "  sib:  base %x  index %x  scale %x\n",
3122            x->sib.base, x->sib.index, x->sib.scale);
3123   fprintf (stdout, "  rex: 64bit %x  extX %x  extY %x  extZ %x\n",
3124            (x->rex & REX_W) != 0,
3125            (x->rex & REX_R) != 0,
3126            (x->rex & REX_X) != 0,
3127            (x->rex & REX_B) != 0);
3128   for (j = 0; j < x->operands; j++)
3129     {
3130       fprintf (stdout, "    #%d:  ", j + 1);
3131       pt (x->types[j]);
3132       fprintf (stdout, "\n");
3133       if (x->types[j].bitfield.class == Reg
3134           || x->types[j].bitfield.class == RegMMX
3135           || x->types[j].bitfield.class == RegSIMD
3136           || x->types[j].bitfield.class == SReg
3137           || x->types[j].bitfield.class == RegCR
3138           || x->types[j].bitfield.class == RegDR
3139           || x->types[j].bitfield.class == RegTR)
3140         fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3141       if (operand_type_check (x->types[j], imm))
3142         pe (x->op[j].imms);
3143       if (operand_type_check (x->types[j], disp))
3144         pe (x->op[j].disps);
3145     }
3146 }
3147
3148 static void
3149 pte (insn_template *t)
3150 {
3151   unsigned int j;
3152   fprintf (stdout, " %d operands ", t->operands);
3153   fprintf (stdout, "opcode %x ", t->base_opcode);
3154   if (t->extension_opcode != None)
3155     fprintf (stdout, "ext %x ", t->extension_opcode);
3156   if (t->opcode_modifier.d)
3157     fprintf (stdout, "D");
3158   if (t->opcode_modifier.w)
3159     fprintf (stdout, "W");
3160   fprintf (stdout, "\n");
3161   for (j = 0; j < t->operands; j++)
3162     {
3163       fprintf (stdout, "    #%d type ", j + 1);
3164       pt (t->operand_types[j]);
3165       fprintf (stdout, "\n");
3166     }
3167 }
3168
3169 static void
3170 pe (expressionS *e)
3171 {
3172   fprintf (stdout, "    operation     %d\n", e->X_op);
3173   fprintf (stdout, "    add_number    %ld (%lx)\n",
3174            (long) e->X_add_number, (long) e->X_add_number);
3175   if (e->X_add_symbol)
3176     {
3177       fprintf (stdout, "    add_symbol    ");
3178       ps (e->X_add_symbol);
3179       fprintf (stdout, "\n");
3180     }
3181   if (e->X_op_symbol)
3182     {
3183       fprintf (stdout, "    op_symbol    ");
3184       ps (e->X_op_symbol);
3185       fprintf (stdout, "\n");
3186     }
3187 }
3188
3189 static void
3190 ps (symbolS *s)
3191 {
3192   fprintf (stdout, "%s type %s%s",
3193            S_GET_NAME (s),
3194            S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3195            segment_name (S_GET_SEGMENT (s)));
3196 }
3197
3198 static struct type_name
3199   {
3200     i386_operand_type mask;
3201     const char *name;
3202   }
3203 const type_names[] =
3204 {
3205   { OPERAND_TYPE_REG8, "r8" },
3206   { OPERAND_TYPE_REG16, "r16" },
3207   { OPERAND_TYPE_REG32, "r32" },
3208   { OPERAND_TYPE_REG64, "r64" },
3209   { OPERAND_TYPE_ACC8, "acc8" },
3210   { OPERAND_TYPE_ACC16, "acc16" },
3211   { OPERAND_TYPE_ACC32, "acc32" },
3212   { OPERAND_TYPE_ACC64, "acc64" },
3213   { OPERAND_TYPE_IMM8, "i8" },
3214   { OPERAND_TYPE_IMM8, "i8s" },
3215   { OPERAND_TYPE_IMM16, "i16" },
3216   { OPERAND_TYPE_IMM32, "i32" },
3217   { OPERAND_TYPE_IMM32S, "i32s" },
3218   { OPERAND_TYPE_IMM64, "i64" },
3219   { OPERAND_TYPE_IMM1, "i1" },
3220   { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3221   { OPERAND_TYPE_DISP8, "d8" },
3222   { OPERAND_TYPE_DISP16, "d16" },
3223   { OPERAND_TYPE_DISP32, "d32" },
3224   { OPERAND_TYPE_DISP32S, "d32s" },
3225   { OPERAND_TYPE_DISP64, "d64" },
3226   { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3227   { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3228   { OPERAND_TYPE_CONTROL, "control reg" },
3229   { OPERAND_TYPE_TEST, "test reg" },
3230   { OPERAND_TYPE_DEBUG, "debug reg" },
3231   { OPERAND_TYPE_FLOATREG, "FReg" },
3232   { OPERAND_TYPE_FLOATACC, "FAcc" },
3233   { OPERAND_TYPE_SREG, "SReg" },
3234   { OPERAND_TYPE_REGMMX, "rMMX" },
3235   { OPERAND_TYPE_REGXMM, "rXMM" },
3236   { OPERAND_TYPE_REGYMM, "rYMM" },
3237   { OPERAND_TYPE_REGZMM, "rZMM" },
3238   { OPERAND_TYPE_REGMASK, "Mask reg" },
3239 };
3240
3241 static void
3242 pt (i386_operand_type t)
3243 {
3244   unsigned int j;
3245   i386_operand_type a;
3246
3247   for (j = 0; j < ARRAY_SIZE (type_names); j++)
3248     {
3249       a = operand_type_and (t, type_names[j].mask);
3250       if (operand_type_equal (&a, &type_names[j].mask))
3251         fprintf (stdout, "%s, ",  type_names[j].name);
3252     }
3253   fflush (stdout);
3254 }
3255
3256 #endif /* DEBUG386 */
3257 \f
3258 static bfd_reloc_code_real_type
3259 reloc (unsigned int size,
3260        int pcrel,
3261        int sign,
3262        bfd_reloc_code_real_type other)
3263 {
3264   if (other != NO_RELOC)
3265     {
3266       reloc_howto_type *rel;
3267
3268       if (size == 8)
3269         switch (other)
3270           {
3271           case BFD_RELOC_X86_64_GOT32:
3272             return BFD_RELOC_X86_64_GOT64;
3273             break;
3274           case BFD_RELOC_X86_64_GOTPLT64:
3275             return BFD_RELOC_X86_64_GOTPLT64;
3276             break;
3277           case BFD_RELOC_X86_64_PLTOFF64:
3278             return BFD_RELOC_X86_64_PLTOFF64;
3279             break;
3280           case BFD_RELOC_X86_64_GOTPC32:
3281             other = BFD_RELOC_X86_64_GOTPC64;
3282             break;
3283           case BFD_RELOC_X86_64_GOTPCREL:
3284             other = BFD_RELOC_X86_64_GOTPCREL64;
3285             break;
3286           case BFD_RELOC_X86_64_TPOFF32:
3287             other = BFD_RELOC_X86_64_TPOFF64;
3288             break;
3289           case BFD_RELOC_X86_64_DTPOFF32:
3290             other = BFD_RELOC_X86_64_DTPOFF64;
3291             break;
3292           default:
3293             break;
3294           }
3295
3296 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3297       if (other == BFD_RELOC_SIZE32)
3298         {
3299           if (size == 8)
3300             other = BFD_RELOC_SIZE64;
3301           if (pcrel)
3302             {
3303               as_bad (_("there are no pc-relative size relocations"));
3304               return NO_RELOC;
3305             }
3306         }
3307 #endif
3308
3309       /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless.  */
3310       if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3311         sign = -1;
3312
3313       rel = bfd_reloc_type_lookup (stdoutput, other);
3314       if (!rel)
3315         as_bad (_("unknown relocation (%u)"), other);
3316       else if (size != bfd_get_reloc_size (rel))
3317         as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3318                 bfd_get_reloc_size (rel),
3319                 size);
3320       else if (pcrel && !rel->pc_relative)
3321         as_bad (_("non-pc-relative relocation for pc-relative field"));
3322       else if ((rel->complain_on_overflow == complain_overflow_signed
3323                 && !sign)
3324                || (rel->complain_on_overflow == complain_overflow_unsigned
3325                    && sign > 0))
3326         as_bad (_("relocated field and relocation type differ in signedness"));
3327       else
3328         return other;
3329       return NO_RELOC;
3330     }
3331
3332   if (pcrel)
3333     {
3334       if (!sign)
3335         as_bad (_("there are no unsigned pc-relative relocations"));
3336       switch (size)
3337         {
3338         case 1: return BFD_RELOC_8_PCREL;
3339         case 2: return BFD_RELOC_16_PCREL;
3340         case 4: return BFD_RELOC_32_PCREL;
3341         case 8: return BFD_RELOC_64_PCREL;
3342         }
3343       as_bad (_("cannot do %u byte pc-relative relocation"), size);
3344     }
3345   else
3346     {
3347       if (sign > 0)
3348         switch (size)
3349           {
3350           case 4: return BFD_RELOC_X86_64_32S;
3351           }
3352       else
3353         switch (size)
3354           {
3355           case 1: return BFD_RELOC_8;
3356           case 2: return BFD_RELOC_16;
3357           case 4: return BFD_RELOC_32;
3358           case 8: return BFD_RELOC_64;
3359           }
3360       as_bad (_("cannot do %s %u byte relocation"),
3361               sign > 0 ? "signed" : "unsigned", size);
3362     }
3363
3364   return NO_RELOC;
3365 }
3366
3367 /* Here we decide which fixups can be adjusted to make them relative to
3368    the beginning of the section instead of the symbol.  Basically we need
3369    to make sure that the dynamic relocations are done correctly, so in
3370    some cases we force the original symbol to be used.  */
3371
3372 int
3373 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3374 {
3375 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3376   if (!IS_ELF)
3377     return 1;
3378
3379   /* Don't adjust pc-relative references to merge sections in 64-bit
3380      mode.  */
3381   if (use_rela_relocations
3382       && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3383       && fixP->fx_pcrel)
3384     return 0;
3385
3386   /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3387      and changed later by validate_fix.  */
3388   if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3389       && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3390     return 0;
3391
3392   /* Adjust_reloc_syms doesn't know about the GOT.  Need to keep symbol
3393      for size relocations.  */
3394   if (fixP->fx_r_type == BFD_RELOC_SIZE32
3395       || fixP->fx_r_type == BFD_RELOC_SIZE64
3396       || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3397       || fixP->fx_r_type == BFD_RELOC_386_PLT32
3398       || fixP->fx_r_type == BFD_RELOC_386_GOT32
3399       || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3400       || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3401       || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3402       || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3403       || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3404       || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3405       || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3406       || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3407       || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3408       || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3409       || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3410       || fixP->fx_r_type == BFD_RELOC_X86_64_PLT32
3411       || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3412       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3413       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3414       || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3415       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3416       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3417       || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3418       || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3419       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3420       || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3421       || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3422       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3423       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3424       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3425       || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3426       || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3427     return 0;
3428 #endif
3429   return 1;
3430 }
3431
3432 static int
3433 intel_float_operand (const char *mnemonic)
3434 {
3435   /* Note that the value returned is meaningful only for opcodes with (memory)
3436      operands, hence the code here is free to improperly handle opcodes that
3437      have no operands (for better performance and smaller code). */
3438
3439   if (mnemonic[0] != 'f')
3440     return 0; /* non-math */
3441
3442   switch (mnemonic[1])
3443     {
3444     /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3445        the fs segment override prefix not currently handled because no
3446        call path can make opcodes without operands get here */
3447     case 'i':
3448       return 2 /* integer op */;
3449     case 'l':
3450       if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3451         return 3; /* fldcw/fldenv */
3452       break;
3453     case 'n':
3454       if (mnemonic[2] != 'o' /* fnop */)
3455         return 3; /* non-waiting control op */
3456       break;
3457     case 'r':
3458       if (mnemonic[2] == 's')
3459         return 3; /* frstor/frstpm */
3460       break;
3461     case 's':
3462       if (mnemonic[2] == 'a')
3463         return 3; /* fsave */
3464       if (mnemonic[2] == 't')
3465         {
3466           switch (mnemonic[3])
3467             {
3468             case 'c': /* fstcw */
3469             case 'd': /* fstdw */
3470             case 'e': /* fstenv */
3471             case 's': /* fsts[gw] */
3472               return 3;
3473             }
3474         }
3475       break;
3476     case 'x':
3477       if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3478         return 0; /* fxsave/fxrstor are not really math ops */
3479       break;
3480     }
3481
3482   return 1;
3483 }
3484
3485 /* Build the VEX prefix.  */
3486
3487 static void
3488 build_vex_prefix (const insn_template *t)
3489 {
3490   unsigned int register_specifier;
3491   unsigned int implied_prefix;
3492   unsigned int vector_length;
3493   unsigned int w;
3494
3495   /* Check register specifier.  */
3496   if (i.vex.register_specifier)
3497     {
3498       register_specifier =
3499         ~register_number (i.vex.register_specifier) & 0xf;
3500       gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3501     }
3502   else
3503     register_specifier = 0xf;
3504
3505   /* Use 2-byte VEX prefix by swapping destination and source operand
3506      if there are more than 1 register operand.  */
3507   if (i.reg_operands > 1
3508       && i.vec_encoding != vex_encoding_vex3
3509       && i.dir_encoding == dir_encoding_default
3510       && i.operands == i.reg_operands
3511       && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3512       && i.tm.opcode_modifier.vexopcode == VEX0F
3513       && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3514       && i.rex == REX_B)
3515     {
3516       unsigned int xchg = i.operands - 1;
3517       union i386_op temp_op;
3518       i386_operand_type temp_type;
3519
3520       temp_type = i.types[xchg];
3521       i.types[xchg] = i.types[0];
3522       i.types[0] = temp_type;
3523       temp_op = i.op[xchg];
3524       i.op[xchg] = i.op[0];
3525       i.op[0] = temp_op;
3526
3527       gas_assert (i.rm.mode == 3);
3528
3529       i.rex = REX_R;
3530       xchg = i.rm.regmem;
3531       i.rm.regmem = i.rm.reg;
3532       i.rm.reg = xchg;
3533
3534       if (i.tm.opcode_modifier.d)
3535         i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3536                             ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3537       else /* Use the next insn.  */
3538         i.tm = t[1];
3539     }
3540
3541   /* Use 2-byte VEX prefix by swapping commutative source operands if there
3542      are no memory operands and at least 3 register ones.  */
3543   if (i.reg_operands >= 3
3544       && i.vec_encoding != vex_encoding_vex3
3545       && i.reg_operands == i.operands - i.imm_operands
3546       && i.tm.opcode_modifier.vex
3547       && i.tm.opcode_modifier.commutative
3548       && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3549       && i.rex == REX_B
3550       && i.vex.register_specifier
3551       && !(i.vex.register_specifier->reg_flags & RegRex))
3552     {
3553       unsigned int xchg = i.operands - i.reg_operands;
3554       union i386_op temp_op;
3555       i386_operand_type temp_type;
3556
3557       gas_assert (i.tm.opcode_modifier.vexopcode == VEX0F);
3558       gas_assert (!i.tm.opcode_modifier.sae);
3559       gas_assert (operand_type_equal (&i.types[i.operands - 2],
3560                                       &i.types[i.operands - 3]));
3561       gas_assert (i.rm.mode == 3);
3562
3563       temp_type = i.types[xchg];
3564       i.types[xchg] = i.types[xchg + 1];
3565       i.types[xchg + 1] = temp_type;
3566       temp_op = i.op[xchg];
3567       i.op[xchg] = i.op[xchg + 1];
3568       i.op[xchg + 1] = temp_op;
3569
3570       i.rex = 0;
3571       xchg = i.rm.regmem | 8;
3572       i.rm.regmem = ~register_specifier & 0xf;
3573       gas_assert (!(i.rm.regmem & 8));
3574       i.vex.register_specifier += xchg - i.rm.regmem;
3575       register_specifier = ~xchg & 0xf;
3576     }
3577
3578   if (i.tm.opcode_modifier.vex == VEXScalar)
3579     vector_length = avxscalar;
3580   else if (i.tm.opcode_modifier.vex == VEX256)
3581     vector_length = 1;
3582   else
3583     {
3584       unsigned int op;
3585
3586       /* Determine vector length from the last multi-length vector
3587          operand.  */
3588       vector_length = 0;
3589       for (op = t->operands; op--;)
3590         if (t->operand_types[op].bitfield.xmmword
3591             && t->operand_types[op].bitfield.ymmword
3592             && i.types[op].bitfield.ymmword)
3593           {
3594             vector_length = 1;
3595             break;
3596           }
3597     }
3598
3599   switch ((i.tm.base_opcode >> 8) & 0xff)
3600     {
3601     case 0:
3602       implied_prefix = 0;
3603       break;
3604     case DATA_PREFIX_OPCODE:
3605       implied_prefix = 1;
3606       break;
3607     case REPE_PREFIX_OPCODE:
3608       implied_prefix = 2;
3609       break;
3610     case REPNE_PREFIX_OPCODE:
3611       implied_prefix = 3;
3612       break;
3613     default:
3614       abort ();
3615     }
3616
3617   /* Check the REX.W bit and VEXW.  */
3618   if (i.tm.opcode_modifier.vexw == VEXWIG)
3619     w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3620   else if (i.tm.opcode_modifier.vexw)
3621     w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3622   else
3623     w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3624
3625   /* Use 2-byte VEX prefix if possible.  */
3626   if (w == 0
3627       && i.vec_encoding != vex_encoding_vex3
3628       && i.tm.opcode_modifier.vexopcode == VEX0F
3629       && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3630     {
3631       /* 2-byte VEX prefix.  */
3632       unsigned int r;
3633
3634       i.vex.length = 2;
3635       i.vex.bytes[0] = 0xc5;
3636
3637       /* Check the REX.R bit.  */
3638       r = (i.rex & REX_R) ? 0 : 1;
3639       i.vex.bytes[1] = (r << 7
3640                         | register_specifier << 3
3641                         | vector_length << 2
3642                         | implied_prefix);
3643     }
3644   else
3645     {
3646       /* 3-byte VEX prefix.  */
3647       unsigned int m;
3648
3649       i.vex.length = 3;
3650
3651       switch (i.tm.opcode_modifier.vexopcode)
3652         {
3653         case VEX0F:
3654           m = 0x1;
3655           i.vex.bytes[0] = 0xc4;
3656           break;
3657         case VEX0F38:
3658           m = 0x2;
3659           i.vex.bytes[0] = 0xc4;
3660           break;
3661         case VEX0F3A:
3662           m = 0x3;
3663           i.vex.bytes[0] = 0xc4;
3664           break;
3665         case XOP08:
3666           m = 0x8;
3667           i.vex.bytes[0] = 0x8f;
3668           break;
3669         case XOP09:
3670           m = 0x9;
3671           i.vex.bytes[0] = 0x8f;
3672           break;
3673         case XOP0A:
3674           m = 0xa;
3675           i.vex.bytes[0] = 0x8f;
3676           break;
3677         default:
3678           abort ();
3679         }
3680
3681       /* The high 3 bits of the second VEX byte are 1's compliment
3682          of RXB bits from REX.  */
3683       i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3684
3685       i.vex.bytes[2] = (w << 7
3686                         | register_specifier << 3
3687                         | vector_length << 2
3688                         | implied_prefix);
3689     }
3690 }
3691
3692 static INLINE bfd_boolean
3693 is_evex_encoding (const insn_template *t)
3694 {
3695   return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3696          || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3697          || t->opcode_modifier.sae;
3698 }
3699
3700 static INLINE bfd_boolean
3701 is_any_vex_encoding (const insn_template *t)
3702 {
3703   return t->opcode_modifier.vex || t->opcode_modifier.vexopcode
3704          || is_evex_encoding (t);
3705 }
3706
3707 /* Build the EVEX prefix.  */
3708
3709 static void
3710 build_evex_prefix (void)
3711 {
3712   unsigned int register_specifier;
3713   unsigned int implied_prefix;
3714   unsigned int m, w;
3715   rex_byte vrex_used = 0;
3716
3717   /* Check register specifier.  */
3718   if (i.vex.register_specifier)
3719     {
3720       gas_assert ((i.vrex & REX_X) == 0);
3721
3722       register_specifier = i.vex.register_specifier->reg_num;
3723       if ((i.vex.register_specifier->reg_flags & RegRex))
3724         register_specifier += 8;
3725       /* The upper 16 registers are encoded in the fourth byte of the
3726          EVEX prefix.  */
3727       if (!(i.vex.register_specifier->reg_flags & RegVRex))
3728         i.vex.bytes[3] = 0x8;
3729       register_specifier = ~register_specifier & 0xf;
3730     }
3731   else
3732     {
3733       register_specifier = 0xf;
3734
3735       /* Encode upper 16 vector index register in the fourth byte of
3736          the EVEX prefix.  */
3737       if (!(i.vrex & REX_X))
3738         i.vex.bytes[3] = 0x8;
3739       else
3740         vrex_used |= REX_X;
3741     }
3742
3743   switch ((i.tm.base_opcode >> 8) & 0xff)
3744     {
3745     case 0:
3746       implied_prefix = 0;
3747       break;
3748     case DATA_PREFIX_OPCODE:
3749       implied_prefix = 1;
3750       break;
3751     case REPE_PREFIX_OPCODE:
3752       implied_prefix = 2;
3753       break;
3754     case REPNE_PREFIX_OPCODE:
3755       implied_prefix = 3;
3756       break;
3757     default:
3758       abort ();
3759     }
3760
3761   /* 4 byte EVEX prefix.  */
3762   i.vex.length = 4;
3763   i.vex.bytes[0] = 0x62;
3764
3765   /* mmmm bits.  */
3766   switch (i.tm.opcode_modifier.vexopcode)
3767     {
3768     case VEX0F:
3769       m = 1;
3770       break;
3771     case VEX0F38:
3772       m = 2;
3773       break;
3774     case VEX0F3A:
3775       m = 3;
3776       break;
3777     default:
3778       abort ();
3779       break;
3780     }
3781
3782   /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3783      bits from REX.  */
3784   i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3785
3786   /* The fifth bit of the second EVEX byte is 1's compliment of the
3787      REX_R bit in VREX.  */
3788   if (!(i.vrex & REX_R))
3789     i.vex.bytes[1] |= 0x10;
3790   else
3791     vrex_used |= REX_R;
3792
3793   if ((i.reg_operands + i.imm_operands) == i.operands)
3794     {
3795       /* When all operands are registers, the REX_X bit in REX is not
3796          used.  We reuse it to encode the upper 16 registers, which is
3797          indicated by the REX_B bit in VREX.  The REX_X bit is encoded
3798          as 1's compliment.  */
3799       if ((i.vrex & REX_B))
3800         {
3801           vrex_used |= REX_B;
3802           i.vex.bytes[1] &= ~0x40;
3803         }
3804     }
3805
3806   /* EVEX instructions shouldn't need the REX prefix.  */
3807   i.vrex &= ~vrex_used;
3808   gas_assert (i.vrex == 0);
3809
3810   /* Check the REX.W bit and VEXW.  */
3811   if (i.tm.opcode_modifier.vexw == VEXWIG)
3812     w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3813   else if (i.tm.opcode_modifier.vexw)
3814     w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3815   else
3816     w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3817
3818   /* Encode the U bit.  */
3819   implied_prefix |= 0x4;
3820
3821   /* The third byte of the EVEX prefix.  */
3822   i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3823
3824   /* The fourth byte of the EVEX prefix.  */
3825   /* The zeroing-masking bit.  */
3826   if (i.mask && i.mask->zeroing)
3827     i.vex.bytes[3] |= 0x80;
3828
3829   /* Don't always set the broadcast bit if there is no RC.  */
3830   if (!i.rounding)
3831     {
3832       /* Encode the vector length.  */
3833       unsigned int vec_length;
3834
3835       if (!i.tm.opcode_modifier.evex
3836           || i.tm.opcode_modifier.evex == EVEXDYN)
3837         {
3838           unsigned int op;
3839
3840           /* Determine vector length from the last multi-length vector
3841              operand.  */
3842           vec_length = 0;
3843           for (op = i.operands; op--;)
3844             if (i.tm.operand_types[op].bitfield.xmmword
3845                 + i.tm.operand_types[op].bitfield.ymmword
3846                 + i.tm.operand_types[op].bitfield.zmmword > 1)
3847               {
3848                 if (i.types[op].bitfield.zmmword)
3849                   {
3850                     i.tm.opcode_modifier.evex = EVEX512;
3851                     break;
3852                   }
3853                 else if (i.types[op].bitfield.ymmword)
3854                   {
3855                     i.tm.opcode_modifier.evex = EVEX256;
3856                     break;
3857                   }
3858                 else if (i.types[op].bitfield.xmmword)
3859                   {
3860                     i.tm.opcode_modifier.evex = EVEX128;
3861                     break;
3862                   }
3863                 else if (i.broadcast && (int) op == i.broadcast->operand)
3864                   {
3865                     switch (i.broadcast->bytes)
3866                       {
3867                         case 64:
3868                           i.tm.opcode_modifier.evex = EVEX512;
3869                           break;
3870                         case 32:
3871                           i.tm.opcode_modifier.evex = EVEX256;
3872                           break;
3873                         case 16:
3874                           i.tm.opcode_modifier.evex = EVEX128;
3875                           break;
3876                         default:
3877                           abort ();
3878                       }
3879                     break;
3880                   }
3881               }
3882
3883           if (op >= MAX_OPERANDS)
3884             abort ();
3885         }
3886
3887       switch (i.tm.opcode_modifier.evex)
3888         {
3889         case EVEXLIG: /* LL' is ignored */
3890           vec_length = evexlig << 5;
3891           break;
3892         case EVEX128:
3893           vec_length = 0 << 5;
3894           break;
3895         case EVEX256:
3896           vec_length = 1 << 5;
3897           break;
3898         case EVEX512:
3899           vec_length = 2 << 5;
3900           break;
3901         default:
3902           abort ();
3903           break;
3904         }
3905       i.vex.bytes[3] |= vec_length;
3906       /* Encode the broadcast bit.  */
3907       if (i.broadcast)
3908         i.vex.bytes[3] |= 0x10;
3909     }
3910   else
3911     {
3912       if (i.rounding->type != saeonly)
3913         i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3914       else
3915         i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3916     }
3917
3918   if (i.mask && i.mask->mask)
3919     i.vex.bytes[3] |= i.mask->mask->reg_num;
3920 }
3921
3922 static void
3923 process_immext (void)
3924 {
3925   expressionS *exp;
3926
3927   /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3928      which is coded in the same place as an 8-bit immediate field
3929      would be.  Here we fake an 8-bit immediate operand from the
3930      opcode suffix stored in tm.extension_opcode.
3931
3932      AVX instructions also use this encoding, for some of
3933      3 argument instructions.  */
3934
3935   gas_assert (i.imm_operands <= 1
3936               && (i.operands <= 2
3937                   || (is_any_vex_encoding (&i.tm)
3938                       && i.operands <= 4)));
3939
3940   exp = &im_expressions[i.imm_operands++];
3941   i.op[i.operands].imms = exp;
3942   i.types[i.operands] = imm8;
3943   i.operands++;
3944   exp->X_op = O_constant;
3945   exp->X_add_number = i.tm.extension_opcode;
3946   i.tm.extension_opcode = None;
3947 }
3948
3949
3950 static int
3951 check_hle (void)
3952 {
3953   switch (i.tm.opcode_modifier.hleprefixok)
3954     {
3955     default:
3956       abort ();
3957     case HLEPrefixNone:
3958       as_bad (_("invalid instruction `%s' after `%s'"),
3959               i.tm.name, i.hle_prefix);
3960       return 0;
3961     case HLEPrefixLock:
3962       if (i.prefix[LOCK_PREFIX])
3963         return 1;
3964       as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
3965       return 0;
3966     case HLEPrefixAny:
3967       return 1;
3968     case HLEPrefixRelease:
3969       if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
3970         {
3971           as_bad (_("instruction `%s' after `xacquire' not allowed"),
3972                   i.tm.name);
3973           return 0;
3974         }
3975       if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
3976         {
3977           as_bad (_("memory destination needed for instruction `%s'"
3978                     " after `xrelease'"), i.tm.name);
3979           return 0;
3980         }
3981       return 1;
3982     }
3983 }
3984
3985 /* Try the shortest encoding by shortening operand size.  */
3986
3987 static void
3988 optimize_encoding (void)
3989 {
3990   unsigned int j;
3991
3992   if (optimize_for_space
3993       && !is_any_vex_encoding (&i.tm)
3994       && i.reg_operands == 1
3995       && i.imm_operands == 1
3996       && !i.types[1].bitfield.byte
3997       && i.op[0].imms->X_op == O_constant
3998       && fits_in_imm7 (i.op[0].imms->X_add_number)
3999       && (i.tm.base_opcode == 0xa8
4000           || (i.tm.base_opcode == 0xf6
4001               && i.tm.extension_opcode == 0x0)))
4002     {
4003       /* Optimize: -Os:
4004            test $imm7, %r64/%r32/%r16  -> test $imm7, %r8
4005        */
4006       unsigned int base_regnum = i.op[1].regs->reg_num;
4007       if (flag_code == CODE_64BIT || base_regnum < 4)
4008         {
4009           i.types[1].bitfield.byte = 1;
4010           /* Ignore the suffix.  */
4011           i.suffix = 0;
4012           /* Convert to byte registers.  */
4013           if (i.types[1].bitfield.word)
4014             j = 16;
4015           else if (i.types[1].bitfield.dword)
4016             j = 32;
4017           else
4018             j = 48;
4019           if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4020             j += 8;
4021           i.op[1].regs -= j;
4022         }
4023     }
4024   else if (flag_code == CODE_64BIT
4025            && !is_any_vex_encoding (&i.tm)
4026            && ((i.types[1].bitfield.qword
4027                 && i.reg_operands == 1
4028                 && i.imm_operands == 1
4029                 && i.op[0].imms->X_op == O_constant
4030                 && ((i.tm.base_opcode == 0xb8
4031                      && i.tm.extension_opcode == None
4032                      && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4033                     || (fits_in_imm31 (i.op[0].imms->X_add_number)
4034                         && ((i.tm.base_opcode == 0x24
4035                              || i.tm.base_opcode == 0xa8)
4036                             || (i.tm.base_opcode == 0x80
4037                                 && i.tm.extension_opcode == 0x4)
4038                             || ((i.tm.base_opcode == 0xf6
4039                                  || (i.tm.base_opcode | 1) == 0xc7)
4040                                 && i.tm.extension_opcode == 0x0)))
4041                     || (fits_in_imm7 (i.op[0].imms->X_add_number)
4042                         && i.tm.base_opcode == 0x83
4043                         && i.tm.extension_opcode == 0x4)))
4044                || (i.types[0].bitfield.qword
4045                    && ((i.reg_operands == 2
4046                         && i.op[0].regs == i.op[1].regs
4047                         && (i.tm.base_opcode == 0x30
4048                             || i.tm.base_opcode == 0x28))
4049                        || (i.reg_operands == 1
4050                            && i.operands == 1
4051                            && i.tm.base_opcode == 0x30)))))
4052     {
4053       /* Optimize: -O:
4054            andq $imm31, %r64   -> andl $imm31, %r32
4055            andq $imm7, %r64    -> andl $imm7, %r32
4056            testq $imm31, %r64  -> testl $imm31, %r32
4057            xorq %r64, %r64     -> xorl %r32, %r32
4058            subq %r64, %r64     -> subl %r32, %r32
4059            movq $imm31, %r64   -> movl $imm31, %r32
4060            movq $imm32, %r64   -> movl $imm32, %r32
4061         */
4062       i.tm.opcode_modifier.norex64 = 1;
4063       if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
4064         {
4065           /* Handle
4066                movq $imm31, %r64   -> movl $imm31, %r32
4067                movq $imm32, %r64   -> movl $imm32, %r32
4068            */
4069           i.tm.operand_types[0].bitfield.imm32 = 1;
4070           i.tm.operand_types[0].bitfield.imm32s = 0;
4071           i.tm.operand_types[0].bitfield.imm64 = 0;
4072           i.types[0].bitfield.imm32 = 1;
4073           i.types[0].bitfield.imm32s = 0;
4074           i.types[0].bitfield.imm64 = 0;
4075           i.types[1].bitfield.dword = 1;
4076           i.types[1].bitfield.qword = 0;
4077           if ((i.tm.base_opcode | 1) == 0xc7)
4078             {
4079               /* Handle
4080                    movq $imm31, %r64   -> movl $imm31, %r32
4081                */
4082               i.tm.base_opcode = 0xb8;
4083               i.tm.extension_opcode = None;
4084               i.tm.opcode_modifier.w = 0;
4085               i.tm.opcode_modifier.shortform = 1;
4086               i.tm.opcode_modifier.modrm = 0;
4087             }
4088         }
4089     }
4090   else if (optimize > 1
4091            && !optimize_for_space
4092            && !is_any_vex_encoding (&i.tm)
4093            && i.reg_operands == 2
4094            && i.op[0].regs == i.op[1].regs
4095            && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4096                || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4097            && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4098     {
4099       /* Optimize: -O2:
4100            andb %rN, %rN  -> testb %rN, %rN
4101            andw %rN, %rN  -> testw %rN, %rN
4102            andq %rN, %rN  -> testq %rN, %rN
4103            orb %rN, %rN   -> testb %rN, %rN
4104            orw %rN, %rN   -> testw %rN, %rN
4105            orq %rN, %rN   -> testq %rN, %rN
4106
4107            and outside of 64-bit mode
4108
4109            andl %rN, %rN  -> testl %rN, %rN
4110            orl %rN, %rN   -> testl %rN, %rN
4111        */
4112       i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4113     }
4114   else if (i.reg_operands == 3
4115            && i.op[0].regs == i.op[1].regs
4116            && !i.types[2].bitfield.xmmword
4117            && (i.tm.opcode_modifier.vex
4118                || ((!i.mask || i.mask->zeroing)
4119                    && !i.rounding
4120                    && is_evex_encoding (&i.tm)
4121                    && (i.vec_encoding != vex_encoding_evex
4122                        || cpu_arch_isa_flags.bitfield.cpuavx512vl
4123                        || i.tm.cpu_flags.bitfield.cpuavx512vl
4124                        || (i.tm.operand_types[2].bitfield.zmmword
4125                            && i.types[2].bitfield.ymmword))))
4126            && ((i.tm.base_opcode == 0x55
4127                 || i.tm.base_opcode == 0x6655
4128                 || i.tm.base_opcode == 0x66df
4129                 || i.tm.base_opcode == 0x57
4130                 || i.tm.base_opcode == 0x6657
4131                 || i.tm.base_opcode == 0x66ef
4132                 || i.tm.base_opcode == 0x66f8
4133                 || i.tm.base_opcode == 0x66f9
4134                 || i.tm.base_opcode == 0x66fa
4135                 || i.tm.base_opcode == 0x66fb
4136                 || i.tm.base_opcode == 0x42
4137                 || i.tm.base_opcode == 0x6642
4138                 || i.tm.base_opcode == 0x47
4139                 || i.tm.base_opcode == 0x6647)
4140                && i.tm.extension_opcode == None))
4141     {
4142       /* Optimize: -O1:
4143            VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4144            vpsubq and vpsubw:
4145              EVEX VOP %zmmM, %zmmM, %zmmN
4146                -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4147                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4148              EVEX VOP %ymmM, %ymmM, %ymmN
4149                -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4150                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4151              VEX VOP %ymmM, %ymmM, %ymmN
4152                -> VEX VOP %xmmM, %xmmM, %xmmN
4153            VOP, one of vpandn and vpxor:
4154              VEX VOP %ymmM, %ymmM, %ymmN
4155                -> VEX VOP %xmmM, %xmmM, %xmmN
4156            VOP, one of vpandnd and vpandnq:
4157              EVEX VOP %zmmM, %zmmM, %zmmN
4158                -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4159                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4160              EVEX VOP %ymmM, %ymmM, %ymmN
4161                -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4162                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4163            VOP, one of vpxord and vpxorq:
4164              EVEX VOP %zmmM, %zmmM, %zmmN
4165                -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4166                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4167              EVEX VOP %ymmM, %ymmM, %ymmN
4168                -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4169                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4170            VOP, one of kxord and kxorq:
4171              VEX VOP %kM, %kM, %kN
4172                -> VEX kxorw %kM, %kM, %kN
4173            VOP, one of kandnd and kandnq:
4174              VEX VOP %kM, %kM, %kN
4175                -> VEX kandnw %kM, %kM, %kN
4176        */
4177       if (is_evex_encoding (&i.tm))
4178         {
4179           if (i.vec_encoding != vex_encoding_evex)
4180             {
4181               i.tm.opcode_modifier.vex = VEX128;
4182               i.tm.opcode_modifier.vexw = VEXW0;
4183               i.tm.opcode_modifier.evex = 0;
4184             }
4185           else if (optimize > 1)
4186             i.tm.opcode_modifier.evex = EVEX128;
4187           else
4188             return;
4189         }
4190       else if (i.tm.operand_types[0].bitfield.class == RegMask)
4191         {
4192           i.tm.base_opcode &= 0xff;
4193           i.tm.opcode_modifier.vexw = VEXW0;
4194         }
4195       else
4196         i.tm.opcode_modifier.vex = VEX128;
4197
4198       if (i.tm.opcode_modifier.vex)
4199         for (j = 0; j < 3; j++)
4200           {
4201             i.types[j].bitfield.xmmword = 1;
4202             i.types[j].bitfield.ymmword = 0;
4203           }
4204     }
4205   else if (i.vec_encoding != vex_encoding_evex
4206            && !i.types[0].bitfield.zmmword
4207            && !i.types[1].bitfield.zmmword
4208            && !i.mask
4209            && !i.broadcast
4210            && is_evex_encoding (&i.tm)
4211            && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4212                || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
4213                || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f
4214                || (i.tm.base_opcode & ~4) == 0x66db
4215                || (i.tm.base_opcode & ~4) == 0x66eb)
4216            && i.tm.extension_opcode == None)
4217     {
4218       /* Optimize: -O1:
4219            VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4220            vmovdqu32 and vmovdqu64:
4221              EVEX VOP %xmmM, %xmmN
4222                -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4223              EVEX VOP %ymmM, %ymmN
4224                -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4225              EVEX VOP %xmmM, mem
4226                -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4227              EVEX VOP %ymmM, mem
4228                -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4229              EVEX VOP mem, %xmmN
4230                -> VEX mvmovdqa|vmovdquem, %xmmN (N < 16)
4231              EVEX VOP mem, %ymmN
4232                -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4233            VOP, one of vpand, vpandn, vpor, vpxor:
4234              EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4235                -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4236              EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4237                -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4238              EVEX VOP{d,q} mem, %xmmM, %xmmN
4239                -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4240              EVEX VOP{d,q} mem, %ymmM, %ymmN
4241                -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4242        */
4243       for (j = 0; j < i.operands; j++)
4244         if (operand_type_check (i.types[j], disp)
4245             && i.op[j].disps->X_op == O_constant)
4246           {
4247             /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4248                has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4249                bytes, we choose EVEX Disp8 over VEX Disp32.  */
4250             int evex_disp8, vex_disp8;
4251             unsigned int memshift = i.memshift;
4252             offsetT n = i.op[j].disps->X_add_number;
4253
4254             evex_disp8 = fits_in_disp8 (n);
4255             i.memshift = 0;
4256             vex_disp8 = fits_in_disp8 (n);
4257             if (evex_disp8 != vex_disp8)
4258               {
4259                 i.memshift = memshift;
4260                 return;
4261               }
4262
4263             i.types[j].bitfield.disp8 = vex_disp8;
4264             break;
4265           }
4266       if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4267         i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
4268       i.tm.opcode_modifier.vex
4269         = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4270       i.tm.opcode_modifier.vexw = VEXW0;
4271       /* VPAND, VPOR, and VPXOR are commutative.  */
4272       if (i.reg_operands == 3 && i.tm.base_opcode != 0x66df)
4273         i.tm.opcode_modifier.commutative = 1;
4274       i.tm.opcode_modifier.evex = 0;
4275       i.tm.opcode_modifier.masking = 0;
4276       i.tm.opcode_modifier.broadcast = 0;
4277       i.tm.opcode_modifier.disp8memshift = 0;
4278       i.memshift = 0;
4279       if (j < i.operands)
4280         i.types[j].bitfield.disp8
4281           = fits_in_disp8 (i.op[j].disps->X_add_number);
4282     }
4283 }
4284
4285 /* This is the guts of the machine-dependent assembler.  LINE points to a
4286    machine dependent instruction.  This function is supposed to emit
4287    the frags/bytes it assembles to.  */
4288
4289 void
4290 md_assemble (char *line)
4291 {
4292   unsigned int j;
4293   char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4294   const insn_template *t;
4295
4296   /* Initialize globals.  */
4297   memset (&i, '\0', sizeof (i));
4298   for (j = 0; j < MAX_OPERANDS; j++)
4299     i.reloc[j] = NO_RELOC;
4300   memset (disp_expressions, '\0', sizeof (disp_expressions));
4301   memset (im_expressions, '\0', sizeof (im_expressions));
4302   save_stack_p = save_stack;
4303
4304   /* First parse an instruction mnemonic & call i386_operand for the operands.
4305      We assume that the scrubber has arranged it so that line[0] is the valid
4306      start of a (possibly prefixed) mnemonic.  */
4307
4308   line = parse_insn (line, mnemonic);
4309   if (line == NULL)
4310     return;
4311   mnem_suffix = i.suffix;
4312
4313   line = parse_operands (line, mnemonic);
4314   this_operand = -1;
4315   xfree (i.memop1_string);
4316   i.memop1_string = NULL;
4317   if (line == NULL)
4318     return;
4319
4320   /* Now we've parsed the mnemonic into a set of templates, and have the
4321      operands at hand.  */
4322
4323   /* All intel opcodes have reversed operands except for "bound" and
4324      "enter".  We also don't reverse intersegment "jmp" and "call"
4325      instructions with 2 immediate operands so that the immediate segment
4326      precedes the offset, as it does when in AT&T mode. */
4327   if (intel_syntax
4328       && i.operands > 1
4329       && (strcmp (mnemonic, "bound") != 0)
4330       && (strcmp (mnemonic, "invlpga") != 0)
4331       && !(operand_type_check (i.types[0], imm)
4332            && operand_type_check (i.types[1], imm)))
4333     swap_operands ();
4334
4335   /* The order of the immediates should be reversed
4336      for 2 immediates extrq and insertq instructions */
4337   if (i.imm_operands == 2
4338       && (strcmp (mnemonic, "extrq") == 0
4339           || strcmp (mnemonic, "insertq") == 0))
4340       swap_2_operands (0, 1);
4341
4342   if (i.imm_operands)
4343     optimize_imm ();
4344
4345   /* Don't optimize displacement for movabs since it only takes 64bit
4346      displacement.  */
4347   if (i.disp_operands
4348       && i.disp_encoding != disp_encoding_32bit
4349       && (flag_code != CODE_64BIT
4350           || strcmp (mnemonic, "movabs") != 0))
4351     optimize_disp ();
4352
4353   /* Next, we find a template that matches the given insn,
4354      making sure the overlap of the given operands types is consistent
4355      with the template operand types.  */
4356
4357   if (!(t = match_template (mnem_suffix)))
4358     return;
4359
4360   if (sse_check != check_none
4361       && !i.tm.opcode_modifier.noavx
4362       && !i.tm.cpu_flags.bitfield.cpuavx
4363       && !i.tm.cpu_flags.bitfield.cpuavx512f
4364       && (i.tm.cpu_flags.bitfield.cpusse
4365           || i.tm.cpu_flags.bitfield.cpusse2
4366           || i.tm.cpu_flags.bitfield.cpusse3
4367           || i.tm.cpu_flags.bitfield.cpussse3
4368           || i.tm.cpu_flags.bitfield.cpusse4_1
4369           || i.tm.cpu_flags.bitfield.cpusse4_2
4370           || i.tm.cpu_flags.bitfield.cpusse4a
4371           || i.tm.cpu_flags.bitfield.cpupclmul
4372           || i.tm.cpu_flags.bitfield.cpuaes
4373           || i.tm.cpu_flags.bitfield.cpusha
4374           || i.tm.cpu_flags.bitfield.cpugfni))
4375     {
4376       (sse_check == check_warning
4377        ? as_warn
4378        : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4379     }
4380
4381   /* Zap movzx and movsx suffix.  The suffix has been set from
4382      "word ptr" or "byte ptr" on the source operand in Intel syntax
4383      or extracted from mnemonic in AT&T syntax.  But we'll use
4384      the destination register to choose the suffix for encoding.  */
4385   if ((i.tm.base_opcode & ~9) == 0x0fb6)
4386     {
4387       /* In Intel syntax, there must be a suffix.  In AT&T syntax, if
4388          there is no suffix, the default will be byte extension.  */
4389       if (i.reg_operands != 2
4390           && !i.suffix
4391           && intel_syntax)
4392         as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
4393
4394       i.suffix = 0;
4395     }
4396
4397   if (i.tm.opcode_modifier.fwait)
4398     if (!add_prefix (FWAIT_OPCODE))
4399       return;
4400
4401   /* Check if REP prefix is OK.  */
4402   if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
4403     {
4404       as_bad (_("invalid instruction `%s' after `%s'"),
4405                 i.tm.name, i.rep_prefix);
4406       return;
4407     }
4408
4409   /* Check for lock without a lockable instruction.  Destination operand
4410      must be memory unless it is xchg (0x86).  */
4411   if (i.prefix[LOCK_PREFIX]
4412       && (!i.tm.opcode_modifier.islockable
4413           || i.mem_operands == 0
4414           || (i.tm.base_opcode != 0x86
4415               && !(i.flags[i.operands - 1] & Operand_Mem))))
4416     {
4417       as_bad (_("expecting lockable instruction after `lock'"));
4418       return;
4419     }
4420
4421   /* Check for data size prefix on VEX/XOP/EVEX encoded insns.  */
4422   if (i.prefix[DATA_PREFIX] && is_any_vex_encoding (&i.tm))
4423     {
4424       as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4425       return;
4426     }
4427
4428   /* Check if HLE prefix is OK.  */
4429   if (i.hle_prefix && !check_hle ())
4430     return;
4431
4432   /* Check BND prefix.  */
4433   if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4434     as_bad (_("expecting valid branch instruction after `bnd'"));
4435
4436   /* Check NOTRACK prefix.  */
4437   if (i.notrack_prefix && !i.tm.opcode_modifier.notrackprefixok)
4438     as_bad (_("expecting indirect branch instruction after `notrack'"));
4439
4440   if (i.tm.cpu_flags.bitfield.cpumpx)
4441     {
4442       if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4443         as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4444       else if (flag_code != CODE_16BIT
4445                ? i.prefix[ADDR_PREFIX]
4446                : i.mem_operands && !i.prefix[ADDR_PREFIX])
4447         as_bad (_("16-bit address isn't allowed in MPX instructions"));
4448     }
4449
4450   /* Insert BND prefix.  */
4451   if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4452     {
4453       if (!i.prefix[BND_PREFIX])
4454         add_prefix (BND_PREFIX_OPCODE);
4455       else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4456         {
4457           as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4458           i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4459         }
4460     }
4461
4462   /* Check string instruction segment overrides.  */
4463   if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
4464     {
4465       gas_assert (i.mem_operands);
4466       if (!check_string ())
4467         return;
4468       i.disp_operands = 0;
4469     }
4470
4471   if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4472     optimize_encoding ();
4473
4474   if (!process_suffix ())
4475     return;
4476
4477   /* Update operand types.  */
4478   for (j = 0; j < i.operands; j++)
4479     i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4480
4481   /* Make still unresolved immediate matches conform to size of immediate
4482      given in i.suffix.  */
4483   if (!finalize_imm ())
4484     return;
4485
4486   if (i.types[0].bitfield.imm1)
4487     i.imm_operands = 0; /* kludge for shift insns.  */
4488
4489   /* We only need to check those implicit registers for instructions
4490      with 3 operands or less.  */
4491   if (i.operands <= 3)
4492     for (j = 0; j < i.operands; j++)
4493       if (i.types[j].bitfield.instance != InstanceNone
4494           && !i.types[j].bitfield.xmmword)
4495         i.reg_operands--;
4496
4497   /* ImmExt should be processed after SSE2AVX.  */
4498   if (!i.tm.opcode_modifier.sse2avx
4499       && i.tm.opcode_modifier.immext)
4500     process_immext ();
4501
4502   /* For insns with operands there are more diddles to do to the opcode.  */
4503   if (i.operands)
4504     {
4505       if (!process_operands ())
4506         return;
4507     }
4508   else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4509     {
4510       /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc.  */
4511       as_warn (_("translating to `%sp'"), i.tm.name);
4512     }
4513
4514   if (is_any_vex_encoding (&i.tm))
4515     {
4516       if (!cpu_arch_flags.bitfield.cpui286)
4517         {
4518           as_bad (_("instruction `%s' isn't supported outside of protected mode."),
4519                   i.tm.name);
4520           return;
4521         }
4522
4523       if (i.tm.opcode_modifier.vex)
4524         build_vex_prefix (t);
4525       else
4526         build_evex_prefix ();
4527     }
4528
4529   /* Handle conversion of 'int $3' --> special int3 insn.  XOP or FMA4
4530      instructions may define INT_OPCODE as well, so avoid this corner
4531      case for those instructions that use MODRM.  */
4532   if (i.tm.base_opcode == INT_OPCODE
4533       && !i.tm.opcode_modifier.modrm
4534       && i.op[0].imms->X_add_number == 3)
4535     {
4536       i.tm.base_opcode = INT3_OPCODE;
4537       i.imm_operands = 0;
4538     }
4539
4540   if ((i.tm.opcode_modifier.jump == JUMP
4541        || i.tm.opcode_modifier.jump == JUMP_BYTE
4542        || i.tm.opcode_modifier.jump == JUMP_DWORD)
4543       && i.op[0].disps->X_op == O_constant)
4544     {
4545       /* Convert "jmp constant" (and "call constant") to a jump (call) to
4546          the absolute address given by the constant.  Since ix86 jumps and
4547          calls are pc relative, we need to generate a reloc.  */
4548       i.op[0].disps->X_add_symbol = &abs_symbol;
4549       i.op[0].disps->X_op = O_symbol;
4550     }
4551
4552   if (i.tm.opcode_modifier.rex64)
4553     i.rex |= REX_W;
4554
4555   /* For 8 bit registers we need an empty rex prefix.  Also if the
4556      instruction already has a prefix, we need to convert old
4557      registers to new ones.  */
4558
4559   if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
4560        && (i.op[0].regs->reg_flags & RegRex64) != 0)
4561       || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
4562           && (i.op[1].regs->reg_flags & RegRex64) != 0)
4563       || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
4564            || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
4565           && i.rex != 0))
4566     {
4567       int x;
4568
4569       i.rex |= REX_OPCODE;
4570       for (x = 0; x < 2; x++)
4571         {
4572           /* Look for 8 bit operand that uses old registers.  */
4573           if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
4574               && (i.op[x].regs->reg_flags & RegRex64) == 0)
4575             {
4576               gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4577               /* In case it is "hi" register, give up.  */
4578               if (i.op[x].regs->reg_num > 3)
4579                 as_bad (_("can't encode register '%s%s' in an "
4580                           "instruction requiring REX prefix."),
4581                         register_prefix, i.op[x].regs->reg_name);
4582
4583               /* Otherwise it is equivalent to the extended register.
4584                  Since the encoding doesn't change this is merely
4585                  cosmetic cleanup for debug output.  */
4586
4587               i.op[x].regs = i.op[x].regs + 8;
4588             }
4589         }
4590     }
4591
4592   if (i.rex == 0 && i.rex_encoding)
4593     {
4594       /* Check if we can add a REX_OPCODE byte.  Look for 8 bit operand
4595          that uses legacy register.  If it is "hi" register, don't add
4596          the REX_OPCODE byte.  */
4597       int x;
4598       for (x = 0; x < 2; x++)
4599         if (i.types[x].bitfield.class == Reg
4600             && i.types[x].bitfield.byte
4601             && (i.op[x].regs->reg_flags & RegRex64) == 0
4602             && i.op[x].regs->reg_num > 3)
4603           {
4604             gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4605             i.rex_encoding = FALSE;
4606             break;
4607           }
4608
4609       if (i.rex_encoding)
4610         i.rex = REX_OPCODE;
4611     }
4612
4613   if (i.rex != 0)
4614     add_prefix (REX_OPCODE | i.rex);
4615
4616   /* We are ready to output the insn.  */
4617   output_insn ();
4618
4619   last_insn.seg = now_seg;
4620
4621   if (i.tm.opcode_modifier.isprefix)
4622     {
4623       last_insn.kind = last_insn_prefix;
4624       last_insn.name = i.tm.name;
4625       last_insn.file = as_where (&last_insn.line);
4626     }
4627   else
4628     last_insn.kind = last_insn_other;
4629 }
4630
4631 static char *
4632 parse_insn (char *line, char *mnemonic)
4633 {
4634   char *l = line;
4635   char *token_start = l;
4636   char *mnem_p;
4637   int supported;
4638   const insn_template *t;
4639   char *dot_p = NULL;
4640
4641   while (1)
4642     {
4643       mnem_p = mnemonic;
4644       while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
4645         {
4646           if (*mnem_p == '.')
4647             dot_p = mnem_p;
4648           mnem_p++;
4649           if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
4650             {
4651               as_bad (_("no such instruction: `%s'"), token_start);
4652               return NULL;
4653             }
4654           l++;
4655         }
4656       if (!is_space_char (*l)
4657           && *l != END_OF_INSN
4658           && (intel_syntax
4659               || (*l != PREFIX_SEPARATOR
4660                   && *l != ',')))
4661         {
4662           as_bad (_("invalid character %s in mnemonic"),
4663                   output_invalid (*l));
4664           return NULL;
4665         }
4666       if (token_start == l)
4667         {
4668           if (!intel_syntax && *l == PREFIX_SEPARATOR)
4669             as_bad (_("expecting prefix; got nothing"));
4670           else
4671             as_bad (_("expecting mnemonic; got nothing"));
4672           return NULL;
4673         }
4674
4675       /* Look up instruction (or prefix) via hash table.  */
4676       current_templates = (const templates *) hash_find (op_hash, mnemonic);
4677
4678       if (*l != END_OF_INSN
4679           && (!is_space_char (*l) || l[1] != END_OF_INSN)
4680           && current_templates
4681           && current_templates->start->opcode_modifier.isprefix)
4682         {
4683           if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
4684             {
4685               as_bad ((flag_code != CODE_64BIT
4686                        ? _("`%s' is only supported in 64-bit mode")
4687                        : _("`%s' is not supported in 64-bit mode")),
4688                       current_templates->start->name);
4689               return NULL;
4690             }
4691           /* If we are in 16-bit mode, do not allow addr16 or data16.
4692              Similarly, in 32-bit mode, do not allow addr32 or data32.  */
4693           if ((current_templates->start->opcode_modifier.size == SIZE16
4694                || current_templates->start->opcode_modifier.size == SIZE32)
4695               && flag_code != CODE_64BIT
4696               && ((current_templates->start->opcode_modifier.size == SIZE32)
4697                   ^ (flag_code == CODE_16BIT)))
4698             {
4699               as_bad (_("redundant %s prefix"),
4700                       current_templates->start->name);
4701               return NULL;
4702             }
4703           if (current_templates->start->opcode_length == 0)
4704             {
4705               /* Handle pseudo prefixes.  */
4706               switch (current_templates->start->base_opcode)
4707                 {
4708                 case 0x0:
4709                   /* {disp8} */
4710                   i.disp_encoding = disp_encoding_8bit;
4711                   break;
4712                 case 0x1:
4713                   /* {disp32} */
4714                   i.disp_encoding = disp_encoding_32bit;
4715                   break;
4716                 case 0x2:
4717                   /* {load} */
4718                   i.dir_encoding = dir_encoding_load;
4719                   break;
4720                 case 0x3:
4721                   /* {store} */
4722                   i.dir_encoding = dir_encoding_store;
4723                   break;
4724                 case 0x4:
4725                   /* {vex} */
4726                   i.vec_encoding = vex_encoding_vex;
4727                   break;
4728                 case 0x5:
4729                   /* {vex3} */
4730                   i.vec_encoding = vex_encoding_vex3;
4731                   break;
4732                 case 0x6:
4733                   /* {evex} */
4734                   i.vec_encoding = vex_encoding_evex;
4735                   break;
4736                 case 0x7:
4737                   /* {rex} */
4738                   i.rex_encoding = TRUE;
4739                   break;
4740                 case 0x8:
4741                   /* {nooptimize} */
4742                   i.no_optimize = TRUE;
4743                   break;
4744                 default:
4745                   abort ();
4746                 }
4747             }
4748           else
4749             {
4750               /* Add prefix, checking for repeated prefixes.  */
4751               switch (add_prefix (current_templates->start->base_opcode))
4752                 {
4753                 case PREFIX_EXIST:
4754                   return NULL;
4755                 case PREFIX_DS:
4756                   if (current_templates->start->cpu_flags.bitfield.cpuibt)
4757                     i.notrack_prefix = current_templates->start->name;
4758                   break;
4759                 case PREFIX_REP:
4760                   if (current_templates->start->cpu_flags.bitfield.cpuhle)
4761                     i.hle_prefix = current_templates->start->name;
4762                   else if (current_templates->start->cpu_flags.bitfield.cpumpx)
4763                     i.bnd_prefix = current_templates->start->name;
4764                   else
4765                     i.rep_prefix = current_templates->start->name;
4766                   break;
4767                 default:
4768                   break;
4769                 }
4770             }
4771           /* Skip past PREFIX_SEPARATOR and reset token_start.  */
4772           token_start = ++l;
4773         }
4774       else
4775         break;
4776     }
4777
4778   if (!current_templates)
4779     {
4780       /* Deprecated functionality (new code should use pseudo-prefixes instead):
4781          Check if we should swap operand or force 32bit displacement in
4782          encoding.  */
4783       if (mnem_p - 2 == dot_p && dot_p[1] == 's')
4784         i.dir_encoding = dir_encoding_swap;
4785       else if (mnem_p - 3 == dot_p
4786                && dot_p[1] == 'd'
4787                && dot_p[2] == '8')
4788         i.disp_encoding = disp_encoding_8bit;
4789       else if (mnem_p - 4 == dot_p
4790                && dot_p[1] == 'd'
4791                && dot_p[2] == '3'
4792                && dot_p[3] == '2')
4793         i.disp_encoding = disp_encoding_32bit;
4794       else
4795         goto check_suffix;
4796       mnem_p = dot_p;
4797       *dot_p = '\0';
4798       current_templates = (const templates *) hash_find (op_hash, mnemonic);
4799     }
4800
4801   if (!current_templates)
4802     {
4803 check_suffix:
4804       if (mnem_p > mnemonic)
4805         {
4806           /* See if we can get a match by trimming off a suffix.  */
4807           switch (mnem_p[-1])
4808             {
4809             case WORD_MNEM_SUFFIX:
4810               if (intel_syntax && (intel_float_operand (mnemonic) & 2))
4811                 i.suffix = SHORT_MNEM_SUFFIX;
4812               else
4813                 /* Fall through.  */
4814               case BYTE_MNEM_SUFFIX:
4815               case QWORD_MNEM_SUFFIX:
4816                 i.suffix = mnem_p[-1];
4817               mnem_p[-1] = '\0';
4818               current_templates = (const templates *) hash_find (op_hash,
4819                                                                  mnemonic);
4820               break;
4821             case SHORT_MNEM_SUFFIX:
4822             case LONG_MNEM_SUFFIX:
4823               if (!intel_syntax)
4824                 {
4825                   i.suffix = mnem_p[-1];
4826                   mnem_p[-1] = '\0';
4827                   current_templates = (const templates *) hash_find (op_hash,
4828                                                                      mnemonic);
4829                 }
4830               break;
4831
4832               /* Intel Syntax.  */
4833             case 'd':
4834               if (intel_syntax)
4835                 {
4836                   if (intel_float_operand (mnemonic) == 1)
4837                     i.suffix = SHORT_MNEM_SUFFIX;
4838                   else
4839                     i.suffix = LONG_MNEM_SUFFIX;
4840                   mnem_p[-1] = '\0';
4841                   current_templates = (const templates *) hash_find (op_hash,
4842                                                                      mnemonic);
4843                 }
4844               break;
4845             }
4846         }
4847
4848       if (!current_templates)
4849         {
4850           as_bad (_("no such instruction: `%s'"), token_start);
4851           return NULL;
4852         }
4853     }
4854
4855   if (current_templates->start->opcode_modifier.jump == JUMP
4856       || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
4857     {
4858       /* Check for a branch hint.  We allow ",pt" and ",pn" for
4859          predict taken and predict not taken respectively.
4860          I'm not sure that branch hints actually do anything on loop
4861          and jcxz insns (JumpByte) for current Pentium4 chips.  They
4862          may work in the future and it doesn't hurt to accept them
4863          now.  */
4864       if (l[0] == ',' && l[1] == 'p')
4865         {
4866           if (l[2] == 't')
4867             {
4868               if (!add_prefix (DS_PREFIX_OPCODE))
4869                 return NULL;
4870               l += 3;
4871             }
4872           else if (l[2] == 'n')
4873             {
4874               if (!add_prefix (CS_PREFIX_OPCODE))
4875                 return NULL;
4876               l += 3;
4877             }
4878         }
4879     }
4880   /* Any other comma loses.  */
4881   if (*l == ',')
4882     {
4883       as_bad (_("invalid character %s in mnemonic"),
4884               output_invalid (*l));
4885       return NULL;
4886     }
4887
4888   /* Check if instruction is supported on specified architecture.  */
4889   supported = 0;
4890   for (t = current_templates->start; t < current_templates->end; ++t)
4891     {
4892       supported |= cpu_flags_match (t);
4893       if (supported == CPU_FLAGS_PERFECT_MATCH)
4894         {
4895           if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
4896             as_warn (_("use .code16 to ensure correct addressing mode"));
4897
4898           return l;
4899         }
4900     }
4901
4902   if (!(supported & CPU_FLAGS_64BIT_MATCH))
4903     as_bad (flag_code == CODE_64BIT
4904             ? _("`%s' is not supported in 64-bit mode")
4905             : _("`%s' is only supported in 64-bit mode"),
4906             current_templates->start->name);
4907   else
4908     as_bad (_("`%s' is not supported on `%s%s'"),
4909             current_templates->start->name,
4910             cpu_arch_name ? cpu_arch_name : default_arch,
4911             cpu_sub_arch_name ? cpu_sub_arch_name : "");
4912
4913   return NULL;
4914 }
4915
4916 static char *
4917 parse_operands (char *l, const char *mnemonic)
4918 {
4919   char *token_start;
4920
4921   /* 1 if operand is pending after ','.  */
4922   unsigned int expecting_operand = 0;
4923
4924   /* Non-zero if operand parens not balanced.  */
4925   unsigned int paren_not_balanced;
4926
4927   while (*l != END_OF_INSN)
4928     {
4929       /* Skip optional white space before operand.  */
4930       if (is_space_char (*l))
4931         ++l;
4932       if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
4933         {
4934           as_bad (_("invalid character %s before operand %d"),
4935                   output_invalid (*l),
4936                   i.operands + 1);
4937           return NULL;
4938         }
4939       token_start = l;  /* After white space.  */
4940       paren_not_balanced = 0;
4941       while (paren_not_balanced || *l != ',')
4942         {
4943           if (*l == END_OF_INSN)
4944             {
4945               if (paren_not_balanced)
4946                 {
4947                   if (!intel_syntax)
4948                     as_bad (_("unbalanced parenthesis in operand %d."),
4949                             i.operands + 1);
4950                   else
4951                     as_bad (_("unbalanced brackets in operand %d."),
4952                             i.operands + 1);
4953                   return NULL;
4954                 }
4955               else
4956                 break;  /* we are done */
4957             }
4958           else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
4959             {
4960               as_bad (_("invalid character %s in operand %d"),
4961                       output_invalid (*l),
4962                       i.operands + 1);
4963               return NULL;
4964             }
4965           if (!intel_syntax)
4966             {
4967               if (*l == '(')
4968                 ++paren_not_balanced;
4969               if (*l == ')')
4970                 --paren_not_balanced;
4971             }
4972           else
4973             {
4974               if (*l == '[')
4975                 ++paren_not_balanced;
4976               if (*l == ']')
4977                 --paren_not_balanced;
4978             }
4979           l++;
4980         }
4981       if (l != token_start)
4982         {                       /* Yes, we've read in another operand.  */
4983           unsigned int operand_ok;
4984           this_operand = i.operands++;
4985           if (i.operands > MAX_OPERANDS)
4986             {
4987               as_bad (_("spurious operands; (%d operands/instruction max)"),
4988                       MAX_OPERANDS);
4989               return NULL;
4990             }
4991           i.types[this_operand].bitfield.unspecified = 1;
4992           /* Now parse operand adding info to 'i' as we go along.  */
4993           END_STRING_AND_SAVE (l);
4994
4995           if (i.mem_operands > 1)
4996             {
4997               as_bad (_("too many memory references for `%s'"),
4998                       mnemonic);
4999               return 0;
5000             }
5001
5002           if (intel_syntax)
5003             operand_ok =
5004               i386_intel_operand (token_start,
5005                                   intel_float_operand (mnemonic));
5006           else
5007             operand_ok = i386_att_operand (token_start);
5008
5009           RESTORE_END_STRING (l);
5010           if (!operand_ok)
5011             return NULL;
5012         }
5013       else
5014         {
5015           if (expecting_operand)
5016             {
5017             expecting_operand_after_comma:
5018               as_bad (_("expecting operand after ','; got nothing"));
5019               return NULL;
5020             }
5021           if (*l == ',')
5022             {
5023               as_bad (_("expecting operand before ','; got nothing"));
5024               return NULL;
5025             }
5026         }
5027
5028       /* Now *l must be either ',' or END_OF_INSN.  */
5029       if (*l == ',')
5030         {
5031           if (*++l == END_OF_INSN)
5032             {
5033               /* Just skip it, if it's \n complain.  */
5034               goto expecting_operand_after_comma;
5035             }
5036           expecting_operand = 1;
5037         }
5038     }
5039   return l;
5040 }
5041
5042 static void
5043 swap_2_operands (int xchg1, int xchg2)
5044 {
5045   union i386_op temp_op;
5046   i386_operand_type temp_type;
5047   unsigned int temp_flags;
5048   enum bfd_reloc_code_real temp_reloc;
5049
5050   temp_type = i.types[xchg2];
5051   i.types[xchg2] = i.types[xchg1];
5052   i.types[xchg1] = temp_type;
5053
5054   temp_flags = i.flags[xchg2];
5055   i.flags[xchg2] = i.flags[xchg1];
5056   i.flags[xchg1] = temp_flags;
5057
5058   temp_op = i.op[xchg2];
5059   i.op[xchg2] = i.op[xchg1];
5060   i.op[xchg1] = temp_op;
5061
5062   temp_reloc = i.reloc[xchg2];
5063   i.reloc[xchg2] = i.reloc[xchg1];
5064   i.reloc[xchg1] = temp_reloc;
5065
5066   if (i.mask)
5067     {
5068       if (i.mask->operand == xchg1)
5069         i.mask->operand = xchg2;
5070       else if (i.mask->operand == xchg2)
5071         i.mask->operand = xchg1;
5072     }
5073   if (i.broadcast)
5074     {
5075       if (i.broadcast->operand == xchg1)
5076         i.broadcast->operand = xchg2;
5077       else if (i.broadcast->operand == xchg2)
5078         i.broadcast->operand = xchg1;
5079     }
5080   if (i.rounding)
5081     {
5082       if (i.rounding->operand == xchg1)
5083         i.rounding->operand = xchg2;
5084       else if (i.rounding->operand == xchg2)
5085         i.rounding->operand = xchg1;
5086     }
5087 }
5088
5089 static void
5090 swap_operands (void)
5091 {
5092   switch (i.operands)
5093     {
5094     case 5:
5095     case 4:
5096       swap_2_operands (1, i.operands - 2);
5097       /* Fall through.  */
5098     case 3:
5099     case 2:
5100       swap_2_operands (0, i.operands - 1);
5101       break;
5102     default:
5103       abort ();
5104     }
5105
5106   if (i.mem_operands == 2)
5107     {
5108       const seg_entry *temp_seg;
5109       temp_seg = i.seg[0];
5110       i.seg[0] = i.seg[1];
5111       i.seg[1] = temp_seg;
5112     }
5113 }
5114
5115 /* Try to ensure constant immediates are represented in the smallest
5116    opcode possible.  */
5117 static void
5118 optimize_imm (void)
5119 {
5120   char guess_suffix = 0;
5121   int op;
5122
5123   if (i.suffix)
5124     guess_suffix = i.suffix;
5125   else if (i.reg_operands)
5126     {
5127       /* Figure out a suffix from the last register operand specified.
5128          We can't do this properly yet, i.e. excluding special register
5129          instances, but the following works for instructions with
5130          immediates.  In any case, we can't set i.suffix yet.  */
5131       for (op = i.operands; --op >= 0;)
5132         if (i.types[op].bitfield.class != Reg)
5133           continue;
5134         else if (i.types[op].bitfield.byte)
5135           {
5136             guess_suffix = BYTE_MNEM_SUFFIX;
5137             break;
5138           }
5139         else if (i.types[op].bitfield.word)
5140           {
5141             guess_suffix = WORD_MNEM_SUFFIX;
5142             break;
5143           }
5144         else if (i.types[op].bitfield.dword)
5145           {
5146             guess_suffix = LONG_MNEM_SUFFIX;
5147             break;
5148           }
5149         else if (i.types[op].bitfield.qword)
5150           {
5151             guess_suffix = QWORD_MNEM_SUFFIX;
5152             break;
5153           }
5154     }
5155   else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5156     guess_suffix = WORD_MNEM_SUFFIX;
5157
5158   for (op = i.operands; --op >= 0;)
5159     if (operand_type_check (i.types[op], imm))
5160       {
5161         switch (i.op[op].imms->X_op)
5162           {
5163           case O_constant:
5164             /* If a suffix is given, this operand may be shortened.  */
5165             switch (guess_suffix)
5166               {
5167               case LONG_MNEM_SUFFIX:
5168                 i.types[op].bitfield.imm32 = 1;
5169                 i.types[op].bitfield.imm64 = 1;
5170                 break;
5171               case WORD_MNEM_SUFFIX:
5172                 i.types[op].bitfield.imm16 = 1;
5173                 i.types[op].bitfield.imm32 = 1;
5174                 i.types[op].bitfield.imm32s = 1;
5175                 i.types[op].bitfield.imm64 = 1;
5176                 break;
5177               case BYTE_MNEM_SUFFIX:
5178                 i.types[op].bitfield.imm8 = 1;
5179                 i.types[op].bitfield.imm8s = 1;
5180                 i.types[op].bitfield.imm16 = 1;
5181                 i.types[op].bitfield.imm32 = 1;
5182                 i.types[op].bitfield.imm32s = 1;
5183                 i.types[op].bitfield.imm64 = 1;
5184                 break;
5185               }
5186
5187             /* If this operand is at most 16 bits, convert it
5188                to a signed 16 bit number before trying to see
5189                whether it will fit in an even smaller size.
5190                This allows a 16-bit operand such as $0xffe0 to
5191                be recognised as within Imm8S range.  */
5192             if ((i.types[op].bitfield.imm16)
5193                 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
5194               {
5195                 i.op[op].imms->X_add_number =
5196                   (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5197               }
5198 #ifdef BFD64
5199             /* Store 32-bit immediate in 64-bit for 64-bit BFD.  */
5200             if ((i.types[op].bitfield.imm32)
5201                 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5202                     == 0))
5203               {
5204                 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5205                                                 ^ ((offsetT) 1 << 31))
5206                                                - ((offsetT) 1 << 31));
5207               }
5208 #endif
5209             i.types[op]
5210               = operand_type_or (i.types[op],
5211                                  smallest_imm_type (i.op[op].imms->X_add_number));
5212
5213             /* We must avoid matching of Imm32 templates when 64bit
5214                only immediate is available.  */
5215             if (guess_suffix == QWORD_MNEM_SUFFIX)
5216               i.types[op].bitfield.imm32 = 0;
5217             break;
5218
5219           case O_absent:
5220           case O_register:
5221             abort ();
5222
5223             /* Symbols and expressions.  */
5224           default:
5225             /* Convert symbolic operand to proper sizes for matching, but don't
5226                prevent matching a set of insns that only supports sizes other
5227                than those matching the insn suffix.  */
5228             {
5229               i386_operand_type mask, allowed;
5230               const insn_template *t;
5231
5232               operand_type_set (&mask, 0);
5233               operand_type_set (&allowed, 0);
5234
5235               for (t = current_templates->start;
5236                    t < current_templates->end;
5237                    ++t)
5238                 {
5239                   allowed = operand_type_or (allowed, t->operand_types[op]);
5240                   allowed = operand_type_and (allowed, anyimm);
5241                 }
5242               switch (guess_suffix)
5243                 {
5244                 case QWORD_MNEM_SUFFIX:
5245                   mask.bitfield.imm64 = 1;
5246                   mask.bitfield.imm32s = 1;
5247                   break;
5248                 case LONG_MNEM_SUFFIX:
5249                   mask.bitfield.imm32 = 1;
5250                   break;
5251                 case WORD_MNEM_SUFFIX:
5252                   mask.bitfield.imm16 = 1;
5253                   break;
5254                 case BYTE_MNEM_SUFFIX:
5255                   mask.bitfield.imm8 = 1;
5256                   break;
5257                 default:
5258                   break;
5259                 }
5260               allowed = operand_type_and (mask, allowed);
5261               if (!operand_type_all_zero (&allowed))
5262                 i.types[op] = operand_type_and (i.types[op], mask);
5263             }
5264             break;
5265           }
5266       }
5267 }
5268
5269 /* Try to use the smallest displacement type too.  */
5270 static void
5271 optimize_disp (void)
5272 {
5273   int op;
5274
5275   for (op = i.operands; --op >= 0;)
5276     if (operand_type_check (i.types[op], disp))
5277       {
5278         if (i.op[op].disps->X_op == O_constant)
5279           {
5280             offsetT op_disp = i.op[op].disps->X_add_number;
5281
5282             if (i.types[op].bitfield.disp16
5283                 && (op_disp & ~(offsetT) 0xffff) == 0)
5284               {
5285                 /* If this operand is at most 16 bits, convert
5286                    to a signed 16 bit number and don't use 64bit
5287                    displacement.  */
5288                 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5289                 i.types[op].bitfield.disp64 = 0;
5290               }
5291 #ifdef BFD64
5292             /* Optimize 64-bit displacement to 32-bit for 64-bit BFD.  */
5293             if (i.types[op].bitfield.disp32
5294                 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5295               {
5296                 /* If this operand is at most 32 bits, convert
5297                    to a signed 32 bit number and don't use 64bit
5298                    displacement.  */
5299                 op_disp &= (((offsetT) 2 << 31) - 1);
5300                 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5301                 i.types[op].bitfield.disp64 = 0;
5302               }
5303 #endif
5304             if (!op_disp && i.types[op].bitfield.baseindex)
5305               {
5306                 i.types[op].bitfield.disp8 = 0;
5307                 i.types[op].bitfield.disp16 = 0;
5308                 i.types[op].bitfield.disp32 = 0;
5309                 i.types[op].bitfield.disp32s = 0;
5310                 i.types[op].bitfield.disp64 = 0;
5311                 i.op[op].disps = 0;
5312                 i.disp_operands--;
5313               }
5314             else if (flag_code == CODE_64BIT)
5315               {
5316                 if (fits_in_signed_long (op_disp))
5317                   {
5318                     i.types[op].bitfield.disp64 = 0;
5319                     i.types[op].bitfield.disp32s = 1;
5320                   }
5321                 if (i.prefix[ADDR_PREFIX]
5322                     && fits_in_unsigned_long (op_disp))
5323                   i.types[op].bitfield.disp32 = 1;
5324               }
5325             if ((i.types[op].bitfield.disp32
5326                  || i.types[op].bitfield.disp32s
5327                  || i.types[op].bitfield.disp16)
5328                 && fits_in_disp8 (op_disp))
5329               i.types[op].bitfield.disp8 = 1;
5330           }
5331         else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5332                  || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5333           {
5334             fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5335                          i.op[op].disps, 0, i.reloc[op]);
5336             i.types[op].bitfield.disp8 = 0;
5337             i.types[op].bitfield.disp16 = 0;
5338             i.types[op].bitfield.disp32 = 0;
5339             i.types[op].bitfield.disp32s = 0;
5340             i.types[op].bitfield.disp64 = 0;
5341           }
5342         else
5343           /* We only support 64bit displacement on constants.  */
5344           i.types[op].bitfield.disp64 = 0;
5345       }
5346 }
5347
5348 /* Return 1 if there is a match in broadcast bytes between operand
5349    GIVEN and instruction template T.   */
5350
5351 static INLINE int
5352 match_broadcast_size (const insn_template *t, unsigned int given)
5353 {
5354   return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5355            && i.types[given].bitfield.byte)
5356           || (t->opcode_modifier.broadcast == WORD_BROADCAST
5357               && i.types[given].bitfield.word)
5358           || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5359               && i.types[given].bitfield.dword)
5360           || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5361               && i.types[given].bitfield.qword));
5362 }
5363
5364 /* Check if operands are valid for the instruction.  */
5365
5366 static int
5367 check_VecOperands (const insn_template *t)
5368 {
5369   unsigned int op;
5370   i386_cpu_flags cpu;
5371   static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
5372
5373   /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5374      any one operand are implicity requiring AVX512VL support if the actual
5375      operand size is YMMword or XMMword.  Since this function runs after
5376      template matching, there's no need to check for YMMword/XMMword in
5377      the template.  */
5378   cpu = cpu_flags_and (t->cpu_flags, avx512);
5379   if (!cpu_flags_all_zero (&cpu)
5380       && !t->cpu_flags.bitfield.cpuavx512vl
5381       && !cpu_arch_flags.bitfield.cpuavx512vl)
5382     {
5383       for (op = 0; op < t->operands; ++op)
5384         {
5385           if (t->operand_types[op].bitfield.zmmword
5386               && (i.types[op].bitfield.ymmword
5387                   || i.types[op].bitfield.xmmword))
5388             {
5389               i.error = unsupported;
5390               return 1;
5391             }
5392         }
5393     }
5394
5395   /* Without VSIB byte, we can't have a vector register for index.  */
5396   if (!t->opcode_modifier.vecsib
5397       && i.index_reg
5398       && (i.index_reg->reg_type.bitfield.xmmword
5399           || i.index_reg->reg_type.bitfield.ymmword
5400           || i.index_reg->reg_type.bitfield.zmmword))
5401     {
5402       i.error = unsupported_vector_index_register;
5403       return 1;
5404     }
5405
5406   /* Check if default mask is allowed.  */
5407   if (t->opcode_modifier.nodefmask
5408       && (!i.mask || i.mask->mask->reg_num == 0))
5409     {
5410       i.error = no_default_mask;
5411       return 1;
5412     }
5413
5414   /* For VSIB byte, we need a vector register for index, and all vector
5415      registers must be distinct.  */
5416   if (t->opcode_modifier.vecsib)
5417     {
5418       if (!i.index_reg
5419           || !((t->opcode_modifier.vecsib == VecSIB128
5420                 && i.index_reg->reg_type.bitfield.xmmword)
5421                || (t->opcode_modifier.vecsib == VecSIB256
5422                    && i.index_reg->reg_type.bitfield.ymmword)
5423                || (t->opcode_modifier.vecsib == VecSIB512
5424                    && i.index_reg->reg_type.bitfield.zmmword)))
5425       {
5426         i.error = invalid_vsib_address;
5427         return 1;
5428       }
5429
5430       gas_assert (i.reg_operands == 2 || i.mask);
5431       if (i.reg_operands == 2 && !i.mask)
5432         {
5433           gas_assert (i.types[0].bitfield.class == RegSIMD);
5434           gas_assert (i.types[0].bitfield.xmmword
5435                       || i.types[0].bitfield.ymmword);
5436           gas_assert (i.types[2].bitfield.class == RegSIMD);
5437           gas_assert (i.types[2].bitfield.xmmword
5438                       || i.types[2].bitfield.ymmword);
5439           if (operand_check == check_none)
5440             return 0;
5441           if (register_number (i.op[0].regs)
5442               != register_number (i.index_reg)
5443               && register_number (i.op[2].regs)
5444                  != register_number (i.index_reg)
5445               && register_number (i.op[0].regs)
5446                  != register_number (i.op[2].regs))
5447             return 0;
5448           if (operand_check == check_error)
5449             {
5450               i.error = invalid_vector_register_set;
5451               return 1;
5452             }
5453           as_warn (_("mask, index, and destination registers should be distinct"));
5454         }
5455       else if (i.reg_operands == 1 && i.mask)
5456         {
5457           if (i.types[1].bitfield.class == RegSIMD
5458               && (i.types[1].bitfield.xmmword
5459                   || i.types[1].bitfield.ymmword
5460                   || i.types[1].bitfield.zmmword)
5461               && (register_number (i.op[1].regs)
5462                   == register_number (i.index_reg)))
5463             {
5464               if (operand_check == check_error)
5465                 {
5466                   i.error = invalid_vector_register_set;
5467                   return 1;
5468                 }
5469               if (operand_check != check_none)
5470                 as_warn (_("index and destination registers should be distinct"));
5471             }
5472         }
5473     }
5474
5475   /* Check if broadcast is supported by the instruction and is applied
5476      to the memory operand.  */
5477   if (i.broadcast)
5478     {
5479       i386_operand_type type, overlap;
5480
5481       /* Check if specified broadcast is supported in this instruction,
5482          and its broadcast bytes match the memory operand.  */
5483       op = i.broadcast->operand;
5484       if (!t->opcode_modifier.broadcast
5485           || !(i.flags[op] & Operand_Mem)
5486           || (!i.types[op].bitfield.unspecified
5487               && !match_broadcast_size (t, op)))
5488         {
5489         bad_broadcast:
5490           i.error = unsupported_broadcast;
5491           return 1;
5492         }
5493
5494       i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5495                             * i.broadcast->type);
5496       operand_type_set (&type, 0);
5497       switch (i.broadcast->bytes)
5498         {
5499         case 2:
5500           type.bitfield.word = 1;
5501           break;
5502         case 4:
5503           type.bitfield.dword = 1;
5504           break;
5505         case 8:
5506           type.bitfield.qword = 1;
5507           break;
5508         case 16:
5509           type.bitfield.xmmword = 1;
5510           break;
5511         case 32:
5512           type.bitfield.ymmword = 1;
5513           break;
5514         case 64:
5515           type.bitfield.zmmword = 1;
5516           break;
5517         default:
5518           goto bad_broadcast;
5519         }
5520
5521       overlap = operand_type_and (type, t->operand_types[op]);
5522       if (operand_type_all_zero (&overlap))
5523           goto bad_broadcast;
5524
5525       if (t->opcode_modifier.checkregsize)
5526         {
5527           unsigned int j;
5528
5529           type.bitfield.baseindex = 1;
5530           for (j = 0; j < i.operands; ++j)
5531             {
5532               if (j != op
5533                   && !operand_type_register_match(i.types[j],
5534                                                   t->operand_types[j],
5535                                                   type,
5536                                                   t->operand_types[op]))
5537                 goto bad_broadcast;
5538             }
5539         }
5540     }
5541   /* If broadcast is supported in this instruction, we need to check if
5542      operand of one-element size isn't specified without broadcast.  */
5543   else if (t->opcode_modifier.broadcast && i.mem_operands)
5544     {
5545       /* Find memory operand.  */
5546       for (op = 0; op < i.operands; op++)
5547         if (i.flags[op] & Operand_Mem)
5548           break;
5549       gas_assert (op < i.operands);
5550       /* Check size of the memory operand.  */
5551       if (match_broadcast_size (t, op))
5552         {
5553           i.error = broadcast_needed;
5554           return 1;
5555         }
5556     }
5557   else
5558     op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning.  */
5559
5560   /* Check if requested masking is supported.  */
5561   if (i.mask)
5562     {
5563       switch (t->opcode_modifier.masking)
5564         {
5565         case BOTH_MASKING:
5566           break;
5567         case MERGING_MASKING:
5568           if (i.mask->zeroing)
5569             {
5570         case 0:
5571               i.error = unsupported_masking;
5572               return 1;
5573             }
5574           break;
5575         case DYNAMIC_MASKING:
5576           /* Memory destinations allow only merging masking.  */
5577           if (i.mask->zeroing && i.mem_operands)
5578             {
5579               /* Find memory operand.  */
5580               for (op = 0; op < i.operands; op++)
5581                 if (i.flags[op] & Operand_Mem)
5582                   break;
5583               gas_assert (op < i.operands);
5584               if (op == i.operands - 1)
5585                 {
5586                   i.error = unsupported_masking;
5587                   return 1;
5588                 }
5589             }
5590           break;
5591         default:
5592           abort ();
5593         }
5594     }
5595
5596   /* Check if masking is applied to dest operand.  */
5597   if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
5598     {
5599       i.error = mask_not_on_destination;
5600       return 1;
5601     }
5602
5603   /* Check RC/SAE.  */
5604   if (i.rounding)
5605     {
5606       if (!t->opcode_modifier.sae
5607           || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
5608         {
5609           i.error = unsupported_rc_sae;
5610           return 1;
5611         }
5612       /* If the instruction has several immediate operands and one of
5613          them is rounding, the rounding operand should be the last
5614          immediate operand.  */
5615       if (i.imm_operands > 1
5616           && i.rounding->operand != (int) (i.imm_operands - 1))
5617         {
5618           i.error = rc_sae_operand_not_last_imm;
5619           return 1;
5620         }
5621     }
5622
5623   /* Check vector Disp8 operand.  */
5624   if (t->opcode_modifier.disp8memshift
5625       && i.disp_encoding != disp_encoding_32bit)
5626     {
5627       if (i.broadcast)
5628         i.memshift = t->opcode_modifier.broadcast - 1;
5629       else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
5630         i.memshift = t->opcode_modifier.disp8memshift;
5631       else
5632         {
5633           const i386_operand_type *type = NULL;
5634
5635           i.memshift = 0;
5636           for (op = 0; op < i.operands; op++)
5637             if (i.flags[op] & Operand_Mem)
5638               {
5639                 if (t->opcode_modifier.evex == EVEXLIG)
5640                   i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
5641                 else if (t->operand_types[op].bitfield.xmmword
5642                          + t->operand_types[op].bitfield.ymmword
5643                          + t->operand_types[op].bitfield.zmmword <= 1)
5644                   type = &t->operand_types[op];
5645                 else if (!i.types[op].bitfield.unspecified)
5646                   type = &i.types[op];
5647               }
5648             else if (i.types[op].bitfield.class == RegSIMD
5649                      && t->opcode_modifier.evex != EVEXLIG)
5650               {
5651                 if (i.types[op].bitfield.zmmword)
5652                   i.memshift = 6;
5653                 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
5654                   i.memshift = 5;
5655                 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
5656                   i.memshift = 4;
5657               }
5658
5659           if (type)
5660             {
5661               if (type->bitfield.zmmword)
5662                 i.memshift = 6;
5663               else if (type->bitfield.ymmword)
5664                 i.memshift = 5;
5665               else if (type->bitfield.xmmword)
5666                 i.memshift = 4;
5667             }
5668
5669           /* For the check in fits_in_disp8().  */
5670           if (i.memshift == 0)
5671             i.memshift = -1;
5672         }
5673
5674       for (op = 0; op < i.operands; op++)
5675         if (operand_type_check (i.types[op], disp)
5676             && i.op[op].disps->X_op == O_constant)
5677           {
5678             if (fits_in_disp8 (i.op[op].disps->X_add_number))
5679               {
5680                 i.types[op].bitfield.disp8 = 1;
5681                 return 0;
5682               }
5683             i.types[op].bitfield.disp8 = 0;
5684           }
5685     }
5686
5687   i.memshift = 0;
5688
5689   return 0;
5690 }
5691
5692 /* Check if operands are valid for the instruction.  Update VEX
5693    operand types.  */
5694
5695 static int
5696 VEX_check_operands (const insn_template *t)
5697 {
5698   if (i.vec_encoding == vex_encoding_evex)
5699     {
5700       /* This instruction must be encoded with EVEX prefix.  */
5701       if (!is_evex_encoding (t))
5702         {
5703           i.error = unsupported;
5704           return 1;
5705         }
5706       return 0;
5707     }
5708
5709   if (!t->opcode_modifier.vex)
5710     {
5711       /* This instruction template doesn't have VEX prefix.  */
5712       if (i.vec_encoding != vex_encoding_default)
5713         {
5714           i.error = unsupported;
5715           return 1;
5716         }
5717       return 0;
5718     }
5719
5720   /* Check the special Imm4 cases; must be the first operand.  */
5721   if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
5722     {
5723       if (i.op[0].imms->X_op != O_constant
5724           || !fits_in_imm4 (i.op[0].imms->X_add_number))
5725         {
5726           i.error = bad_imm4;
5727           return 1;
5728         }
5729
5730       /* Turn off Imm<N> so that update_imm won't complain.  */
5731       operand_type_set (&i.types[0], 0);
5732     }
5733
5734   return 0;
5735 }
5736
5737 static const insn_template *
5738 match_template (char mnem_suffix)
5739 {
5740   /* Points to template once we've found it.  */
5741   const insn_template *t;
5742   i386_operand_type overlap0, overlap1, overlap2, overlap3;
5743   i386_operand_type overlap4;
5744   unsigned int found_reverse_match;
5745   i386_opcode_modifier suffix_check;
5746   i386_operand_type operand_types [MAX_OPERANDS];
5747   int addr_prefix_disp;
5748   unsigned int j, size_match, check_register;
5749   enum i386_error specific_error = 0;
5750
5751 #if MAX_OPERANDS != 5
5752 # error "MAX_OPERANDS must be 5."
5753 #endif
5754
5755   found_reverse_match = 0;
5756   addr_prefix_disp = -1;
5757
5758   /* Prepare for mnemonic suffix check.  */
5759   memset (&suffix_check, 0, sizeof (suffix_check));
5760   switch (mnem_suffix)
5761     {
5762     case BYTE_MNEM_SUFFIX:
5763       suffix_check.no_bsuf = 1;
5764       break;
5765     case WORD_MNEM_SUFFIX:
5766       suffix_check.no_wsuf = 1;
5767       break;
5768     case SHORT_MNEM_SUFFIX:
5769       suffix_check.no_ssuf = 1;
5770       break;
5771     case LONG_MNEM_SUFFIX:
5772       suffix_check.no_lsuf = 1;
5773       break;
5774     case QWORD_MNEM_SUFFIX:
5775       suffix_check.no_qsuf = 1;
5776       break;
5777     default:
5778       /* NB: In Intel syntax, normally we can check for memory operand
5779          size when there is no mnemonic suffix.  But jmp and call have
5780          2 different encodings with Dword memory operand size, one with
5781          No_ldSuf and the other without.  i.suffix is set to
5782          LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf.  */
5783       if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
5784         suffix_check.no_ldsuf = 1;
5785     }
5786
5787   /* Must have right number of operands.  */
5788   i.error = number_of_operands_mismatch;
5789
5790   for (t = current_templates->start; t < current_templates->end; t++)
5791     {
5792       addr_prefix_disp = -1;
5793       found_reverse_match = 0;
5794
5795       if (i.operands != t->operands)
5796         continue;
5797
5798       /* Check processor support.  */
5799       i.error = unsupported;
5800       if (cpu_flags_match (t) != CPU_FLAGS_PERFECT_MATCH)
5801         continue;
5802
5803       /* Check AT&T mnemonic.   */
5804       i.error = unsupported_with_intel_mnemonic;
5805       if (intel_mnemonic && t->opcode_modifier.attmnemonic)
5806         continue;
5807
5808       /* Check AT&T/Intel syntax and Intel64/AMD64 ISA.   */
5809       i.error = unsupported_syntax;
5810       if ((intel_syntax && t->opcode_modifier.attsyntax)
5811           || (!intel_syntax && t->opcode_modifier.intelsyntax)
5812           || (intel64 && t->opcode_modifier.amd64)
5813           || (!intel64 && t->opcode_modifier.intel64))
5814         continue;
5815
5816       /* Check the suffix.  */
5817       i.error = invalid_instruction_suffix;
5818       if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
5819           || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
5820           || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
5821           || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
5822           || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
5823           || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
5824         continue;
5825
5826       size_match = operand_size_match (t);
5827       if (!size_match)
5828         continue;
5829
5830       /* This is intentionally not
5831
5832          if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
5833
5834          as the case of a missing * on the operand is accepted (perhaps with
5835          a warning, issued further down).  */
5836       if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
5837         {
5838           i.error = operand_type_mismatch;
5839           continue;
5840         }
5841
5842       for (j = 0; j < MAX_OPERANDS; j++)
5843         operand_types[j] = t->operand_types[j];
5844
5845       /* In general, don't allow 64-bit operands in 32-bit mode.  */
5846       if (i.suffix == QWORD_MNEM_SUFFIX
5847           && flag_code != CODE_64BIT
5848           && (intel_syntax
5849               ? (!t->opcode_modifier.ignoresize
5850                  && !t->opcode_modifier.broadcast
5851                  && !intel_float_operand (t->name))
5852               : intel_float_operand (t->name) != 2)
5853           && ((operand_types[0].bitfield.class != RegMMX
5854                && operand_types[0].bitfield.class != RegSIMD)
5855               || (operand_types[t->operands > 1].bitfield.class != RegMMX
5856                   && operand_types[t->operands > 1].bitfield.class != RegSIMD))
5857           && (t->base_opcode != 0x0fc7
5858               || t->extension_opcode != 1 /* cmpxchg8b */))
5859         continue;
5860
5861       /* In general, don't allow 32-bit operands on pre-386.  */
5862       else if (i.suffix == LONG_MNEM_SUFFIX
5863                && !cpu_arch_flags.bitfield.cpui386
5864                && (intel_syntax
5865                    ? (!t->opcode_modifier.ignoresize
5866                       && !intel_float_operand (t->name))
5867                    : intel_float_operand (t->name) != 2)
5868                && ((operand_types[0].bitfield.class != RegMMX
5869                     && operand_types[0].bitfield.class != RegSIMD)
5870                    || (operand_types[t->operands > 1].bitfield.class != RegMMX
5871                        && operand_types[t->operands > 1].bitfield.class
5872                           != RegSIMD)))
5873         continue;
5874
5875       /* Do not verify operands when there are none.  */
5876       else
5877         {
5878           if (!t->operands)
5879             /* We've found a match; break out of loop.  */
5880             break;
5881         }
5882
5883       if (!t->opcode_modifier.jump
5884           || t->opcode_modifier.jump == JUMP_ABSOLUTE)
5885         {
5886           /* There should be only one Disp operand.  */
5887           for (j = 0; j < MAX_OPERANDS; j++)
5888             if (operand_type_check (operand_types[j], disp))
5889               break;
5890           if (j < MAX_OPERANDS)
5891             {
5892               bfd_boolean override = (i.prefix[ADDR_PREFIX] != 0);
5893
5894               addr_prefix_disp = j;
5895
5896               /* Address size prefix will turn Disp64/Disp32S/Disp32/Disp16
5897                  operand into Disp32/Disp32/Disp16/Disp32 operand.  */
5898               switch (flag_code)
5899                 {
5900                 case CODE_16BIT:
5901                   override = !override;
5902                   /* Fall through.  */
5903                 case CODE_32BIT:
5904                   if (operand_types[j].bitfield.disp32
5905                       && operand_types[j].bitfield.disp16)
5906                     {
5907                       operand_types[j].bitfield.disp16 = override;
5908                       operand_types[j].bitfield.disp32 = !override;
5909                     }
5910                   operand_types[j].bitfield.disp32s = 0;
5911                   operand_types[j].bitfield.disp64 = 0;
5912                   break;
5913
5914                 case CODE_64BIT:
5915                   if (operand_types[j].bitfield.disp32s
5916                       || operand_types[j].bitfield.disp64)
5917                     {
5918                       operand_types[j].bitfield.disp64 &= !override;
5919                       operand_types[j].bitfield.disp32s &= !override;
5920                       operand_types[j].bitfield.disp32 = override;
5921                     }
5922                   operand_types[j].bitfield.disp16 = 0;
5923                   break;
5924                 }
5925             }
5926         }
5927
5928       /* Force 0x8b encoding for "mov foo@GOT, %eax".  */
5929       if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
5930         continue;
5931
5932       /* We check register size if needed.  */
5933       if (t->opcode_modifier.checkregsize)
5934         {
5935           check_register = (1 << t->operands) - 1;
5936           if (i.broadcast)
5937             check_register &= ~(1 << i.broadcast->operand);
5938         }
5939       else
5940         check_register = 0;
5941
5942       overlap0 = operand_type_and (i.types[0], operand_types[0]);
5943       switch (t->operands)
5944         {
5945         case 1:
5946           if (!operand_type_match (overlap0, i.types[0]))
5947             continue;
5948           break;
5949         case 2:
5950           /* xchg %eax, %eax is a special case. It is an alias for nop
5951              only in 32bit mode and we can use opcode 0x90.  In 64bit
5952              mode, we can't use 0x90 for xchg %eax, %eax since it should
5953              zero-extend %eax to %rax.  */
5954           if (flag_code == CODE_64BIT
5955               && t->base_opcode == 0x90
5956               && i.types[0].bitfield.instance == Accum
5957               && i.types[0].bitfield.dword
5958               && i.types[1].bitfield.instance == Accum
5959               && i.types[1].bitfield.dword)
5960             continue;
5961           /* xrelease mov %eax, <disp> is another special case. It must not
5962              match the accumulator-only encoding of mov.  */
5963           if (flag_code != CODE_64BIT
5964               && i.hle_prefix
5965               && t->base_opcode == 0xa0
5966               && i.types[0].bitfield.instance == Accum
5967               && (i.flags[1] & Operand_Mem))
5968             continue;
5969           /* Fall through.  */
5970
5971         case 3:
5972           if (!(size_match & MATCH_STRAIGHT))
5973             goto check_reverse;
5974           /* Reverse direction of operands if swapping is possible in the first
5975              place (operands need to be symmetric) and
5976              - the load form is requested, and the template is a store form,
5977              - the store form is requested, and the template is a load form,
5978              - the non-default (swapped) form is requested.  */
5979           overlap1 = operand_type_and (operand_types[0], operand_types[1]);
5980           if (t->opcode_modifier.d && i.reg_operands == i.operands
5981               && !operand_type_all_zero (&overlap1))
5982             switch (i.dir_encoding)
5983               {
5984               case dir_encoding_load:
5985                 if (operand_type_check (operand_types[i.operands - 1], anymem)
5986                     || t->opcode_modifier.regmem)
5987                   goto check_reverse;
5988                 break;
5989
5990               case dir_encoding_store:
5991                 if (!operand_type_check (operand_types[i.operands - 1], anymem)
5992                     && !t->opcode_modifier.regmem)
5993                   goto check_reverse;
5994                 break;
5995
5996               case dir_encoding_swap:
5997                 goto check_reverse;
5998
5999               case dir_encoding_default:
6000                 break;
6001               }
6002           /* If we want store form, we skip the current load.  */
6003           if ((i.dir_encoding == dir_encoding_store
6004                || i.dir_encoding == dir_encoding_swap)
6005               && i.mem_operands == 0
6006               && t->opcode_modifier.load)
6007             continue;
6008           /* Fall through.  */
6009         case 4:
6010         case 5:
6011           overlap1 = operand_type_and (i.types[1], operand_types[1]);
6012           if (!operand_type_match (overlap0, i.types[0])
6013               || !operand_type_match (overlap1, i.types[1])
6014               || ((check_register & 3) == 3
6015                   && !operand_type_register_match (i.types[0],
6016                                                    operand_types[0],
6017                                                    i.types[1],
6018                                                    operand_types[1])))
6019             {
6020               /* Check if other direction is valid ...  */
6021               if (!t->opcode_modifier.d)
6022                 continue;
6023
6024 check_reverse:
6025               if (!(size_match & MATCH_REVERSE))
6026                 continue;
6027               /* Try reversing direction of operands.  */
6028               overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
6029               overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
6030               if (!operand_type_match (overlap0, i.types[0])
6031                   || !operand_type_match (overlap1, i.types[i.operands - 1])
6032                   || (check_register
6033                       && !operand_type_register_match (i.types[0],
6034                                                        operand_types[i.operands - 1],
6035                                                        i.types[i.operands - 1],
6036                                                        operand_types[0])))
6037                 {
6038                   /* Does not match either direction.  */
6039                   continue;
6040                 }
6041               /* found_reverse_match holds which of D or FloatR
6042                  we've found.  */
6043               if (!t->opcode_modifier.d)
6044                 found_reverse_match = 0;
6045               else if (operand_types[0].bitfield.tbyte)
6046                 found_reverse_match = Opcode_FloatD;
6047               else if (operand_types[0].bitfield.xmmword
6048                        || operand_types[i.operands - 1].bitfield.xmmword
6049                        || operand_types[0].bitfield.class == RegMMX
6050                        || operand_types[i.operands - 1].bitfield.class == RegMMX
6051                        || is_any_vex_encoding(t))
6052                 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
6053                                       ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
6054               else
6055                 found_reverse_match = Opcode_D;
6056               if (t->opcode_modifier.floatr)
6057                 found_reverse_match |= Opcode_FloatR;
6058             }
6059           else
6060             {
6061               /* Found a forward 2 operand match here.  */
6062               switch (t->operands)
6063                 {
6064                 case 5:
6065                   overlap4 = operand_type_and (i.types[4],
6066                                                operand_types[4]);
6067                   /* Fall through.  */
6068                 case 4:
6069                   overlap3 = operand_type_and (i.types[3],
6070                                                operand_types[3]);
6071                   /* Fall through.  */
6072                 case 3:
6073                   overlap2 = operand_type_and (i.types[2],
6074                                                operand_types[2]);
6075                   break;
6076                 }
6077
6078               switch (t->operands)
6079                 {
6080                 case 5:
6081                   if (!operand_type_match (overlap4, i.types[4])
6082                       || !operand_type_register_match (i.types[3],
6083                                                        operand_types[3],
6084                                                        i.types[4],
6085                                                        operand_types[4]))
6086                     continue;
6087                   /* Fall through.  */
6088                 case 4:
6089                   if (!operand_type_match (overlap3, i.types[3])
6090                       || ((check_register & 0xa) == 0xa
6091                           && !operand_type_register_match (i.types[1],
6092                                                             operand_types[1],
6093                                                             i.types[3],
6094                                                             operand_types[3]))
6095                       || ((check_register & 0xc) == 0xc
6096                           && !operand_type_register_match (i.types[2],
6097                                                             operand_types[2],
6098                                                             i.types[3],
6099                                                             operand_types[3])))
6100                     continue;
6101                   /* Fall through.  */
6102                 case 3:
6103                   /* Here we make use of the fact that there are no
6104                      reverse match 3 operand instructions.  */
6105                   if (!operand_type_match (overlap2, i.types[2])
6106                       || ((check_register & 5) == 5
6107                           && !operand_type_register_match (i.types[0],
6108                                                             operand_types[0],
6109                                                             i.types[2],
6110                                                             operand_types[2]))
6111                       || ((check_register & 6) == 6
6112                           && !operand_type_register_match (i.types[1],
6113                                                             operand_types[1],
6114                                                             i.types[2],
6115                                                             operand_types[2])))
6116                     continue;
6117                   break;
6118                 }
6119             }
6120           /* Found either forward/reverse 2, 3 or 4 operand match here:
6121              slip through to break.  */
6122         }
6123
6124       /* Check if vector and VEX operands are valid.  */
6125       if (check_VecOperands (t) || VEX_check_operands (t))
6126         {
6127           specific_error = i.error;
6128           continue;
6129         }
6130
6131       /* We've found a match; break out of loop.  */
6132       break;
6133     }
6134
6135   if (t == current_templates->end)
6136     {
6137       /* We found no match.  */
6138       const char *err_msg;
6139       switch (specific_error ? specific_error : i.error)
6140         {
6141         default:
6142           abort ();
6143         case operand_size_mismatch:
6144           err_msg = _("operand size mismatch");
6145           break;
6146         case operand_type_mismatch:
6147           err_msg = _("operand type mismatch");
6148           break;
6149         case register_type_mismatch:
6150           err_msg = _("register type mismatch");
6151           break;
6152         case number_of_operands_mismatch:
6153           err_msg = _("number of operands mismatch");
6154           break;
6155         case invalid_instruction_suffix:
6156           err_msg = _("invalid instruction suffix");
6157           break;
6158         case bad_imm4:
6159           err_msg = _("constant doesn't fit in 4 bits");
6160           break;
6161         case unsupported_with_intel_mnemonic:
6162           err_msg = _("unsupported with Intel mnemonic");
6163           break;
6164         case unsupported_syntax:
6165           err_msg = _("unsupported syntax");
6166           break;
6167         case unsupported:
6168           as_bad (_("unsupported instruction `%s'"),
6169                   current_templates->start->name);
6170           return NULL;
6171         case invalid_vsib_address:
6172           err_msg = _("invalid VSIB address");
6173           break;
6174         case invalid_vector_register_set:
6175           err_msg = _("mask, index, and destination registers must be distinct");
6176           break;
6177         case unsupported_vector_index_register:
6178           err_msg = _("unsupported vector index register");
6179           break;
6180         case unsupported_broadcast:
6181           err_msg = _("unsupported broadcast");
6182           break;
6183         case broadcast_needed:
6184           err_msg = _("broadcast is needed for operand of such type");
6185           break;
6186         case unsupported_masking:
6187           err_msg = _("unsupported masking");
6188           break;
6189         case mask_not_on_destination:
6190           err_msg = _("mask not on destination operand");
6191           break;
6192         case no_default_mask:
6193           err_msg = _("default mask isn't allowed");
6194           break;
6195         case unsupported_rc_sae:
6196           err_msg = _("unsupported static rounding/sae");
6197           break;
6198         case rc_sae_operand_not_last_imm:
6199           if (intel_syntax)
6200             err_msg = _("RC/SAE operand must precede immediate operands");
6201           else
6202             err_msg = _("RC/SAE operand must follow immediate operands");
6203           break;
6204         case invalid_register_operand:
6205           err_msg = _("invalid register operand");
6206           break;
6207         }
6208       as_bad (_("%s for `%s'"), err_msg,
6209               current_templates->start->name);
6210       return NULL;
6211     }
6212
6213   if (!quiet_warnings)
6214     {
6215       if (!intel_syntax
6216           && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
6217         as_warn (_("indirect %s without `*'"), t->name);
6218
6219       if (t->opcode_modifier.isprefix
6220           && t->opcode_modifier.ignoresize)
6221         {
6222           /* Warn them that a data or address size prefix doesn't
6223              affect assembly of the next line of code.  */
6224           as_warn (_("stand-alone `%s' prefix"), t->name);
6225         }
6226     }
6227
6228   /* Copy the template we found.  */
6229   i.tm = *t;
6230
6231   if (addr_prefix_disp != -1)
6232     i.tm.operand_types[addr_prefix_disp]
6233       = operand_types[addr_prefix_disp];
6234
6235   if (found_reverse_match)
6236     {
6237       /* If we found a reverse match we must alter the opcode direction
6238          bit and clear/flip the regmem modifier one.  found_reverse_match
6239          holds bits to change (different for int & float insns).  */
6240
6241       i.tm.base_opcode ^= found_reverse_match;
6242
6243       i.tm.operand_types[0] = operand_types[i.operands - 1];
6244       i.tm.operand_types[i.operands - 1] = operand_types[0];
6245
6246       /* Certain SIMD insns have their load forms specified in the opcode
6247          table, and hence we need to _set_ RegMem instead of clearing it.
6248          We need to avoid setting the bit though on insns like KMOVW.  */
6249       i.tm.opcode_modifier.regmem
6250         = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6251           && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6252           && !i.tm.opcode_modifier.regmem;
6253     }
6254
6255   return t;
6256 }
6257
6258 static int
6259 check_string (void)
6260 {
6261   unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
6262   unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
6263
6264   if (i.seg[op] != NULL && i.seg[op] != &es)
6265     {
6266       as_bad (_("`%s' operand %u must use `%ses' segment"),
6267               i.tm.name,
6268               intel_syntax ? i.tm.operands - es_op : es_op + 1,
6269               register_prefix);
6270       return 0;
6271     }
6272
6273   /* There's only ever one segment override allowed per instruction.
6274      This instruction possibly has a legal segment override on the
6275      second operand, so copy the segment to where non-string
6276      instructions store it, allowing common code.  */
6277   i.seg[op] = i.seg[1];
6278
6279   return 1;
6280 }
6281
6282 static int
6283 process_suffix (void)
6284 {
6285   /* If matched instruction specifies an explicit instruction mnemonic
6286      suffix, use it.  */
6287   if (i.tm.opcode_modifier.size == SIZE16)
6288     i.suffix = WORD_MNEM_SUFFIX;
6289   else if (i.tm.opcode_modifier.size == SIZE32)
6290     i.suffix = LONG_MNEM_SUFFIX;
6291   else if (i.tm.opcode_modifier.size == SIZE64)
6292     i.suffix = QWORD_MNEM_SUFFIX;
6293   else if (i.reg_operands
6294            && (i.operands > 1 || i.types[0].bitfield.class == Reg))
6295     {
6296       /* If there's no instruction mnemonic suffix we try to invent one
6297          based on GPR operands.  */
6298       if (!i.suffix)
6299         {
6300           /* We take i.suffix from the last register operand specified,
6301              Destination register type is more significant than source
6302              register type.  crc32 in SSE4.2 prefers source register
6303              type. */
6304           unsigned int op = i.tm.base_opcode != 0xf20f38f0 ? i.operands : 1;
6305
6306           while (op--)
6307             if (i.tm.operand_types[op].bitfield.instance == InstanceNone
6308                 || i.tm.operand_types[op].bitfield.instance == Accum)
6309               {
6310                 if (i.types[op].bitfield.class != Reg)
6311                   continue;
6312                 if (i.types[op].bitfield.byte)
6313                   i.suffix = BYTE_MNEM_SUFFIX;
6314                 else if (i.types[op].bitfield.word)
6315                   i.suffix = WORD_MNEM_SUFFIX;
6316                 else if (i.types[op].bitfield.dword)
6317                   i.suffix = LONG_MNEM_SUFFIX;
6318                 else if (i.types[op].bitfield.qword)
6319                   i.suffix = QWORD_MNEM_SUFFIX;
6320                 else
6321                   continue;
6322                 break;
6323               }
6324         }
6325       else if (i.suffix == BYTE_MNEM_SUFFIX)
6326         {
6327           if (intel_syntax
6328               && i.tm.opcode_modifier.ignoresize
6329               && i.tm.opcode_modifier.no_bsuf)
6330             i.suffix = 0;
6331           else if (!check_byte_reg ())
6332             return 0;
6333         }
6334       else if (i.suffix == LONG_MNEM_SUFFIX)
6335         {
6336           if (intel_syntax
6337               && i.tm.opcode_modifier.ignoresize
6338               && i.tm.opcode_modifier.no_lsuf
6339               && !i.tm.opcode_modifier.todword
6340               && !i.tm.opcode_modifier.toqword)
6341             i.suffix = 0;
6342           else if (!check_long_reg ())
6343             return 0;
6344         }
6345       else if (i.suffix == QWORD_MNEM_SUFFIX)
6346         {
6347           if (intel_syntax
6348               && i.tm.opcode_modifier.ignoresize
6349               && i.tm.opcode_modifier.no_qsuf
6350               && !i.tm.opcode_modifier.todword
6351               && !i.tm.opcode_modifier.toqword)
6352             i.suffix = 0;
6353           else if (!check_qword_reg ())
6354             return 0;
6355         }
6356       else if (i.suffix == WORD_MNEM_SUFFIX)
6357         {
6358           if (intel_syntax
6359               && i.tm.opcode_modifier.ignoresize
6360               && i.tm.opcode_modifier.no_wsuf)
6361             i.suffix = 0;
6362           else if (!check_word_reg ())
6363             return 0;
6364         }
6365       else if (intel_syntax && i.tm.opcode_modifier.ignoresize)
6366         /* Do nothing if the instruction is going to ignore the prefix.  */
6367         ;
6368       else
6369         abort ();
6370     }
6371   else if (i.tm.opcode_modifier.defaultsize && !i.suffix)
6372     {
6373       i.suffix = stackop_size;
6374       if (stackop_size == LONG_MNEM_SUFFIX)
6375         {
6376           /* stackop_size is set to LONG_MNEM_SUFFIX for the
6377              .code16gcc directive to support 16-bit mode with
6378              32-bit address.  For IRET without a suffix, generate
6379              16-bit IRET (opcode 0xcf) to return from an interrupt
6380              handler.  */
6381           if (i.tm.base_opcode == 0xcf)
6382             {
6383               i.suffix = WORD_MNEM_SUFFIX;
6384               as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6385             }
6386           /* Warn about changed behavior for segment register push/pop.  */
6387           else if ((i.tm.base_opcode | 1) == 0x07)
6388             as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
6389                      i.tm.name);
6390         }
6391     }
6392   else if (!i.suffix
6393            && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
6394                || i.tm.opcode_modifier.jump == JUMP_BYTE
6395                || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
6396                || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6397                    && i.tm.extension_opcode <= 3)))
6398     {
6399       switch (flag_code)
6400         {
6401         case CODE_64BIT:
6402           if (!i.tm.opcode_modifier.no_qsuf)
6403             {
6404               i.suffix = QWORD_MNEM_SUFFIX;
6405               break;
6406             }
6407           /* Fall through.  */
6408         case CODE_32BIT:
6409           if (!i.tm.opcode_modifier.no_lsuf)
6410             i.suffix = LONG_MNEM_SUFFIX;
6411           break;
6412         case CODE_16BIT:
6413           if (!i.tm.opcode_modifier.no_wsuf)
6414             i.suffix = WORD_MNEM_SUFFIX;
6415           break;
6416         }
6417     }
6418
6419   if (!i.suffix
6420       && (!i.tm.opcode_modifier.defaultsize
6421           /* Also cover lret/retf/iret in 64-bit mode.  */
6422           || (flag_code == CODE_64BIT
6423               && !i.tm.opcode_modifier.no_lsuf
6424               && !i.tm.opcode_modifier.no_qsuf))
6425       && !i.tm.opcode_modifier.ignoresize
6426       /* Accept FLDENV et al without suffix.  */
6427       && (i.tm.opcode_modifier.no_ssuf || i.tm.opcode_modifier.floatmf))
6428     {
6429       unsigned int suffixes;
6430
6431       suffixes = !i.tm.opcode_modifier.no_bsuf;
6432       if (!i.tm.opcode_modifier.no_wsuf)
6433         suffixes |= 1 << 1;
6434       if (!i.tm.opcode_modifier.no_lsuf)
6435         suffixes |= 1 << 2;
6436       if (!i.tm.opcode_modifier.no_ldsuf)
6437         suffixes |= 1 << 3;
6438       if (!i.tm.opcode_modifier.no_ssuf)
6439         suffixes |= 1 << 4;
6440       if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6441         suffixes |= 1 << 5;
6442
6443       /* Are multiple suffixes allowed?  */
6444       if (suffixes & (suffixes - 1))
6445         {
6446           if (intel_syntax
6447               && (!i.tm.opcode_modifier.defaultsize
6448                   || operand_check == check_error))
6449             {
6450               as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
6451               return 0;
6452             }
6453           if (operand_check == check_error)
6454             {
6455               as_bad (_("no instruction mnemonic suffix given and "
6456                         "no register operands; can't size `%s'"), i.tm.name);
6457               return 0;
6458             }
6459           if (operand_check == check_warning)
6460             as_warn (_("%s; using default for `%s'"),
6461                        intel_syntax
6462                        ? _("ambiguous operand size")
6463                        : _("no instruction mnemonic suffix given and "
6464                            "no register operands"),
6465                        i.tm.name);
6466
6467           if (i.tm.opcode_modifier.floatmf)
6468             i.suffix = SHORT_MNEM_SUFFIX;
6469           else if (flag_code == CODE_16BIT)
6470             i.suffix = WORD_MNEM_SUFFIX;
6471           else if (!i.tm.opcode_modifier.no_lsuf)
6472             i.suffix = LONG_MNEM_SUFFIX;
6473           else
6474             i.suffix = QWORD_MNEM_SUFFIX;
6475         }
6476     }
6477
6478   /* Change the opcode based on the operand size given by i.suffix.  */
6479   switch (i.suffix)
6480     {
6481     /* Size floating point instruction.  */
6482     case LONG_MNEM_SUFFIX:
6483       if (i.tm.opcode_modifier.floatmf)
6484         {
6485           i.tm.base_opcode ^= 4;
6486           break;
6487         }
6488     /* fall through */
6489     case WORD_MNEM_SUFFIX:
6490     case QWORD_MNEM_SUFFIX:
6491       /* It's not a byte, select word/dword operation.  */
6492       if (i.tm.opcode_modifier.w)
6493         {
6494           if (i.tm.opcode_modifier.shortform)
6495             i.tm.base_opcode |= 8;
6496           else
6497             i.tm.base_opcode |= 1;
6498         }
6499     /* fall through */
6500     case SHORT_MNEM_SUFFIX:
6501       /* Now select between word & dword operations via the operand
6502          size prefix, except for instructions that will ignore this
6503          prefix anyway.  */
6504       if (i.reg_operands > 0
6505           && i.types[0].bitfield.class == Reg
6506           && i.tm.opcode_modifier.addrprefixopreg
6507           && (i.tm.operand_types[0].bitfield.instance == Accum
6508               || i.operands == 1))
6509         {
6510           /* The address size override prefix changes the size of the
6511              first operand.  */
6512           if ((flag_code == CODE_32BIT
6513                && i.op[0].regs->reg_type.bitfield.word)
6514               || (flag_code != CODE_32BIT
6515                   && i.op[0].regs->reg_type.bitfield.dword))
6516             if (!add_prefix (ADDR_PREFIX_OPCODE))
6517               return 0;
6518         }
6519       else if (i.suffix != QWORD_MNEM_SUFFIX
6520                && !i.tm.opcode_modifier.ignoresize
6521                && !i.tm.opcode_modifier.floatmf
6522                && !is_any_vex_encoding (&i.tm)
6523                && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
6524                    || (flag_code == CODE_64BIT
6525                        && i.tm.opcode_modifier.jump == JUMP_BYTE)))
6526         {
6527           unsigned int prefix = DATA_PREFIX_OPCODE;
6528
6529           if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
6530             prefix = ADDR_PREFIX_OPCODE;
6531
6532           if (!add_prefix (prefix))
6533             return 0;
6534         }
6535
6536       /* Set mode64 for an operand.  */
6537       if (i.suffix == QWORD_MNEM_SUFFIX
6538           && flag_code == CODE_64BIT
6539           && !i.tm.opcode_modifier.norex64
6540           /* Special case for xchg %rax,%rax.  It is NOP and doesn't
6541              need rex64. */
6542           && ! (i.operands == 2
6543                 && i.tm.base_opcode == 0x90
6544                 && i.tm.extension_opcode == None
6545                 && i.types[0].bitfield.instance == Accum
6546                 && i.types[0].bitfield.qword
6547                 && i.types[1].bitfield.instance == Accum
6548                 && i.types[1].bitfield.qword))
6549         i.rex |= REX_W;
6550
6551       break;
6552     }
6553
6554   if (i.reg_operands != 0
6555       && i.operands > 1
6556       && i.tm.opcode_modifier.addrprefixopreg
6557       && i.tm.operand_types[0].bitfield.instance != Accum)
6558     {
6559       /* Check invalid register operand when the address size override
6560          prefix changes the size of register operands.  */
6561       unsigned int op;
6562       enum { need_word, need_dword, need_qword } need;
6563
6564       if (flag_code == CODE_32BIT)
6565         need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
6566       else
6567         {
6568           if (i.prefix[ADDR_PREFIX])
6569             need = need_dword;
6570           else
6571             need = flag_code == CODE_64BIT ? need_qword : need_word;
6572         }
6573
6574       for (op = 0; op < i.operands; op++)
6575         if (i.types[op].bitfield.class == Reg
6576             && ((need == need_word
6577                  && !i.op[op].regs->reg_type.bitfield.word)
6578                 || (need == need_dword
6579                     && !i.op[op].regs->reg_type.bitfield.dword)
6580                 || (need == need_qword
6581                     && !i.op[op].regs->reg_type.bitfield.qword)))
6582           {
6583             as_bad (_("invalid register operand size for `%s'"),
6584                     i.tm.name);
6585             return 0;
6586           }
6587     }
6588
6589   return 1;
6590 }
6591
6592 static int
6593 check_byte_reg (void)
6594 {
6595   int op;
6596
6597   for (op = i.operands; --op >= 0;)
6598     {
6599       /* Skip non-register operands. */
6600       if (i.types[op].bitfield.class != Reg)
6601         continue;
6602
6603       /* If this is an eight bit register, it's OK.  If it's the 16 or
6604          32 bit version of an eight bit register, we will just use the
6605          low portion, and that's OK too.  */
6606       if (i.types[op].bitfield.byte)
6607         continue;
6608
6609       /* I/O port address operands are OK too.  */
6610       if (i.tm.operand_types[op].bitfield.instance == RegD
6611           && i.tm.operand_types[op].bitfield.word)
6612         continue;
6613
6614       /* crc32 doesn't generate this warning.  */
6615       if (i.tm.base_opcode == 0xf20f38f0)
6616         continue;
6617
6618       if ((i.types[op].bitfield.word
6619            || i.types[op].bitfield.dword
6620            || i.types[op].bitfield.qword)
6621           && i.op[op].regs->reg_num < 4
6622           /* Prohibit these changes in 64bit mode, since the lowering
6623              would be more complicated.  */
6624           && flag_code != CODE_64BIT)
6625         {
6626 #if REGISTER_WARNINGS
6627           if (!quiet_warnings)
6628             as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6629                      register_prefix,
6630                      (i.op[op].regs + (i.types[op].bitfield.word
6631                                        ? REGNAM_AL - REGNAM_AX
6632                                        : REGNAM_AL - REGNAM_EAX))->reg_name,
6633                      register_prefix,
6634                      i.op[op].regs->reg_name,
6635                      i.suffix);
6636 #endif
6637           continue;
6638         }
6639       /* Any other register is bad.  */
6640       if (i.types[op].bitfield.class == Reg
6641           || i.types[op].bitfield.class == RegMMX
6642           || i.types[op].bitfield.class == RegSIMD
6643           || i.types[op].bitfield.class == SReg
6644           || i.types[op].bitfield.class == RegCR
6645           || i.types[op].bitfield.class == RegDR
6646           || i.types[op].bitfield.class == RegTR)
6647         {
6648           as_bad (_("`%s%s' not allowed with `%s%c'"),
6649                   register_prefix,
6650                   i.op[op].regs->reg_name,
6651                   i.tm.name,
6652                   i.suffix);
6653           return 0;
6654         }
6655     }
6656   return 1;
6657 }
6658
6659 static int
6660 check_long_reg (void)
6661 {
6662   int op;
6663
6664   for (op = i.operands; --op >= 0;)
6665     /* Skip non-register operands. */
6666     if (i.types[op].bitfield.class != Reg)
6667       continue;
6668     /* Reject eight bit registers, except where the template requires
6669        them. (eg. movzb)  */
6670     else if (i.types[op].bitfield.byte
6671              && (i.tm.operand_types[op].bitfield.class == Reg
6672                  || i.tm.operand_types[op].bitfield.instance == Accum)
6673              && (i.tm.operand_types[op].bitfield.word
6674                  || i.tm.operand_types[op].bitfield.dword))
6675       {
6676         as_bad (_("`%s%s' not allowed with `%s%c'"),
6677                 register_prefix,
6678                 i.op[op].regs->reg_name,
6679                 i.tm.name,
6680                 i.suffix);
6681         return 0;
6682       }
6683     /* Error if the e prefix on a general reg is missing.  */
6684     else if (i.types[op].bitfield.word
6685              && (i.tm.operand_types[op].bitfield.class == Reg
6686                  || i.tm.operand_types[op].bitfield.instance == Accum)
6687              && i.tm.operand_types[op].bitfield.dword)
6688       {
6689         as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6690                 register_prefix, i.op[op].regs->reg_name,
6691                 i.suffix);
6692         return 0;
6693       }
6694     /* Warn if the r prefix on a general reg is present.  */
6695     else if (i.types[op].bitfield.qword
6696              && (i.tm.operand_types[op].bitfield.class == Reg
6697                  || i.tm.operand_types[op].bitfield.instance == Accum)
6698              && i.tm.operand_types[op].bitfield.dword)
6699       {
6700         if (intel_syntax
6701             && (i.tm.opcode_modifier.toqword
6702                 /* Also convert to QWORD for MOVSXD.  */
6703                 || i.tm.base_opcode == 0x63)
6704             && i.types[0].bitfield.class != RegSIMD)
6705           {
6706             /* Convert to QWORD.  We want REX byte. */
6707             i.suffix = QWORD_MNEM_SUFFIX;
6708           }
6709         else
6710           {
6711             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6712                     register_prefix, i.op[op].regs->reg_name,
6713                     i.suffix);
6714             return 0;
6715           }
6716       }
6717   return 1;
6718 }
6719
6720 static int
6721 check_qword_reg (void)
6722 {
6723   int op;
6724
6725   for (op = i.operands; --op >= 0; )
6726     /* Skip non-register operands. */
6727     if (i.types[op].bitfield.class != Reg)
6728       continue;
6729     /* Reject eight bit registers, except where the template requires
6730        them. (eg. movzb)  */
6731     else if (i.types[op].bitfield.byte
6732              && (i.tm.operand_types[op].bitfield.class == Reg
6733                  || i.tm.operand_types[op].bitfield.instance == Accum)
6734              && (i.tm.operand_types[op].bitfield.word
6735                  || i.tm.operand_types[op].bitfield.dword))
6736       {
6737         as_bad (_("`%s%s' not allowed with `%s%c'"),
6738                 register_prefix,
6739                 i.op[op].regs->reg_name,
6740                 i.tm.name,
6741                 i.suffix);
6742         return 0;
6743       }
6744     /* Warn if the r prefix on a general reg is missing.  */
6745     else if ((i.types[op].bitfield.word
6746               || i.types[op].bitfield.dword)
6747              && (i.tm.operand_types[op].bitfield.class == Reg
6748                  || i.tm.operand_types[op].bitfield.instance == Accum)
6749              && i.tm.operand_types[op].bitfield.qword)
6750       {
6751         /* Prohibit these changes in the 64bit mode, since the
6752            lowering is more complicated.  */
6753         if (intel_syntax
6754             && i.tm.opcode_modifier.todword
6755             && i.types[0].bitfield.class != RegSIMD)
6756           {
6757             /* Convert to DWORD.  We don't want REX byte. */
6758             i.suffix = LONG_MNEM_SUFFIX;
6759           }
6760         else
6761           {
6762             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6763                     register_prefix, i.op[op].regs->reg_name,
6764                     i.suffix);
6765             return 0;
6766           }
6767       }
6768   return 1;
6769 }
6770
6771 static int
6772 check_word_reg (void)
6773 {
6774   int op;
6775   for (op = i.operands; --op >= 0;)
6776     /* Skip non-register operands. */
6777     if (i.types[op].bitfield.class != Reg)
6778       continue;
6779     /* Reject eight bit registers, except where the template requires
6780        them. (eg. movzb)  */
6781     else if (i.types[op].bitfield.byte
6782              && (i.tm.operand_types[op].bitfield.class == Reg
6783                  || i.tm.operand_types[op].bitfield.instance == Accum)
6784              && (i.tm.operand_types[op].bitfield.word
6785                  || i.tm.operand_types[op].bitfield.dword))
6786       {
6787         as_bad (_("`%s%s' not allowed with `%s%c'"),
6788                 register_prefix,
6789                 i.op[op].regs->reg_name,
6790                 i.tm.name,
6791                 i.suffix);
6792         return 0;
6793       }
6794     /* Warn if the e or r prefix on a general reg is present.  */
6795     else if ((!quiet_warnings || flag_code == CODE_64BIT)
6796              && (i.types[op].bitfield.dword
6797                  || i.types[op].bitfield.qword)
6798              && (i.tm.operand_types[op].bitfield.class == Reg
6799                  || i.tm.operand_types[op].bitfield.instance == Accum)
6800              && i.tm.operand_types[op].bitfield.word)
6801       {
6802         /* Prohibit these changes in the 64bit mode, since the
6803            lowering is more complicated.  */
6804         if (flag_code == CODE_64BIT)
6805           {
6806             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6807                     register_prefix, i.op[op].regs->reg_name,
6808                     i.suffix);
6809             return 0;
6810           }
6811 #if REGISTER_WARNINGS
6812         as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6813                  register_prefix,
6814                  (i.op[op].regs + REGNAM_AX - REGNAM_EAX)->reg_name,
6815                  register_prefix, i.op[op].regs->reg_name, i.suffix);
6816 #endif
6817       }
6818   return 1;
6819 }
6820
6821 static int
6822 update_imm (unsigned int j)
6823 {
6824   i386_operand_type overlap = i.types[j];
6825   if ((overlap.bitfield.imm8
6826        || overlap.bitfield.imm8s
6827        || overlap.bitfield.imm16
6828        || overlap.bitfield.imm32
6829        || overlap.bitfield.imm32s
6830        || overlap.bitfield.imm64)
6831       && !operand_type_equal (&overlap, &imm8)
6832       && !operand_type_equal (&overlap, &imm8s)
6833       && !operand_type_equal (&overlap, &imm16)
6834       && !operand_type_equal (&overlap, &imm32)
6835       && !operand_type_equal (&overlap, &imm32s)
6836       && !operand_type_equal (&overlap, &imm64))
6837     {
6838       if (i.suffix)
6839         {
6840           i386_operand_type temp;
6841
6842           operand_type_set (&temp, 0);
6843           if (i.suffix == BYTE_MNEM_SUFFIX)
6844             {
6845               temp.bitfield.imm8 = overlap.bitfield.imm8;
6846               temp.bitfield.imm8s = overlap.bitfield.imm8s;
6847             }
6848           else if (i.suffix == WORD_MNEM_SUFFIX)
6849             temp.bitfield.imm16 = overlap.bitfield.imm16;
6850           else if (i.suffix == QWORD_MNEM_SUFFIX)
6851             {
6852               temp.bitfield.imm64 = overlap.bitfield.imm64;
6853               temp.bitfield.imm32s = overlap.bitfield.imm32s;
6854             }
6855           else
6856             temp.bitfield.imm32 = overlap.bitfield.imm32;
6857           overlap = temp;
6858         }
6859       else if (operand_type_equal (&overlap, &imm16_32_32s)
6860                || operand_type_equal (&overlap, &imm16_32)
6861                || operand_type_equal (&overlap, &imm16_32s))
6862         {
6863           if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
6864             overlap = imm16;
6865           else
6866             overlap = imm32s;
6867         }
6868       if (!operand_type_equal (&overlap, &imm8)
6869           && !operand_type_equal (&overlap, &imm8s)
6870           && !operand_type_equal (&overlap, &imm16)
6871           && !operand_type_equal (&overlap, &imm32)
6872           && !operand_type_equal (&overlap, &imm32s)
6873           && !operand_type_equal (&overlap, &imm64))
6874         {
6875           as_bad (_("no instruction mnemonic suffix given; "
6876                     "can't determine immediate size"));
6877           return 0;
6878         }
6879     }
6880   i.types[j] = overlap;
6881
6882   return 1;
6883 }
6884
6885 static int
6886 finalize_imm (void)
6887 {
6888   unsigned int j, n;
6889
6890   /* Update the first 2 immediate operands.  */
6891   n = i.operands > 2 ? 2 : i.operands;
6892   if (n)
6893     {
6894       for (j = 0; j < n; j++)
6895         if (update_imm (j) == 0)
6896           return 0;
6897
6898       /* The 3rd operand can't be immediate operand.  */
6899       gas_assert (operand_type_check (i.types[2], imm) == 0);
6900     }
6901
6902   return 1;
6903 }
6904
6905 static int
6906 process_operands (void)
6907 {
6908   /* Default segment register this instruction will use for memory
6909      accesses.  0 means unknown.  This is only for optimizing out
6910      unnecessary segment overrides.  */
6911   const seg_entry *default_seg = 0;
6912
6913   if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
6914     {
6915       unsigned int dupl = i.operands;
6916       unsigned int dest = dupl - 1;
6917       unsigned int j;
6918
6919       /* The destination must be an xmm register.  */
6920       gas_assert (i.reg_operands
6921                   && MAX_OPERANDS > dupl
6922                   && operand_type_equal (&i.types[dest], &regxmm));
6923
6924       if (i.tm.operand_types[0].bitfield.instance == Accum
6925           && i.tm.operand_types[0].bitfield.xmmword)
6926         {
6927           if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
6928             {
6929               /* Keep xmm0 for instructions with VEX prefix and 3
6930                  sources.  */
6931               i.tm.operand_types[0].bitfield.instance = InstanceNone;
6932               i.tm.operand_types[0].bitfield.class = RegSIMD;
6933               goto duplicate;
6934             }
6935           else
6936             {
6937               /* We remove the first xmm0 and keep the number of
6938                  operands unchanged, which in fact duplicates the
6939                  destination.  */
6940               for (j = 1; j < i.operands; j++)
6941                 {
6942                   i.op[j - 1] = i.op[j];
6943                   i.types[j - 1] = i.types[j];
6944                   i.tm.operand_types[j - 1] = i.tm.operand_types[j];
6945                   i.flags[j - 1] = i.flags[j];
6946                 }
6947             }
6948         }
6949       else if (i.tm.opcode_modifier.implicit1stxmm0)
6950         {
6951           gas_assert ((MAX_OPERANDS - 1) > dupl
6952                       && (i.tm.opcode_modifier.vexsources
6953                           == VEX3SOURCES));
6954
6955           /* Add the implicit xmm0 for instructions with VEX prefix
6956              and 3 sources.  */
6957           for (j = i.operands; j > 0; j--)
6958             {
6959               i.op[j] = i.op[j - 1];
6960               i.types[j] = i.types[j - 1];
6961               i.tm.operand_types[j] = i.tm.operand_types[j - 1];
6962               i.flags[j] = i.flags[j - 1];
6963             }
6964           i.op[0].regs
6965             = (const reg_entry *) hash_find (reg_hash, "xmm0");
6966           i.types[0] = regxmm;
6967           i.tm.operand_types[0] = regxmm;
6968
6969           i.operands += 2;
6970           i.reg_operands += 2;
6971           i.tm.operands += 2;
6972
6973           dupl++;
6974           dest++;
6975           i.op[dupl] = i.op[dest];
6976           i.types[dupl] = i.types[dest];
6977           i.tm.operand_types[dupl] = i.tm.operand_types[dest];
6978           i.flags[dupl] = i.flags[dest];
6979         }
6980       else
6981         {
6982 duplicate:
6983           i.operands++;
6984           i.reg_operands++;
6985           i.tm.operands++;
6986
6987           i.op[dupl] = i.op[dest];
6988           i.types[dupl] = i.types[dest];
6989           i.tm.operand_types[dupl] = i.tm.operand_types[dest];
6990           i.flags[dupl] = i.flags[dest];
6991         }
6992
6993        if (i.tm.opcode_modifier.immext)
6994          process_immext ();
6995     }
6996   else if (i.tm.operand_types[0].bitfield.instance == Accum
6997            && i.tm.operand_types[0].bitfield.xmmword)
6998     {
6999       unsigned int j;
7000
7001       for (j = 1; j < i.operands; j++)
7002         {
7003           i.op[j - 1] = i.op[j];
7004           i.types[j - 1] = i.types[j];
7005
7006           /* We need to adjust fields in i.tm since they are used by
7007              build_modrm_byte.  */
7008           i.tm.operand_types [j - 1] = i.tm.operand_types [j];
7009
7010           i.flags[j - 1] = i.flags[j];
7011         }
7012
7013       i.operands--;
7014       i.reg_operands--;
7015       i.tm.operands--;
7016     }
7017   else if (i.tm.opcode_modifier.implicitquadgroup)
7018     {
7019       unsigned int regnum, first_reg_in_group, last_reg_in_group;
7020
7021       /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
7022       gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
7023       regnum = register_number (i.op[1].regs);
7024       first_reg_in_group = regnum & ~3;
7025       last_reg_in_group = first_reg_in_group + 3;
7026       if (regnum != first_reg_in_group)
7027         as_warn (_("source register `%s%s' implicitly denotes"
7028                    " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
7029                  register_prefix, i.op[1].regs->reg_name,
7030                  register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
7031                  register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
7032                  i.tm.name);
7033     }
7034   else if (i.tm.opcode_modifier.regkludge)
7035     {
7036       /* The imul $imm, %reg instruction is converted into
7037          imul $imm, %reg, %reg, and the clr %reg instruction
7038          is converted into xor %reg, %reg.  */
7039
7040       unsigned int first_reg_op;
7041
7042       if (operand_type_check (i.types[0], reg))
7043         first_reg_op = 0;
7044       else
7045         first_reg_op = 1;
7046       /* Pretend we saw the extra register operand.  */
7047       gas_assert (i.reg_operands == 1
7048                   && i.op[first_reg_op + 1].regs == 0);
7049       i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7050       i.types[first_reg_op + 1] = i.types[first_reg_op];
7051       i.operands++;
7052       i.reg_operands++;
7053     }
7054
7055   if (i.tm.opcode_modifier.modrm)
7056     {
7057       /* The opcode is completed (modulo i.tm.extension_opcode which
7058          must be put into the modrm byte).  Now, we make the modrm and
7059          index base bytes based on all the info we've collected.  */
7060
7061       default_seg = build_modrm_byte ();
7062     }
7063   else if (i.types[0].bitfield.class == SReg)
7064     {
7065       if (flag_code != CODE_64BIT
7066           ? i.tm.base_opcode == POP_SEG_SHORT
7067             && i.op[0].regs->reg_num == 1
7068           : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
7069             && i.op[0].regs->reg_num < 4)
7070         {
7071           as_bad (_("you can't `%s %s%s'"),
7072                   i.tm.name, register_prefix, i.op[0].regs->reg_name);
7073           return 0;
7074         }
7075       if ( i.op[0].regs->reg_num > 3 && i.tm.opcode_length == 1 )
7076         {
7077           i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
7078           i.tm.opcode_length = 2;
7079         }
7080       i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
7081     }
7082   else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
7083     {
7084       default_seg = &ds;
7085     }
7086   else if (i.tm.opcode_modifier.isstring)
7087     {
7088       /* For the string instructions that allow a segment override
7089          on one of their operands, the default segment is ds.  */
7090       default_seg = &ds;
7091     }
7092   else if (i.tm.opcode_modifier.shortform)
7093     {
7094       /* The register or float register operand is in operand
7095          0 or 1.  */
7096       unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
7097
7098       /* Register goes in low 3 bits of opcode.  */
7099       i.tm.base_opcode |= i.op[op].regs->reg_num;
7100       if ((i.op[op].regs->reg_flags & RegRex) != 0)
7101         i.rex |= REX_B;
7102       if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7103         {
7104           /* Warn about some common errors, but press on regardless.
7105              The first case can be generated by gcc (<= 2.8.1).  */
7106           if (i.operands == 2)
7107             {
7108               /* Reversed arguments on faddp, fsubp, etc.  */
7109               as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7110                        register_prefix, i.op[!intel_syntax].regs->reg_name,
7111                        register_prefix, i.op[intel_syntax].regs->reg_name);
7112             }
7113           else
7114             {
7115               /* Extraneous `l' suffix on fp insn.  */
7116               as_warn (_("translating to `%s %s%s'"), i.tm.name,
7117                        register_prefix, i.op[0].regs->reg_name);
7118             }
7119         }
7120     }
7121
7122   if (i.tm.base_opcode == 0x8d /* lea */
7123       && i.seg[0]
7124       && !quiet_warnings)
7125     as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7126
7127   /* If a segment was explicitly specified, and the specified segment
7128      is not the default, use an opcode prefix to select it.  If we
7129      never figured out what the default segment is, then default_seg
7130      will be zero at this point, and the specified segment prefix will
7131      always be used.  */
7132   if ((i.seg[0]) && (i.seg[0] != default_seg))
7133     {
7134       if (!add_prefix (i.seg[0]->seg_prefix))
7135         return 0;
7136     }
7137   return 1;
7138 }
7139
7140 static const seg_entry *
7141 build_modrm_byte (void)
7142 {
7143   const seg_entry *default_seg = 0;
7144   unsigned int source, dest;
7145   int vex_3_sources;
7146
7147   vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
7148   if (vex_3_sources)
7149     {
7150       unsigned int nds, reg_slot;
7151       expressionS *exp;
7152
7153       dest = i.operands - 1;
7154       nds = dest - 1;
7155
7156       /* There are 2 kinds of instructions:
7157          1. 5 operands: 4 register operands or 3 register operands
7158          plus 1 memory operand plus one Imm4 operand, VexXDS, and
7159          VexW0 or VexW1.  The destination must be either XMM, YMM or
7160          ZMM register.
7161          2. 4 operands: 4 register operands or 3 register operands
7162          plus 1 memory operand, with VexXDS.  */
7163       gas_assert ((i.reg_operands == 4
7164                    || (i.reg_operands == 3 && i.mem_operands == 1))
7165                   && i.tm.opcode_modifier.vexvvvv == VEXXDS
7166                   && i.tm.opcode_modifier.vexw
7167                   && i.tm.operand_types[dest].bitfield.class == RegSIMD);
7168
7169       /* If VexW1 is set, the first non-immediate operand is the source and
7170          the second non-immediate one is encoded in the immediate operand.  */
7171       if (i.tm.opcode_modifier.vexw == VEXW1)
7172         {
7173           source = i.imm_operands;
7174           reg_slot = i.imm_operands + 1;
7175         }
7176       else
7177         {
7178           source = i.imm_operands + 1;
7179           reg_slot = i.imm_operands;
7180         }
7181
7182       if (i.imm_operands == 0)
7183         {
7184           /* When there is no immediate operand, generate an 8bit
7185              immediate operand to encode the first operand.  */
7186           exp = &im_expressions[i.imm_operands++];
7187           i.op[i.operands].imms = exp;
7188           i.types[i.operands] = imm8;
7189           i.operands++;
7190
7191           gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7192           exp->X_op = O_constant;
7193           exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
7194           gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7195         }
7196       else
7197         {
7198           gas_assert (i.imm_operands == 1);
7199           gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7200           gas_assert (!i.tm.opcode_modifier.immext);
7201
7202           /* Turn on Imm8 again so that output_imm will generate it.  */
7203           i.types[0].bitfield.imm8 = 1;
7204
7205           gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7206           i.op[0].imms->X_add_number
7207               |= register_number (i.op[reg_slot].regs) << 4;
7208           gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7209         }
7210
7211       gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
7212       i.vex.register_specifier = i.op[nds].regs;
7213     }
7214   else
7215     source = dest = 0;
7216
7217   /* i.reg_operands MUST be the number of real register operands;
7218      implicit registers do not count.  If there are 3 register
7219      operands, it must be a instruction with VexNDS.  For a
7220      instruction with VexNDD, the destination register is encoded
7221      in VEX prefix.  If there are 4 register operands, it must be
7222      a instruction with VEX prefix and 3 sources.  */
7223   if (i.mem_operands == 0
7224       && ((i.reg_operands == 2
7225            && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7226           || (i.reg_operands == 3
7227               && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7228           || (i.reg_operands == 4 && vex_3_sources)))
7229     {
7230       switch (i.operands)
7231         {
7232         case 2:
7233           source = 0;
7234           break;
7235         case 3:
7236           /* When there are 3 operands, one of them may be immediate,
7237              which may be the first or the last operand.  Otherwise,
7238              the first operand must be shift count register (cl) or it
7239              is an instruction with VexNDS. */
7240           gas_assert (i.imm_operands == 1
7241                       || (i.imm_operands == 0
7242                           && (i.tm.opcode_modifier.vexvvvv == VEXXDS
7243                               || (i.types[0].bitfield.instance == RegC
7244                                   && i.types[0].bitfield.byte))));
7245           if (operand_type_check (i.types[0], imm)
7246               || (i.types[0].bitfield.instance == RegC
7247                   && i.types[0].bitfield.byte))
7248             source = 1;
7249           else
7250             source = 0;
7251           break;
7252         case 4:
7253           /* When there are 4 operands, the first two must be 8bit
7254              immediate operands. The source operand will be the 3rd
7255              one.
7256
7257              For instructions with VexNDS, if the first operand
7258              an imm8, the source operand is the 2nd one.  If the last
7259              operand is imm8, the source operand is the first one.  */
7260           gas_assert ((i.imm_operands == 2
7261                        && i.types[0].bitfield.imm8
7262                        && i.types[1].bitfield.imm8)
7263                       || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7264                           && i.imm_operands == 1
7265                           && (i.types[0].bitfield.imm8
7266                               || i.types[i.operands - 1].bitfield.imm8
7267                               || i.rounding)));
7268           if (i.imm_operands == 2)
7269             source = 2;
7270           else
7271             {
7272               if (i.types[0].bitfield.imm8)
7273                 source = 1;
7274               else
7275                 source = 0;
7276             }
7277           break;
7278         case 5:
7279           if (is_evex_encoding (&i.tm))
7280             {
7281               /* For EVEX instructions, when there are 5 operands, the
7282                  first one must be immediate operand.  If the second one
7283                  is immediate operand, the source operand is the 3th
7284                  one.  If the last one is immediate operand, the source
7285                  operand is the 2nd one.  */
7286               gas_assert (i.imm_operands == 2
7287                           && i.tm.opcode_modifier.sae
7288                           && operand_type_check (i.types[0], imm));
7289               if (operand_type_check (i.types[1], imm))
7290                 source = 2;
7291               else if (operand_type_check (i.types[4], imm))
7292                 source = 1;
7293               else
7294                 abort ();
7295             }
7296           break;
7297         default:
7298           abort ();
7299         }
7300
7301       if (!vex_3_sources)
7302         {
7303           dest = source + 1;
7304
7305           /* RC/SAE operand could be between DEST and SRC.  That happens
7306              when one operand is GPR and the other one is XMM/YMM/ZMM
7307              register.  */
7308           if (i.rounding && i.rounding->operand == (int) dest)
7309             dest++;
7310
7311           if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7312             {
7313               /* For instructions with VexNDS, the register-only source
7314                  operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7315                  register.  It is encoded in VEX prefix.  */
7316
7317               i386_operand_type op;
7318               unsigned int vvvv;
7319
7320               /* Check register-only source operand when two source
7321                  operands are swapped.  */
7322               if (!i.tm.operand_types[source].bitfield.baseindex
7323                   && i.tm.operand_types[dest].bitfield.baseindex)
7324                 {
7325                   vvvv = source;
7326                   source = dest;
7327                 }
7328               else
7329                 vvvv = dest;
7330
7331               op = i.tm.operand_types[vvvv];
7332               if ((dest + 1) >= i.operands
7333                   || ((op.bitfield.class != Reg
7334                        || (!op.bitfield.dword && !op.bitfield.qword))
7335                       && op.bitfield.class != RegSIMD
7336                       && !operand_type_equal (&op, &regmask)))
7337                 abort ();
7338               i.vex.register_specifier = i.op[vvvv].regs;
7339               dest++;
7340             }
7341         }
7342
7343       i.rm.mode = 3;
7344       /* One of the register operands will be encoded in the i.rm.reg
7345          field, the other in the combined i.rm.mode and i.rm.regmem
7346          fields.  If no form of this instruction supports a memory
7347          destination operand, then we assume the source operand may
7348          sometimes be a memory operand and so we need to store the
7349          destination in the i.rm.reg field.  */
7350       if (!i.tm.opcode_modifier.regmem
7351           && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
7352         {
7353           i.rm.reg = i.op[dest].regs->reg_num;
7354           i.rm.regmem = i.op[source].regs->reg_num;
7355           if (i.op[dest].regs->reg_type.bitfield.class == RegMMX
7356                || i.op[source].regs->reg_type.bitfield.class == RegMMX)
7357             i.has_regmmx = TRUE;
7358           else if (i.op[dest].regs->reg_type.bitfield.class == RegSIMD
7359                    || i.op[source].regs->reg_type.bitfield.class == RegSIMD)
7360             {
7361               if (i.types[dest].bitfield.zmmword
7362                   || i.types[source].bitfield.zmmword)
7363                 i.has_regzmm = TRUE;
7364               else if (i.types[dest].bitfield.ymmword
7365                        || i.types[source].bitfield.ymmword)
7366                 i.has_regymm = TRUE;
7367               else
7368                 i.has_regxmm = TRUE;
7369             }
7370           if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7371             i.rex |= REX_R;
7372           if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7373             i.vrex |= REX_R;
7374           if ((i.op[source].regs->reg_flags & RegRex) != 0)
7375             i.rex |= REX_B;
7376           if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7377             i.vrex |= REX_B;
7378         }
7379       else
7380         {
7381           i.rm.reg = i.op[source].regs->reg_num;
7382           i.rm.regmem = i.op[dest].regs->reg_num;
7383           if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7384             i.rex |= REX_B;
7385           if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7386             i.vrex |= REX_B;
7387           if ((i.op[source].regs->reg_flags & RegRex) != 0)
7388             i.rex |= REX_R;
7389           if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7390             i.vrex |= REX_R;
7391         }
7392       if (flag_code != CODE_64BIT && (i.rex & REX_R))
7393         {
7394           if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
7395             abort ();
7396           i.rex &= ~REX_R;
7397           add_prefix (LOCK_PREFIX_OPCODE);
7398         }
7399     }
7400   else
7401     {                   /* If it's not 2 reg operands...  */
7402       unsigned int mem;
7403
7404       if (i.mem_operands)
7405         {
7406           unsigned int fake_zero_displacement = 0;
7407           unsigned int op;
7408
7409           for (op = 0; op < i.operands; op++)
7410             if (i.flags[op] & Operand_Mem)
7411               break;
7412           gas_assert (op < i.operands);
7413
7414           if (i.tm.opcode_modifier.vecsib)
7415             {
7416               if (i.index_reg->reg_num == RegIZ)
7417                 abort ();
7418
7419               i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7420               if (!i.base_reg)
7421                 {
7422                   i.sib.base = NO_BASE_REGISTER;
7423                   i.sib.scale = i.log2_scale_factor;
7424                   i.types[op].bitfield.disp8 = 0;
7425                   i.types[op].bitfield.disp16 = 0;
7426                   i.types[op].bitfield.disp64 = 0;
7427                   if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7428                     {
7429                       /* Must be 32 bit */
7430                       i.types[op].bitfield.disp32 = 1;
7431                       i.types[op].bitfield.disp32s = 0;
7432                     }
7433                   else
7434                     {
7435                       i.types[op].bitfield.disp32 = 0;
7436                       i.types[op].bitfield.disp32s = 1;
7437                     }
7438                 }
7439               i.sib.index = i.index_reg->reg_num;
7440               if ((i.index_reg->reg_flags & RegRex) != 0)
7441                 i.rex |= REX_X;
7442               if ((i.index_reg->reg_flags & RegVRex) != 0)
7443                 i.vrex |= REX_X;
7444             }
7445
7446           default_seg = &ds;
7447
7448           if (i.base_reg == 0)
7449             {
7450               i.rm.mode = 0;
7451               if (!i.disp_operands)
7452                 fake_zero_displacement = 1;
7453               if (i.index_reg == 0)
7454                 {
7455                   i386_operand_type newdisp;
7456
7457                   gas_assert (!i.tm.opcode_modifier.vecsib);
7458                   /* Operand is just <disp>  */
7459                   if (flag_code == CODE_64BIT)
7460                     {
7461                       /* 64bit mode overwrites the 32bit absolute
7462                          addressing by RIP relative addressing and
7463                          absolute addressing is encoded by one of the
7464                          redundant SIB forms.  */
7465                       i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7466                       i.sib.base = NO_BASE_REGISTER;
7467                       i.sib.index = NO_INDEX_REGISTER;
7468                       newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
7469                     }
7470                   else if ((flag_code == CODE_16BIT)
7471                            ^ (i.prefix[ADDR_PREFIX] != 0))
7472                     {
7473                       i.rm.regmem = NO_BASE_REGISTER_16;
7474                       newdisp = disp16;
7475                     }
7476                   else
7477                     {
7478                       i.rm.regmem = NO_BASE_REGISTER;
7479                       newdisp = disp32;
7480                     }
7481                   i.types[op] = operand_type_and_not (i.types[op], anydisp);
7482                   i.types[op] = operand_type_or (i.types[op], newdisp);
7483                 }
7484               else if (!i.tm.opcode_modifier.vecsib)
7485                 {
7486                   /* !i.base_reg && i.index_reg  */
7487                   if (i.index_reg->reg_num == RegIZ)
7488                     i.sib.index = NO_INDEX_REGISTER;
7489                   else
7490                     i.sib.index = i.index_reg->reg_num;
7491                   i.sib.base = NO_BASE_REGISTER;
7492                   i.sib.scale = i.log2_scale_factor;
7493                   i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7494                   i.types[op].bitfield.disp8 = 0;
7495                   i.types[op].bitfield.disp16 = 0;
7496                   i.types[op].bitfield.disp64 = 0;
7497                   if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7498                     {
7499                       /* Must be 32 bit */
7500                       i.types[op].bitfield.disp32 = 1;
7501                       i.types[op].bitfield.disp32s = 0;
7502                     }
7503                   else
7504                     {
7505                       i.types[op].bitfield.disp32 = 0;
7506                       i.types[op].bitfield.disp32s = 1;
7507                     }
7508                   if ((i.index_reg->reg_flags & RegRex) != 0)
7509                     i.rex |= REX_X;
7510                 }
7511             }
7512           /* RIP addressing for 64bit mode.  */
7513           else if (i.base_reg->reg_num == RegIP)
7514             {
7515               gas_assert (!i.tm.opcode_modifier.vecsib);
7516               i.rm.regmem = NO_BASE_REGISTER;
7517               i.types[op].bitfield.disp8 = 0;
7518               i.types[op].bitfield.disp16 = 0;
7519               i.types[op].bitfield.disp32 = 0;
7520               i.types[op].bitfield.disp32s = 1;
7521               i.types[op].bitfield.disp64 = 0;
7522               i.flags[op] |= Operand_PCrel;
7523               if (! i.disp_operands)
7524                 fake_zero_displacement = 1;
7525             }
7526           else if (i.base_reg->reg_type.bitfield.word)
7527             {
7528               gas_assert (!i.tm.opcode_modifier.vecsib);
7529               switch (i.base_reg->reg_num)
7530                 {
7531                 case 3: /* (%bx)  */
7532                   if (i.index_reg == 0)
7533                     i.rm.regmem = 7;
7534                   else /* (%bx,%si) -> 0, or (%bx,%di) -> 1  */
7535                     i.rm.regmem = i.index_reg->reg_num - 6;
7536                   break;
7537                 case 5: /* (%bp)  */
7538                   default_seg = &ss;
7539                   if (i.index_reg == 0)
7540                     {
7541                       i.rm.regmem = 6;
7542                       if (operand_type_check (i.types[op], disp) == 0)
7543                         {
7544                           /* fake (%bp) into 0(%bp)  */
7545                           i.types[op].bitfield.disp8 = 1;
7546                           fake_zero_displacement = 1;
7547                         }
7548                     }
7549                   else /* (%bp,%si) -> 2, or (%bp,%di) -> 3  */
7550                     i.rm.regmem = i.index_reg->reg_num - 6 + 2;
7551                   break;
7552                 default: /* (%si) -> 4 or (%di) -> 5  */
7553                   i.rm.regmem = i.base_reg->reg_num - 6 + 4;
7554                 }
7555               i.rm.mode = mode_from_disp_size (i.types[op]);
7556             }
7557           else /* i.base_reg and 32/64 bit mode  */
7558             {
7559               if (flag_code == CODE_64BIT
7560                   && operand_type_check (i.types[op], disp))
7561                 {
7562                   i.types[op].bitfield.disp16 = 0;
7563                   i.types[op].bitfield.disp64 = 0;
7564                   if (i.prefix[ADDR_PREFIX] == 0)
7565                     {
7566                       i.types[op].bitfield.disp32 = 0;
7567                       i.types[op].bitfield.disp32s = 1;
7568                     }
7569                   else
7570                     {
7571                       i.types[op].bitfield.disp32 = 1;
7572                       i.types[op].bitfield.disp32s = 0;
7573                     }
7574                 }
7575
7576               if (!i.tm.opcode_modifier.vecsib)
7577                 i.rm.regmem = i.base_reg->reg_num;
7578               if ((i.base_reg->reg_flags & RegRex) != 0)
7579                 i.rex |= REX_B;
7580               i.sib.base = i.base_reg->reg_num;
7581               /* x86-64 ignores REX prefix bit here to avoid decoder
7582                  complications.  */
7583               if (!(i.base_reg->reg_flags & RegRex)
7584                   && (i.base_reg->reg_num == EBP_REG_NUM
7585                    || i.base_reg->reg_num == ESP_REG_NUM))
7586                   default_seg = &ss;
7587               if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
7588                 {
7589                   fake_zero_displacement = 1;
7590                   i.types[op].bitfield.disp8 = 1;
7591                 }
7592               i.sib.scale = i.log2_scale_factor;
7593               if (i.index_reg == 0)
7594                 {
7595                   gas_assert (!i.tm.opcode_modifier.vecsib);
7596                   /* <disp>(%esp) becomes two byte modrm with no index
7597                      register.  We've already stored the code for esp
7598                      in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
7599                      Any base register besides %esp will not use the
7600                      extra modrm byte.  */
7601                   i.sib.index = NO_INDEX_REGISTER;
7602                 }
7603               else if (!i.tm.opcode_modifier.vecsib)
7604                 {
7605                   if (i.index_reg->reg_num == RegIZ)
7606                     i.sib.index = NO_INDEX_REGISTER;
7607                   else
7608                     i.sib.index = i.index_reg->reg_num;
7609                   i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7610                   if ((i.index_reg->reg_flags & RegRex) != 0)
7611                     i.rex |= REX_X;
7612                 }
7613
7614               if (i.disp_operands
7615                   && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
7616                       || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
7617                 i.rm.mode = 0;
7618               else
7619                 {
7620                   if (!fake_zero_displacement
7621                       && !i.disp_operands
7622                       && i.disp_encoding)
7623                     {
7624                       fake_zero_displacement = 1;
7625                       if (i.disp_encoding == disp_encoding_8bit)
7626                         i.types[op].bitfield.disp8 = 1;
7627                       else
7628                         i.types[op].bitfield.disp32 = 1;
7629                     }
7630                   i.rm.mode = mode_from_disp_size (i.types[op]);
7631                 }
7632             }
7633
7634           if (fake_zero_displacement)
7635             {
7636               /* Fakes a zero displacement assuming that i.types[op]
7637                  holds the correct displacement size.  */
7638               expressionS *exp;
7639
7640               gas_assert (i.op[op].disps == 0);
7641               exp = &disp_expressions[i.disp_operands++];
7642               i.op[op].disps = exp;
7643               exp->X_op = O_constant;
7644               exp->X_add_number = 0;
7645               exp->X_add_symbol = (symbolS *) 0;
7646               exp->X_op_symbol = (symbolS *) 0;
7647             }
7648
7649           mem = op;
7650         }
7651       else
7652         mem = ~0;
7653
7654       if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
7655         {
7656           if (operand_type_check (i.types[0], imm))
7657             i.vex.register_specifier = NULL;
7658           else
7659             {
7660               /* VEX.vvvv encodes one of the sources when the first
7661                  operand is not an immediate.  */
7662               if (i.tm.opcode_modifier.vexw == VEXW0)
7663                 i.vex.register_specifier = i.op[0].regs;
7664               else
7665                 i.vex.register_specifier = i.op[1].regs;
7666             }
7667
7668           /* Destination is a XMM register encoded in the ModRM.reg
7669              and VEX.R bit.  */
7670           i.rm.reg = i.op[2].regs->reg_num;
7671           if ((i.op[2].regs->reg_flags & RegRex) != 0)
7672             i.rex |= REX_R;
7673
7674           /* ModRM.rm and VEX.B encodes the other source.  */
7675           if (!i.mem_operands)
7676             {
7677               i.rm.mode = 3;
7678
7679               if (i.tm.opcode_modifier.vexw == VEXW0)
7680                 i.rm.regmem = i.op[1].regs->reg_num;
7681               else
7682                 i.rm.regmem = i.op[0].regs->reg_num;
7683
7684               if ((i.op[1].regs->reg_flags & RegRex) != 0)
7685                 i.rex |= REX_B;
7686             }
7687         }
7688       else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
7689         {
7690           i.vex.register_specifier = i.op[2].regs;
7691           if (!i.mem_operands)
7692             {
7693               i.rm.mode = 3;
7694               i.rm.regmem = i.op[1].regs->reg_num;
7695               if ((i.op[1].regs->reg_flags & RegRex) != 0)
7696                 i.rex |= REX_B;
7697             }
7698         }
7699       /* Fill in i.rm.reg or i.rm.regmem field with register operand
7700          (if any) based on i.tm.extension_opcode.  Again, we must be
7701          careful to make sure that segment/control/debug/test/MMX
7702          registers are coded into the i.rm.reg field.  */
7703       else if (i.reg_operands)
7704         {
7705           unsigned int op;
7706           unsigned int vex_reg = ~0;
7707
7708           for (op = 0; op < i.operands; op++)
7709             {
7710               if (i.types[op].bitfield.class == Reg
7711                   || i.types[op].bitfield.class == RegBND
7712                   || i.types[op].bitfield.class == RegMask
7713                   || i.types[op].bitfield.class == SReg
7714                   || i.types[op].bitfield.class == RegCR
7715                   || i.types[op].bitfield.class == RegDR
7716                   || i.types[op].bitfield.class == RegTR)
7717                 break;
7718               if (i.types[op].bitfield.class == RegSIMD)
7719                 {
7720                   if (i.types[op].bitfield.zmmword)
7721                     i.has_regzmm = TRUE;
7722                   else if (i.types[op].bitfield.ymmword)
7723                     i.has_regymm = TRUE;
7724                   else
7725                     i.has_regxmm = TRUE;
7726                   break;
7727                 }
7728               if (i.types[op].bitfield.class == RegMMX)
7729                 {
7730                   i.has_regmmx = TRUE;
7731                   break;
7732                 }
7733             }
7734
7735           if (vex_3_sources)
7736             op = dest;
7737           else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7738             {
7739               /* For instructions with VexNDS, the register-only
7740                  source operand is encoded in VEX prefix. */
7741               gas_assert (mem != (unsigned int) ~0);
7742
7743               if (op > mem)
7744                 {
7745                   vex_reg = op++;
7746                   gas_assert (op < i.operands);
7747                 }
7748               else
7749                 {
7750                   /* Check register-only source operand when two source
7751                      operands are swapped.  */
7752                   if (!i.tm.operand_types[op].bitfield.baseindex
7753                       && i.tm.operand_types[op + 1].bitfield.baseindex)
7754                     {
7755                       vex_reg = op;
7756                       op += 2;
7757                       gas_assert (mem == (vex_reg + 1)
7758                                   && op < i.operands);
7759                     }
7760                   else
7761                     {
7762                       vex_reg = op + 1;
7763                       gas_assert (vex_reg < i.operands);
7764                     }
7765                 }
7766             }
7767           else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
7768             {
7769               /* For instructions with VexNDD, the register destination
7770                  is encoded in VEX prefix.  */
7771               if (i.mem_operands == 0)
7772                 {
7773                   /* There is no memory operand.  */
7774                   gas_assert ((op + 2) == i.operands);
7775                   vex_reg = op + 1;
7776                 }
7777               else
7778                 {
7779                   /* There are only 2 non-immediate operands.  */
7780                   gas_assert (op < i.imm_operands + 2
7781                               && i.operands == i.imm_operands + 2);
7782                   vex_reg = i.imm_operands + 1;
7783                 }
7784             }
7785           else
7786             gas_assert (op < i.operands);
7787
7788           if (vex_reg != (unsigned int) ~0)
7789             {
7790               i386_operand_type *type = &i.tm.operand_types[vex_reg];
7791
7792               if ((type->bitfield.class != Reg
7793                    || (!type->bitfield.dword && !type->bitfield.qword))
7794                   && type->bitfield.class != RegSIMD
7795                   && !operand_type_equal (type, &regmask))
7796                 abort ();
7797
7798               i.vex.register_specifier = i.op[vex_reg].regs;
7799             }
7800
7801           /* Don't set OP operand twice.  */
7802           if (vex_reg != op)
7803             {
7804               /* If there is an extension opcode to put here, the
7805                  register number must be put into the regmem field.  */
7806               if (i.tm.extension_opcode != None)
7807                 {
7808                   i.rm.regmem = i.op[op].regs->reg_num;
7809                   if ((i.op[op].regs->reg_flags & RegRex) != 0)
7810                     i.rex |= REX_B;
7811                   if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7812                     i.vrex |= REX_B;
7813                 }
7814               else
7815                 {
7816                   i.rm.reg = i.op[op].regs->reg_num;
7817                   if ((i.op[op].regs->reg_flags & RegRex) != 0)
7818                     i.rex |= REX_R;
7819                   if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7820                     i.vrex |= REX_R;
7821                 }
7822             }
7823
7824           /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
7825              must set it to 3 to indicate this is a register operand
7826              in the regmem field.  */
7827           if (!i.mem_operands)
7828             i.rm.mode = 3;
7829         }
7830
7831       /* Fill in i.rm.reg field with extension opcode (if any).  */
7832       if (i.tm.extension_opcode != None)
7833         i.rm.reg = i.tm.extension_opcode;
7834     }
7835   return default_seg;
7836 }
7837
7838 static unsigned int
7839 flip_code16 (unsigned int code16)
7840 {
7841   gas_assert (i.tm.operands == 1);
7842
7843   return !(i.prefix[REX_PREFIX] & REX_W)
7844          && (code16 ? i.tm.operand_types[0].bitfield.disp32
7845                       || i.tm.operand_types[0].bitfield.disp32s
7846                     : i.tm.operand_types[0].bitfield.disp16)
7847          ? CODE16 : 0;
7848 }
7849
7850 static void
7851 output_branch (void)
7852 {
7853   char *p;
7854   int size;
7855   int code16;
7856   int prefix;
7857   relax_substateT subtype;
7858   symbolS *sym;
7859   offsetT off;
7860
7861   code16 = flag_code == CODE_16BIT ? CODE16 : 0;
7862   size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
7863
7864   prefix = 0;
7865   if (i.prefix[DATA_PREFIX] != 0)
7866     {
7867       prefix = 1;
7868       i.prefixes -= 1;
7869       code16 ^= flip_code16(code16);
7870     }
7871   /* Pentium4 branch hints.  */
7872   if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
7873       || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
7874     {
7875       prefix++;
7876       i.prefixes--;
7877     }
7878   if (i.prefix[REX_PREFIX] != 0)
7879     {
7880       prefix++;
7881       i.prefixes--;
7882     }
7883
7884   /* BND prefixed jump.  */
7885   if (i.prefix[BND_PREFIX] != 0)
7886     {
7887       prefix++;
7888       i.prefixes--;
7889     }
7890
7891   if (i.prefixes != 0)
7892     as_warn (_("skipping prefixes on `%s'"), i.tm.name);
7893
7894   /* It's always a symbol;  End frag & setup for relax.
7895      Make sure there is enough room in this frag for the largest
7896      instruction we may generate in md_convert_frag.  This is 2
7897      bytes for the opcode and room for the prefix and largest
7898      displacement.  */
7899   frag_grow (prefix + 2 + 4);
7900   /* Prefix and 1 opcode byte go in fr_fix.  */
7901   p = frag_more (prefix + 1);
7902   if (i.prefix[DATA_PREFIX] != 0)
7903     *p++ = DATA_PREFIX_OPCODE;
7904   if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
7905       || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
7906     *p++ = i.prefix[SEG_PREFIX];
7907   if (i.prefix[BND_PREFIX] != 0)
7908     *p++ = BND_PREFIX_OPCODE;
7909   if (i.prefix[REX_PREFIX] != 0)
7910     *p++ = i.prefix[REX_PREFIX];
7911   *p = i.tm.base_opcode;
7912
7913   if ((unsigned char) *p == JUMP_PC_RELATIVE)
7914     subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
7915   else if (cpu_arch_flags.bitfield.cpui386)
7916     subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
7917   else
7918     subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
7919   subtype |= code16;
7920
7921   sym = i.op[0].disps->X_add_symbol;
7922   off = i.op[0].disps->X_add_number;
7923
7924   if (i.op[0].disps->X_op != O_constant
7925       && i.op[0].disps->X_op != O_symbol)
7926     {
7927       /* Handle complex expressions.  */
7928       sym = make_expr_symbol (i.op[0].disps);
7929       off = 0;
7930     }
7931
7932   /* 1 possible extra opcode + 4 byte displacement go in var part.
7933      Pass reloc in fr_var.  */
7934   frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
7935 }
7936
7937 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
7938 /* Return TRUE iff PLT32 relocation should be used for branching to
7939    symbol S.  */
7940
7941 static bfd_boolean
7942 need_plt32_p (symbolS *s)
7943 {
7944   /* PLT32 relocation is ELF only.  */
7945   if (!IS_ELF)
7946     return FALSE;
7947
7948 #ifdef TE_SOLARIS
7949   /* Don't emit PLT32 relocation on Solaris: neither native linker nor
7950      krtld support it.  */
7951   return FALSE;
7952 #endif
7953
7954   /* Since there is no need to prepare for PLT branch on x86-64, we
7955      can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
7956      be used as a marker for 32-bit PC-relative branches.  */
7957   if (!object_64bit)
7958     return FALSE;
7959
7960   /* Weak or undefined symbol need PLT32 relocation.  */
7961   if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
7962     return TRUE;
7963
7964   /* Non-global symbol doesn't need PLT32 relocation.  */
7965   if (! S_IS_EXTERNAL (s))
7966     return FALSE;
7967
7968   /* Other global symbols need PLT32 relocation.  NB: Symbol with
7969      non-default visibilities are treated as normal global symbol
7970      so that PLT32 relocation can be used as a marker for 32-bit
7971      PC-relative branches.  It is useful for linker relaxation.  */
7972   return TRUE;
7973 }
7974 #endif
7975
7976 static void
7977 output_jump (void)
7978 {
7979   char *p;
7980   int size;
7981   fixS *fixP;
7982   bfd_reloc_code_real_type jump_reloc = i.reloc[0];
7983
7984   if (i.tm.opcode_modifier.jump == JUMP_BYTE)
7985     {
7986       /* This is a loop or jecxz type instruction.  */
7987       size = 1;
7988       if (i.prefix[ADDR_PREFIX] != 0)
7989         {
7990           FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
7991           i.prefixes -= 1;
7992         }
7993       /* Pentium4 branch hints.  */
7994       if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
7995           || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
7996         {
7997           FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
7998           i.prefixes--;
7999         }
8000     }
8001   else
8002     {
8003       int code16;
8004
8005       code16 = 0;
8006       if (flag_code == CODE_16BIT)
8007         code16 = CODE16;
8008
8009       if (i.prefix[DATA_PREFIX] != 0)
8010         {
8011           FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
8012           i.prefixes -= 1;
8013           code16 ^= flip_code16(code16);
8014         }
8015
8016       size = 4;
8017       if (code16)
8018         size = 2;
8019     }
8020
8021   /* BND prefixed jump.  */
8022   if (i.prefix[BND_PREFIX] != 0)
8023     {
8024       FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
8025       i.prefixes -= 1;
8026     }
8027
8028   if (i.prefix[REX_PREFIX] != 0)
8029     {
8030       FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
8031       i.prefixes -= 1;
8032     }
8033
8034   if (i.prefixes != 0)
8035     as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8036
8037   p = frag_more (i.tm.opcode_length + size);
8038   switch (i.tm.opcode_length)
8039     {
8040     case 2:
8041       *p++ = i.tm.base_opcode >> 8;
8042       /* Fall through.  */
8043     case 1:
8044       *p++ = i.tm.base_opcode;
8045       break;
8046     default:
8047       abort ();
8048     }
8049
8050 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8051   if (size == 4
8052       && jump_reloc == NO_RELOC
8053       && need_plt32_p (i.op[0].disps->X_add_symbol))
8054     jump_reloc = BFD_RELOC_X86_64_PLT32;
8055 #endif
8056
8057   jump_reloc = reloc (size, 1, 1, jump_reloc);
8058
8059   fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8060                       i.op[0].disps, 1, jump_reloc);
8061
8062   /* All jumps handled here are signed, but don't use a signed limit
8063      check for 32 and 16 bit jumps as we want to allow wrap around at
8064      4G and 64k respectively.  */
8065   if (size == 1)
8066     fixP->fx_signed = 1;
8067 }
8068
8069 static void
8070 output_interseg_jump (void)
8071 {
8072   char *p;
8073   int size;
8074   int prefix;
8075   int code16;
8076
8077   code16 = 0;
8078   if (flag_code == CODE_16BIT)
8079     code16 = CODE16;
8080
8081   prefix = 0;
8082   if (i.prefix[DATA_PREFIX] != 0)
8083     {
8084       prefix = 1;
8085       i.prefixes -= 1;
8086       code16 ^= CODE16;
8087     }
8088
8089   gas_assert (!i.prefix[REX_PREFIX]);
8090
8091   size = 4;
8092   if (code16)
8093     size = 2;
8094
8095   if (i.prefixes != 0)
8096     as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8097
8098   /* 1 opcode; 2 segment; offset  */
8099   p = frag_more (prefix + 1 + 2 + size);
8100
8101   if (i.prefix[DATA_PREFIX] != 0)
8102     *p++ = DATA_PREFIX_OPCODE;
8103
8104   if (i.prefix[REX_PREFIX] != 0)
8105     *p++ = i.prefix[REX_PREFIX];
8106
8107   *p++ = i.tm.base_opcode;
8108   if (i.op[1].imms->X_op == O_constant)
8109     {
8110       offsetT n = i.op[1].imms->X_add_number;
8111
8112       if (size == 2
8113           && !fits_in_unsigned_word (n)
8114           && !fits_in_signed_word (n))
8115         {
8116           as_bad (_("16-bit jump out of range"));
8117           return;
8118         }
8119       md_number_to_chars (p, n, size);
8120     }
8121   else
8122     fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8123                  i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
8124   if (i.op[0].imms->X_op != O_constant)
8125     as_bad (_("can't handle non absolute segment in `%s'"),
8126             i.tm.name);
8127   md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
8128 }
8129
8130 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8131 void
8132 x86_cleanup (void)
8133 {
8134   char *p;
8135   asection *seg = now_seg;
8136   subsegT subseg = now_subseg;
8137   asection *sec;
8138   unsigned int alignment, align_size_1;
8139   unsigned int isa_1_descsz, feature_2_descsz, descsz;
8140   unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8141   unsigned int padding;
8142
8143   if (!IS_ELF || !x86_used_note)
8144     return;
8145
8146   x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8147
8148   /* The .note.gnu.property section layout:
8149
8150      Field      Length          Contents
8151      ----       ----            ----
8152      n_namsz    4               4
8153      n_descsz   4               The note descriptor size
8154      n_type     4               NT_GNU_PROPERTY_TYPE_0
8155      n_name     4               "GNU"
8156      n_desc     n_descsz        The program property array
8157      ....       ....            ....
8158    */
8159
8160   /* Create the .note.gnu.property section.  */
8161   sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
8162   bfd_set_section_flags (sec,
8163                          (SEC_ALLOC
8164                           | SEC_LOAD
8165                           | SEC_DATA
8166                           | SEC_HAS_CONTENTS
8167                           | SEC_READONLY));
8168
8169   if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8170     {
8171       align_size_1 = 7;
8172       alignment = 3;
8173     }
8174   else
8175     {
8176       align_size_1 = 3;
8177       alignment = 2;
8178     }
8179
8180   bfd_set_section_alignment (sec, alignment);
8181   elf_section_type (sec) = SHT_NOTE;
8182
8183   /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8184                                   + 4-byte data  */
8185   isa_1_descsz_raw = 4 + 4 + 4;
8186   /* Align GNU_PROPERTY_X86_ISA_1_USED.  */
8187   isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8188
8189   feature_2_descsz_raw = isa_1_descsz;
8190   /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8191                                       + 4-byte data  */
8192   feature_2_descsz_raw += 4 + 4 + 4;
8193   /* Align GNU_PROPERTY_X86_FEATURE_2_USED.  */
8194   feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8195                       & ~align_size_1);
8196
8197   descsz = feature_2_descsz;
8198   /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz.  */
8199   p = frag_more (4 + 4 + 4 + 4 + descsz);
8200
8201   /* Write n_namsz.  */
8202   md_number_to_chars (p, (valueT) 4, 4);
8203
8204   /* Write n_descsz.  */
8205   md_number_to_chars (p + 4, (valueT) descsz, 4);
8206
8207   /* Write n_type.  */
8208   md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8209
8210   /* Write n_name.  */
8211   memcpy (p + 4 * 3, "GNU", 4);
8212
8213   /* Write 4-byte type.  */
8214   md_number_to_chars (p + 4 * 4,
8215                       (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8216
8217   /* Write 4-byte data size.  */
8218   md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8219
8220   /* Write 4-byte data.  */
8221   md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8222
8223   /* Zero out paddings.  */
8224   padding = isa_1_descsz - isa_1_descsz_raw;
8225   if (padding)
8226     memset (p + 4 * 7, 0, padding);
8227
8228   /* Write 4-byte type.  */
8229   md_number_to_chars (p + isa_1_descsz + 4 * 4,
8230                       (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8231
8232   /* Write 4-byte data size.  */
8233   md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8234
8235   /* Write 4-byte data.  */
8236   md_number_to_chars (p + isa_1_descsz + 4 * 6,
8237                       (valueT) x86_feature_2_used, 4);
8238
8239   /* Zero out paddings.  */
8240   padding = feature_2_descsz - feature_2_descsz_raw;
8241   if (padding)
8242     memset (p + isa_1_descsz + 4 * 7, 0, padding);
8243
8244   /* We probably can't restore the current segment, for there likely
8245      isn't one yet...  */
8246   if (seg && subseg)
8247     subseg_set (seg, subseg);
8248 }
8249 #endif
8250
8251 static unsigned int
8252 encoding_length (const fragS *start_frag, offsetT start_off,
8253                  const char *frag_now_ptr)
8254 {
8255   unsigned int len = 0;
8256
8257   if (start_frag != frag_now)
8258     {
8259       const fragS *fr = start_frag;
8260
8261       do {
8262         len += fr->fr_fix;
8263         fr = fr->fr_next;
8264       } while (fr && fr != frag_now);
8265     }
8266
8267   return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8268 }
8269
8270 /* Return 1 for test, and, cmp, add, sub, inc and dec which may
8271    be macro-fused with conditional jumps.  */
8272
8273 static int
8274 maybe_fused_with_jcc_p (void)
8275 {
8276   /* No RIP address.  */
8277   if (i.base_reg && i.base_reg->reg_num == RegIP)
8278     return 0;
8279
8280   /* No VEX/EVEX encoding.  */
8281   if (is_any_vex_encoding (&i.tm))
8282     return 0;
8283
8284   /* and, add, sub with destination register.  */
8285   if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
8286       || i.tm.base_opcode <= 5
8287       || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
8288       || ((i.tm.base_opcode | 3) == 0x83
8289           && ((i.tm.extension_opcode | 1) == 0x5
8290               || i.tm.extension_opcode == 0x0)))
8291     return (i.types[1].bitfield.class == Reg
8292             || i.types[1].bitfield.instance == Accum);
8293
8294   /* test, cmp with any register.  */
8295   if ((i.tm.base_opcode | 1) == 0x85
8296       || (i.tm.base_opcode | 1) == 0xa9
8297       || ((i.tm.base_opcode | 1) == 0xf7
8298           && i.tm.extension_opcode == 0)
8299       || (i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
8300       || ((i.tm.base_opcode | 3) == 0x83
8301           && (i.tm.extension_opcode == 0x7)))
8302     return (i.types[0].bitfield.class == Reg
8303             || i.types[0].bitfield.instance == Accum
8304             || i.types[1].bitfield.class == Reg
8305             || i.types[1].bitfield.instance == Accum);
8306
8307   /* inc, dec with any register.   */
8308   if ((i.tm.cpu_flags.bitfield.cpuno64
8309        && (i.tm.base_opcode | 0xf) == 0x4f)
8310       || ((i.tm.base_opcode | 1) == 0xff
8311           && i.tm.extension_opcode <= 0x1))
8312     return (i.types[0].bitfield.class == Reg
8313             || i.types[0].bitfield.instance == Accum);
8314
8315   return 0;
8316 }
8317
8318 /* Return 1 if a FUSED_JCC_PADDING frag should be generated.  */
8319
8320 static int
8321 add_fused_jcc_padding_frag_p (void)
8322 {
8323   /* NB: Don't work with COND_JUMP86 without i386.  */
8324   if (!align_branch_power
8325       || now_seg == absolute_section
8326       || !cpu_arch_flags.bitfield.cpui386
8327       || !(align_branch & align_branch_fused_bit))
8328     return 0;
8329
8330   if (maybe_fused_with_jcc_p ())
8331     {
8332       if (last_insn.kind == last_insn_other
8333           || last_insn.seg != now_seg)
8334         return 1;
8335       if (flag_debug)
8336         as_warn_where (last_insn.file, last_insn.line,
8337                        _("`%s` skips -malign-branch-boundary on `%s`"),
8338                        last_insn.name, i.tm.name);
8339     }
8340
8341   return 0;
8342 }
8343
8344 /* Return 1 if a BRANCH_PREFIX frag should be generated.  */
8345
8346 static int
8347 add_branch_prefix_frag_p (void)
8348 {
8349   /* NB: Don't work with COND_JUMP86 without i386.  Don't add prefix
8350      to PadLock instructions since they include prefixes in opcode.  */
8351   if (!align_branch_power
8352       || !align_branch_prefix_size
8353       || now_seg == absolute_section
8354       || i.tm.cpu_flags.bitfield.cpupadlock
8355       || !cpu_arch_flags.bitfield.cpui386)
8356     return 0;
8357
8358   /* Don't add prefix if it is a prefix or there is no operand in case
8359      that segment prefix is special.  */
8360   if (!i.operands || i.tm.opcode_modifier.isprefix)
8361     return 0;
8362
8363   if (last_insn.kind == last_insn_other
8364       || last_insn.seg != now_seg)
8365     return 1;
8366
8367   if (flag_debug)
8368     as_warn_where (last_insn.file, last_insn.line,
8369                    _("`%s` skips -malign-branch-boundary on `%s`"),
8370                    last_insn.name, i.tm.name);
8371
8372   return 0;
8373 }
8374
8375 /* Return 1 if a BRANCH_PADDING frag should be generated.  */
8376
8377 static int
8378 add_branch_padding_frag_p (enum align_branch_kind *branch_p)
8379 {
8380   int add_padding;
8381
8382   /* NB: Don't work with COND_JUMP86 without i386.  */
8383   if (!align_branch_power
8384       || now_seg == absolute_section
8385       || !cpu_arch_flags.bitfield.cpui386)
8386     return 0;
8387
8388   add_padding = 0;
8389
8390   /* Check for jcc and direct jmp.  */
8391   if (i.tm.opcode_modifier.jump == JUMP)
8392     {
8393       if (i.tm.base_opcode == JUMP_PC_RELATIVE)
8394         {
8395           *branch_p = align_branch_jmp;
8396           add_padding = align_branch & align_branch_jmp_bit;
8397         }
8398       else
8399         {
8400           *branch_p = align_branch_jcc;
8401           if ((align_branch & align_branch_jcc_bit))
8402             add_padding = 1;
8403         }
8404     }
8405   else if (is_any_vex_encoding (&i.tm))
8406     return 0;
8407   else if ((i.tm.base_opcode | 1) == 0xc3)
8408     {
8409       /* Near ret.  */
8410       *branch_p = align_branch_ret;
8411       if ((align_branch & align_branch_ret_bit))
8412         add_padding = 1;
8413     }
8414   else
8415     {
8416       /* Check for indirect jmp, direct and indirect calls.  */
8417       if (i.tm.base_opcode == 0xe8)
8418         {
8419           /* Direct call.  */
8420           *branch_p = align_branch_call;
8421           if ((align_branch & align_branch_call_bit))
8422             add_padding = 1;
8423         }
8424       else if (i.tm.base_opcode == 0xff
8425                && (i.tm.extension_opcode == 2
8426                    || i.tm.extension_opcode == 4))
8427         {
8428           /* Indirect call and jmp.  */
8429           *branch_p = align_branch_indirect;
8430           if ((align_branch & align_branch_indirect_bit))
8431             add_padding = 1;
8432         }
8433
8434       if (add_padding
8435           && i.disp_operands
8436           && tls_get_addr
8437           && (i.op[0].disps->X_op == O_symbol
8438               || (i.op[0].disps->X_op == O_subtract
8439                   && i.op[0].disps->X_op_symbol == GOT_symbol)))
8440         {
8441           symbolS *s = i.op[0].disps->X_add_symbol;
8442           /* No padding to call to global or undefined tls_get_addr.  */
8443           if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
8444               && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
8445             return 0;
8446         }
8447     }
8448
8449   if (add_padding
8450       && last_insn.kind != last_insn_other
8451       && last_insn.seg == now_seg)
8452     {
8453       if (flag_debug)
8454         as_warn_where (last_insn.file, last_insn.line,
8455                        _("`%s` skips -malign-branch-boundary on `%s`"),
8456                        last_insn.name, i.tm.name);
8457       return 0;
8458     }
8459
8460   return add_padding;
8461 }
8462
8463 static void
8464 output_insn (void)
8465 {
8466   fragS *insn_start_frag;
8467   offsetT insn_start_off;
8468   fragS *fragP = NULL;
8469   enum align_branch_kind branch = align_branch_none;
8470
8471 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8472   if (IS_ELF && x86_used_note)
8473     {
8474       if (i.tm.cpu_flags.bitfield.cpucmov)
8475         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_CMOV;
8476       if (i.tm.cpu_flags.bitfield.cpusse)
8477         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE;
8478       if (i.tm.cpu_flags.bitfield.cpusse2)
8479         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE2;
8480       if (i.tm.cpu_flags.bitfield.cpusse3)
8481         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE3;
8482       if (i.tm.cpu_flags.bitfield.cpussse3)
8483         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSSE3;
8484       if (i.tm.cpu_flags.bitfield.cpusse4_1)
8485         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_1;
8486       if (i.tm.cpu_flags.bitfield.cpusse4_2)
8487         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_2;
8488       if (i.tm.cpu_flags.bitfield.cpuavx)
8489         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX;
8490       if (i.tm.cpu_flags.bitfield.cpuavx2)
8491         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX2;
8492       if (i.tm.cpu_flags.bitfield.cpufma)
8493         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_FMA;
8494       if (i.tm.cpu_flags.bitfield.cpuavx512f)
8495         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512F;
8496       if (i.tm.cpu_flags.bitfield.cpuavx512cd)
8497         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512CD;
8498       if (i.tm.cpu_flags.bitfield.cpuavx512er)
8499         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512ER;
8500       if (i.tm.cpu_flags.bitfield.cpuavx512pf)
8501         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512PF;
8502       if (i.tm.cpu_flags.bitfield.cpuavx512vl)
8503         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512VL;
8504       if (i.tm.cpu_flags.bitfield.cpuavx512dq)
8505         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512DQ;
8506       if (i.tm.cpu_flags.bitfield.cpuavx512bw)
8507         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512BW;
8508       if (i.tm.cpu_flags.bitfield.cpuavx512_4fmaps)
8509         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4FMAPS;
8510       if (i.tm.cpu_flags.bitfield.cpuavx512_4vnniw)
8511         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4VNNIW;
8512       if (i.tm.cpu_flags.bitfield.cpuavx512_bitalg)
8513         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BITALG;
8514       if (i.tm.cpu_flags.bitfield.cpuavx512ifma)
8515         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_IFMA;
8516       if (i.tm.cpu_flags.bitfield.cpuavx512vbmi)
8517         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI;
8518       if (i.tm.cpu_flags.bitfield.cpuavx512_vbmi2)
8519         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI2;
8520       if (i.tm.cpu_flags.bitfield.cpuavx512_vnni)
8521         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VNNI;
8522       if (i.tm.cpu_flags.bitfield.cpuavx512_bf16)
8523         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BF16;
8524
8525       if (i.tm.cpu_flags.bitfield.cpu8087
8526           || i.tm.cpu_flags.bitfield.cpu287
8527           || i.tm.cpu_flags.bitfield.cpu387
8528           || i.tm.cpu_flags.bitfield.cpu687
8529           || i.tm.cpu_flags.bitfield.cpufisttp)
8530         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
8531       if (i.has_regmmx
8532           || i.tm.base_opcode == 0xf77 /* emms */
8533           || i.tm.base_opcode == 0xf0e /* femms */)
8534         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
8535       if (i.has_regxmm)
8536         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
8537       if (i.has_regymm)
8538         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
8539       if (i.has_regzmm)
8540         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
8541       if (i.tm.cpu_flags.bitfield.cpufxsr)
8542         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
8543       if (i.tm.cpu_flags.bitfield.cpuxsave)
8544         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
8545       if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
8546         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
8547       if (i.tm.cpu_flags.bitfield.cpuxsavec)
8548         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
8549     }
8550 #endif
8551
8552   /* Tie dwarf2 debug info to the address at the start of the insn.
8553      We can't do this after the insn has been output as the current
8554      frag may have been closed off.  eg. by frag_var.  */
8555   dwarf2_emit_insn (0);
8556
8557   insn_start_frag = frag_now;
8558   insn_start_off = frag_now_fix ();
8559
8560   if (add_branch_padding_frag_p (&branch))
8561     {
8562       char *p;
8563       /* Branch can be 8 bytes.  Leave some room for prefixes.  */
8564       unsigned int max_branch_padding_size = 14;
8565
8566       /* Align section to boundary.  */
8567       record_alignment (now_seg, align_branch_power);
8568
8569       /* Make room for padding.  */
8570       frag_grow (max_branch_padding_size);
8571
8572       /* Start of the padding.  */
8573       p = frag_more (0);
8574
8575       fragP = frag_now;
8576
8577       frag_var (rs_machine_dependent, max_branch_padding_size, 0,
8578                 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
8579                 NULL, 0, p);
8580
8581       fragP->tc_frag_data.branch_type = branch;
8582       fragP->tc_frag_data.max_bytes = max_branch_padding_size;
8583     }
8584
8585   /* Output jumps.  */
8586   if (i.tm.opcode_modifier.jump == JUMP)
8587     output_branch ();
8588   else if (i.tm.opcode_modifier.jump == JUMP_BYTE
8589            || i.tm.opcode_modifier.jump == JUMP_DWORD)
8590     output_jump ();
8591   else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
8592     output_interseg_jump ();
8593   else
8594     {
8595       /* Output normal instructions here.  */
8596       char *p;
8597       unsigned char *q;
8598       unsigned int j;
8599       unsigned int prefix;
8600
8601       if (avoid_fence
8602           && (i.tm.base_opcode == 0xfaee8
8603               || i.tm.base_opcode == 0xfaef0
8604               || i.tm.base_opcode == 0xfaef8))
8605         {
8606           /* Encode lfence, mfence, and sfence as
8607              f0 83 04 24 00   lock addl $0x0, (%{re}sp).  */
8608           offsetT val = 0x240483f0ULL;
8609           p = frag_more (5);
8610           md_number_to_chars (p, val, 5);
8611           return;
8612         }
8613
8614       /* Some processors fail on LOCK prefix. This options makes
8615          assembler ignore LOCK prefix and serves as a workaround.  */
8616       if (omit_lock_prefix)
8617         {
8618           if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
8619             return;
8620           i.prefix[LOCK_PREFIX] = 0;
8621         }
8622
8623       if (branch)
8624         /* Skip if this is a branch.  */
8625         ;
8626       else if (add_fused_jcc_padding_frag_p ())
8627         {
8628           /* Make room for padding.  */
8629           frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
8630           p = frag_more (0);
8631
8632           fragP = frag_now;
8633
8634           frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
8635                     ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
8636                     NULL, 0, p);
8637
8638           fragP->tc_frag_data.branch_type = align_branch_fused;
8639           fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
8640         }
8641       else if (add_branch_prefix_frag_p ())
8642         {
8643           unsigned int max_prefix_size = align_branch_prefix_size;
8644
8645           /* Make room for padding.  */
8646           frag_grow (max_prefix_size);
8647           p = frag_more (0);
8648
8649           fragP = frag_now;
8650
8651           frag_var (rs_machine_dependent, max_prefix_size, 0,
8652                     ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
8653                     NULL, 0, p);
8654
8655           fragP->tc_frag_data.max_bytes = max_prefix_size;
8656         }
8657
8658       /* Since the VEX/EVEX prefix contains the implicit prefix, we
8659          don't need the explicit prefix.  */
8660       if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
8661         {
8662           switch (i.tm.opcode_length)
8663             {
8664             case 3:
8665               if (i.tm.base_opcode & 0xff000000)
8666                 {
8667                   prefix = (i.tm.base_opcode >> 24) & 0xff;
8668                   if (!i.tm.cpu_flags.bitfield.cpupadlock
8669                       || prefix != REPE_PREFIX_OPCODE
8670                       || (i.prefix[REP_PREFIX] != REPE_PREFIX_OPCODE))
8671                     add_prefix (prefix);
8672                 }
8673               break;
8674             case 2:
8675               if ((i.tm.base_opcode & 0xff0000) != 0)
8676                 {
8677                   prefix = (i.tm.base_opcode >> 16) & 0xff;
8678                   add_prefix (prefix);
8679                 }
8680               break;
8681             case 1:
8682               break;
8683             case 0:
8684               /* Check for pseudo prefixes.  */
8685               as_bad_where (insn_start_frag->fr_file,
8686                             insn_start_frag->fr_line,
8687                              _("pseudo prefix without instruction"));
8688               return;
8689             default:
8690               abort ();
8691             }
8692
8693 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
8694           /* For x32, add a dummy REX_OPCODE prefix for mov/add with
8695              R_X86_64_GOTTPOFF relocation so that linker can safely
8696              perform IE->LE optimization.  A dummy REX_OPCODE prefix
8697              is also needed for lea with R_X86_64_GOTPC32_TLSDESC
8698              relocation for GDesc -> IE/LE optimization.  */
8699           if (x86_elf_abi == X86_64_X32_ABI
8700               && i.operands == 2
8701               && (i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
8702                   || i.reloc[0] == BFD_RELOC_X86_64_GOTPC32_TLSDESC)
8703               && i.prefix[REX_PREFIX] == 0)
8704             add_prefix (REX_OPCODE);
8705 #endif
8706
8707           /* The prefix bytes.  */
8708           for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
8709             if (*q)
8710               FRAG_APPEND_1_CHAR (*q);
8711         }
8712       else
8713         {
8714           for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
8715             if (*q)
8716               switch (j)
8717                 {
8718                 case REX_PREFIX:
8719                   /* REX byte is encoded in VEX prefix.  */
8720                   break;
8721                 case SEG_PREFIX:
8722                 case ADDR_PREFIX:
8723                   FRAG_APPEND_1_CHAR (*q);
8724                   break;
8725                 default:
8726                   /* There should be no other prefixes for instructions
8727                      with VEX prefix.  */
8728                   abort ();
8729                 }
8730
8731           /* For EVEX instructions i.vrex should become 0 after
8732              build_evex_prefix.  For VEX instructions upper 16 registers
8733              aren't available, so VREX should be 0.  */
8734           if (i.vrex)
8735             abort ();
8736           /* Now the VEX prefix.  */
8737           p = frag_more (i.vex.length);
8738           for (j = 0; j < i.vex.length; j++)
8739             p[j] = i.vex.bytes[j];
8740         }
8741
8742       /* Now the opcode; be careful about word order here!  */
8743       if (i.tm.opcode_length == 1)
8744         {
8745           FRAG_APPEND_1_CHAR (i.tm.base_opcode);
8746         }
8747       else
8748         {
8749           switch (i.tm.opcode_length)
8750             {
8751             case 4:
8752               p = frag_more (4);
8753               *p++ = (i.tm.base_opcode >> 24) & 0xff;
8754               *p++ = (i.tm.base_opcode >> 16) & 0xff;
8755               break;
8756             case 3:
8757               p = frag_more (3);
8758               *p++ = (i.tm.base_opcode >> 16) & 0xff;
8759               break;
8760             case 2:
8761               p = frag_more (2);
8762               break;
8763             default:
8764               abort ();
8765               break;
8766             }
8767
8768           /* Put out high byte first: can't use md_number_to_chars!  */
8769           *p++ = (i.tm.base_opcode >> 8) & 0xff;
8770           *p = i.tm.base_opcode & 0xff;
8771         }
8772
8773       /* Now the modrm byte and sib byte (if present).  */
8774       if (i.tm.opcode_modifier.modrm)
8775         {
8776           FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
8777                                | i.rm.reg << 3
8778                                | i.rm.mode << 6));
8779           /* If i.rm.regmem == ESP (4)
8780              && i.rm.mode != (Register mode)
8781              && not 16 bit
8782              ==> need second modrm byte.  */
8783           if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
8784               && i.rm.mode != 3
8785               && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
8786             FRAG_APPEND_1_CHAR ((i.sib.base << 0
8787                                  | i.sib.index << 3
8788                                  | i.sib.scale << 6));
8789         }
8790
8791       if (i.disp_operands)
8792         output_disp (insn_start_frag, insn_start_off);
8793
8794       if (i.imm_operands)
8795         output_imm (insn_start_frag, insn_start_off);
8796
8797       /*
8798        * frag_now_fix () returning plain abs_section_offset when we're in the
8799        * absolute section, and abs_section_offset not getting updated as data
8800        * gets added to the frag breaks the logic below.
8801        */
8802       if (now_seg != absolute_section)
8803         {
8804           j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
8805           if (j > 15)
8806             as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
8807                      j);
8808           else if (fragP)
8809             {
8810               /* NB: Don't add prefix with GOTPC relocation since
8811                  output_disp() above depends on the fixed encoding
8812                  length.  Can't add prefix with TLS relocation since
8813                  it breaks TLS linker optimization.  */
8814               unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
8815               /* Prefix count on the current instruction.  */
8816               unsigned int count = i.vex.length;
8817               unsigned int k;
8818               for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
8819                 /* REX byte is encoded in VEX/EVEX prefix.  */
8820                 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
8821                   count++;
8822
8823               /* Count prefixes for extended opcode maps.  */
8824               if (!i.vex.length)
8825                 switch (i.tm.opcode_length)
8826                   {
8827                   case 3:
8828                     if (((i.tm.base_opcode >> 16) & 0xff) == 0xf)
8829                       {
8830                         count++;
8831                         switch ((i.tm.base_opcode >> 8) & 0xff)
8832                           {
8833                           case 0x38:
8834                           case 0x3a:
8835                             count++;
8836                             break;
8837                           default:
8838                             break;
8839                           }
8840                       }
8841                     break;
8842                   case 2:
8843                     if (((i.tm.base_opcode >> 8) & 0xff) == 0xf)
8844                       count++;
8845                     break;
8846                   case 1:
8847                     break;
8848                   default:
8849                     abort ();
8850                   }
8851
8852               if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
8853                   == BRANCH_PREFIX)
8854                 {
8855                   /* Set the maximum prefix size in BRANCH_PREFIX
8856                      frag.  */
8857                   if (fragP->tc_frag_data.max_bytes > max)
8858                     fragP->tc_frag_data.max_bytes = max;
8859                   if (fragP->tc_frag_data.max_bytes > count)
8860                     fragP->tc_frag_data.max_bytes -= count;
8861                   else
8862                     fragP->tc_frag_data.max_bytes = 0;
8863                 }
8864               else
8865                 {
8866                   /* Remember the maximum prefix size in FUSED_JCC_PADDING
8867                      frag.  */
8868                   unsigned int max_prefix_size;
8869                   if (align_branch_prefix_size > max)
8870                     max_prefix_size = max;
8871                   else
8872                     max_prefix_size = align_branch_prefix_size;
8873                   if (max_prefix_size > count)
8874                     fragP->tc_frag_data.max_prefix_length
8875                       = max_prefix_size - count;
8876                 }
8877
8878               /* Use existing segment prefix if possible.  Use CS
8879                  segment prefix in 64-bit mode.  In 32-bit mode, use SS
8880                  segment prefix with ESP/EBP base register and use DS
8881                  segment prefix without ESP/EBP base register.  */
8882               if (i.prefix[SEG_PREFIX])
8883                 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
8884               else if (flag_code == CODE_64BIT)
8885                 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
8886               else if (i.base_reg
8887                        && (i.base_reg->reg_num == 4
8888                            || i.base_reg->reg_num == 5))
8889                 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
8890               else
8891                 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
8892             }
8893         }
8894     }
8895
8896   /* NB: Don't work with COND_JUMP86 without i386.  */
8897   if (align_branch_power
8898       && now_seg != absolute_section
8899       && cpu_arch_flags.bitfield.cpui386)
8900     {
8901       /* Terminate each frag so that we can add prefix and check for
8902          fused jcc.  */
8903       frag_wane (frag_now);
8904       frag_new (0);
8905     }
8906
8907 #ifdef DEBUG386
8908   if (flag_debug)
8909     {
8910       pi ("" /*line*/, &i);
8911     }
8912 #endif /* DEBUG386  */
8913 }
8914
8915 /* Return the size of the displacement operand N.  */
8916
8917 static int
8918 disp_size (unsigned int n)
8919 {
8920   int size = 4;
8921
8922   if (i.types[n].bitfield.disp64)
8923     size = 8;
8924   else if (i.types[n].bitfield.disp8)
8925     size = 1;
8926   else if (i.types[n].bitfield.disp16)
8927     size = 2;
8928   return size;
8929 }
8930
8931 /* Return the size of the immediate operand N.  */
8932
8933 static int
8934 imm_size (unsigned int n)
8935 {
8936   int size = 4;
8937   if (i.types[n].bitfield.imm64)
8938     size = 8;
8939   else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
8940     size = 1;
8941   else if (i.types[n].bitfield.imm16)
8942     size = 2;
8943   return size;
8944 }
8945
8946 static void
8947 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
8948 {
8949   char *p;
8950   unsigned int n;
8951
8952   for (n = 0; n < i.operands; n++)
8953     {
8954       if (operand_type_check (i.types[n], disp))
8955         {
8956           if (i.op[n].disps->X_op == O_constant)
8957             {
8958               int size = disp_size (n);
8959               offsetT val = i.op[n].disps->X_add_number;
8960
8961               val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
8962                                      size);
8963               p = frag_more (size);
8964               md_number_to_chars (p, val, size);
8965             }
8966           else
8967             {
8968               enum bfd_reloc_code_real reloc_type;
8969               int size = disp_size (n);
8970               int sign = i.types[n].bitfield.disp32s;
8971               int pcrel = (i.flags[n] & Operand_PCrel) != 0;
8972               fixS *fixP;
8973
8974               /* We can't have 8 bit displacement here.  */
8975               gas_assert (!i.types[n].bitfield.disp8);
8976
8977               /* The PC relative address is computed relative
8978                  to the instruction boundary, so in case immediate
8979                  fields follows, we need to adjust the value.  */
8980               if (pcrel && i.imm_operands)
8981                 {
8982                   unsigned int n1;
8983                   int sz = 0;
8984
8985                   for (n1 = 0; n1 < i.operands; n1++)
8986                     if (operand_type_check (i.types[n1], imm))
8987                       {
8988                         /* Only one immediate is allowed for PC
8989                            relative address.  */
8990                         gas_assert (sz == 0);
8991                         sz = imm_size (n1);
8992                         i.op[n].disps->X_add_number -= sz;
8993                       }
8994                   /* We should find the immediate.  */
8995                   gas_assert (sz != 0);
8996                 }
8997
8998               p = frag_more (size);
8999               reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
9000               if (GOT_symbol
9001                   && GOT_symbol == i.op[n].disps->X_add_symbol
9002                   && (((reloc_type == BFD_RELOC_32
9003                         || reloc_type == BFD_RELOC_X86_64_32S
9004                         || (reloc_type == BFD_RELOC_64
9005                             && object_64bit))
9006                        && (i.op[n].disps->X_op == O_symbol
9007                            || (i.op[n].disps->X_op == O_add
9008                                && ((symbol_get_value_expression
9009                                     (i.op[n].disps->X_op_symbol)->X_op)
9010                                    == O_subtract))))
9011                       || reloc_type == BFD_RELOC_32_PCREL))
9012                 {
9013                   if (!object_64bit)
9014                     {
9015                       reloc_type = BFD_RELOC_386_GOTPC;
9016                       i.has_gotpc_tls_reloc = TRUE;
9017                       i.op[n].imms->X_add_number +=
9018                         encoding_length (insn_start_frag, insn_start_off, p);
9019                     }
9020                   else if (reloc_type == BFD_RELOC_64)
9021                     reloc_type = BFD_RELOC_X86_64_GOTPC64;
9022                   else
9023                     /* Don't do the adjustment for x86-64, as there
9024                        the pcrel addressing is relative to the _next_
9025                        insn, and that is taken care of in other code.  */
9026                     reloc_type = BFD_RELOC_X86_64_GOTPC32;
9027                 }
9028               else if (align_branch_power)
9029                 {
9030                   switch (reloc_type)
9031                     {
9032                     case BFD_RELOC_386_TLS_GD:
9033                     case BFD_RELOC_386_TLS_LDM:
9034                     case BFD_RELOC_386_TLS_IE:
9035                     case BFD_RELOC_386_TLS_IE_32:
9036                     case BFD_RELOC_386_TLS_GOTIE:
9037                     case BFD_RELOC_386_TLS_GOTDESC:
9038                     case BFD_RELOC_386_TLS_DESC_CALL:
9039                     case BFD_RELOC_X86_64_TLSGD:
9040                     case BFD_RELOC_X86_64_TLSLD:
9041                     case BFD_RELOC_X86_64_GOTTPOFF:
9042                     case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9043                     case BFD_RELOC_X86_64_TLSDESC_CALL:
9044                       i.has_gotpc_tls_reloc = TRUE;
9045                     default:
9046                       break;
9047                     }
9048                 }
9049               fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
9050                                   size, i.op[n].disps, pcrel,
9051                                   reloc_type);
9052               /* Check for "call/jmp *mem", "mov mem, %reg",
9053                  "test %reg, mem" and "binop mem, %reg" where binop
9054                  is one of adc, add, and, cmp, or, sbb, sub, xor
9055                  instructions without data prefix.  Always generate
9056                  R_386_GOT32X for "sym*GOT" operand in 32-bit mode.  */
9057               if (i.prefix[DATA_PREFIX] == 0
9058                   && (generate_relax_relocations
9059                       || (!object_64bit
9060                           && i.rm.mode == 0
9061                           && i.rm.regmem == 5))
9062                   && (i.rm.mode == 2
9063                       || (i.rm.mode == 0 && i.rm.regmem == 5))
9064                   && !is_any_vex_encoding(&i.tm)
9065                   && ((i.operands == 1
9066                        && i.tm.base_opcode == 0xff
9067                        && (i.rm.reg == 2 || i.rm.reg == 4))
9068                       || (i.operands == 2
9069                           && (i.tm.base_opcode == 0x8b
9070                               || i.tm.base_opcode == 0x85
9071                               || (i.tm.base_opcode & ~0x38) == 0x03))))
9072                 {
9073                   if (object_64bit)
9074                     {
9075                       fixP->fx_tcbit = i.rex != 0;
9076                       if (i.base_reg
9077                           && (i.base_reg->reg_num == RegIP))
9078                       fixP->fx_tcbit2 = 1;
9079                     }
9080                   else
9081                     fixP->fx_tcbit2 = 1;
9082                 }
9083             }
9084         }
9085     }
9086 }
9087
9088 static void
9089 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
9090 {
9091   char *p;
9092   unsigned int n;
9093
9094   for (n = 0; n < i.operands; n++)
9095     {
9096       /* Skip SAE/RC Imm operand in EVEX.  They are already handled.  */
9097       if (i.rounding && (int) n == i.rounding->operand)
9098         continue;
9099
9100       if (operand_type_check (i.types[n], imm))
9101         {
9102           if (i.op[n].imms->X_op == O_constant)
9103             {
9104               int size = imm_size (n);
9105               offsetT val;
9106
9107               val = offset_in_range (i.op[n].imms->X_add_number,
9108                                      size);
9109               p = frag_more (size);
9110               md_number_to_chars (p, val, size);
9111             }
9112           else
9113             {
9114               /* Not absolute_section.
9115                  Need a 32-bit fixup (don't support 8bit
9116                  non-absolute imms).  Try to support other
9117                  sizes ...  */
9118               enum bfd_reloc_code_real reloc_type;
9119               int size = imm_size (n);
9120               int sign;
9121
9122               if (i.types[n].bitfield.imm32s
9123                   && (i.suffix == QWORD_MNEM_SUFFIX
9124                       || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
9125                 sign = 1;
9126               else
9127                 sign = 0;
9128
9129               p = frag_more (size);
9130               reloc_type = reloc (size, 0, sign, i.reloc[n]);
9131
9132               /*   This is tough to explain.  We end up with this one if we
9133                * have operands that look like
9134                * "_GLOBAL_OFFSET_TABLE_+[.-.L284]".  The goal here is to
9135                * obtain the absolute address of the GOT, and it is strongly
9136                * preferable from a performance point of view to avoid using
9137                * a runtime relocation for this.  The actual sequence of
9138                * instructions often look something like:
9139                *
9140                *        call    .L66
9141                * .L66:
9142                *        popl    %ebx
9143                *        addl    $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
9144                *
9145                *   The call and pop essentially return the absolute address
9146                * of the label .L66 and store it in %ebx.  The linker itself
9147                * will ultimately change the first operand of the addl so
9148                * that %ebx points to the GOT, but to keep things simple, the
9149                * .o file must have this operand set so that it generates not
9150                * the absolute address of .L66, but the absolute address of
9151                * itself.  This allows the linker itself simply treat a GOTPC
9152                * relocation as asking for a pcrel offset to the GOT to be
9153                * added in, and the addend of the relocation is stored in the
9154                * operand field for the instruction itself.
9155                *
9156                *   Our job here is to fix the operand so that it would add
9157                * the correct offset so that %ebx would point to itself.  The
9158                * thing that is tricky is that .-.L66 will point to the
9159                * beginning of the instruction, so we need to further modify
9160                * the operand so that it will point to itself.  There are
9161                * other cases where you have something like:
9162                *
9163                *        .long   $_GLOBAL_OFFSET_TABLE_+[.-.L66]
9164                *
9165                * and here no correction would be required.  Internally in
9166                * the assembler we treat operands of this form as not being
9167                * pcrel since the '.' is explicitly mentioned, and I wonder
9168                * whether it would simplify matters to do it this way.  Who
9169                * knows.  In earlier versions of the PIC patches, the
9170                * pcrel_adjust field was used to store the correction, but
9171                * since the expression is not pcrel, I felt it would be
9172                * confusing to do it this way.  */
9173
9174               if ((reloc_type == BFD_RELOC_32
9175                    || reloc_type == BFD_RELOC_X86_64_32S
9176                    || reloc_type == BFD_RELOC_64)
9177                   && GOT_symbol
9178                   && GOT_symbol == i.op[n].imms->X_add_symbol
9179                   && (i.op[n].imms->X_op == O_symbol
9180                       || (i.op[n].imms->X_op == O_add
9181                           && ((symbol_get_value_expression
9182                                (i.op[n].imms->X_op_symbol)->X_op)
9183                               == O_subtract))))
9184                 {
9185                   if (!object_64bit)
9186                     reloc_type = BFD_RELOC_386_GOTPC;
9187                   else if (size == 4)
9188                     reloc_type = BFD_RELOC_X86_64_GOTPC32;
9189                   else if (size == 8)
9190                     reloc_type = BFD_RELOC_X86_64_GOTPC64;
9191                   i.has_gotpc_tls_reloc = TRUE;
9192                   i.op[n].imms->X_add_number +=
9193                     encoding_length (insn_start_frag, insn_start_off, p);
9194                 }
9195               fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9196                            i.op[n].imms, 0, reloc_type);
9197             }
9198         }
9199     }
9200 }
9201 \f
9202 /* x86_cons_fix_new is called via the expression parsing code when a
9203    reloc is needed.  We use this hook to get the correct .got reloc.  */
9204 static int cons_sign = -1;
9205
9206 void
9207 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
9208                   expressionS *exp, bfd_reloc_code_real_type r)
9209 {
9210   r = reloc (len, 0, cons_sign, r);
9211
9212 #ifdef TE_PE
9213   if (exp->X_op == O_secrel)
9214     {
9215       exp->X_op = O_symbol;
9216       r = BFD_RELOC_32_SECREL;
9217     }
9218 #endif
9219
9220   fix_new_exp (frag, off, len, exp, 0, r);
9221 }
9222
9223 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
9224    purpose of the `.dc.a' internal pseudo-op.  */
9225
9226 int
9227 x86_address_bytes (void)
9228 {
9229   if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
9230     return 4;
9231   return stdoutput->arch_info->bits_per_address / 8;
9232 }
9233
9234 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
9235     || defined (LEX_AT)
9236 # define lex_got(reloc, adjust, types) NULL
9237 #else
9238 /* Parse operands of the form
9239    <symbol>@GOTOFF+<nnn>
9240    and similar .plt or .got references.
9241
9242    If we find one, set up the correct relocation in RELOC and copy the
9243    input string, minus the `@GOTOFF' into a malloc'd buffer for
9244    parsing by the calling routine.  Return this buffer, and if ADJUST
9245    is non-null set it to the length of the string we removed from the
9246    input line.  Otherwise return NULL.  */
9247 static char *
9248 lex_got (enum bfd_reloc_code_real *rel,
9249          int *adjust,
9250          i386_operand_type *types)
9251 {
9252   /* Some of the relocations depend on the size of what field is to
9253      be relocated.  But in our callers i386_immediate and i386_displacement
9254      we don't yet know the operand size (this will be set by insn
9255      matching).  Hence we record the word32 relocation here,
9256      and adjust the reloc according to the real size in reloc().  */
9257   static const struct {
9258     const char *str;
9259     int len;
9260     const enum bfd_reloc_code_real rel[2];
9261     const i386_operand_type types64;
9262   } gotrel[] = {
9263 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9264     { STRING_COMMA_LEN ("SIZE"),      { BFD_RELOC_SIZE32,
9265                                         BFD_RELOC_SIZE32 },
9266       OPERAND_TYPE_IMM32_64 },
9267 #endif
9268     { STRING_COMMA_LEN ("PLTOFF"),   { _dummy_first_bfd_reloc_code_real,
9269                                        BFD_RELOC_X86_64_PLTOFF64 },
9270       OPERAND_TYPE_IMM64 },
9271     { STRING_COMMA_LEN ("PLT"),      { BFD_RELOC_386_PLT32,
9272                                        BFD_RELOC_X86_64_PLT32    },
9273       OPERAND_TYPE_IMM32_32S_DISP32 },
9274     { STRING_COMMA_LEN ("GOTPLT"),   { _dummy_first_bfd_reloc_code_real,
9275                                        BFD_RELOC_X86_64_GOTPLT64 },
9276       OPERAND_TYPE_IMM64_DISP64 },
9277     { STRING_COMMA_LEN ("GOTOFF"),   { BFD_RELOC_386_GOTOFF,
9278                                        BFD_RELOC_X86_64_GOTOFF64 },
9279       OPERAND_TYPE_IMM64_DISP64 },
9280     { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
9281                                        BFD_RELOC_X86_64_GOTPCREL },
9282       OPERAND_TYPE_IMM32_32S_DISP32 },
9283     { STRING_COMMA_LEN ("TLSGD"),    { BFD_RELOC_386_TLS_GD,
9284                                        BFD_RELOC_X86_64_TLSGD    },
9285       OPERAND_TYPE_IMM32_32S_DISP32 },
9286     { STRING_COMMA_LEN ("TLSLDM"),   { BFD_RELOC_386_TLS_LDM,
9287                                        _dummy_first_bfd_reloc_code_real },
9288       OPERAND_TYPE_NONE },
9289     { STRING_COMMA_LEN ("TLSLD"),    { _dummy_first_bfd_reloc_code_real,
9290                                        BFD_RELOC_X86_64_TLSLD    },
9291       OPERAND_TYPE_IMM32_32S_DISP32 },
9292     { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
9293                                        BFD_RELOC_X86_64_GOTTPOFF },
9294       OPERAND_TYPE_IMM32_32S_DISP32 },
9295     { STRING_COMMA_LEN ("TPOFF"),    { BFD_RELOC_386_TLS_LE_32,
9296                                        BFD_RELOC_X86_64_TPOFF32  },
9297       OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9298     { STRING_COMMA_LEN ("NTPOFF"),   { BFD_RELOC_386_TLS_LE,
9299                                        _dummy_first_bfd_reloc_code_real },
9300       OPERAND_TYPE_NONE },
9301     { STRING_COMMA_LEN ("DTPOFF"),   { BFD_RELOC_386_TLS_LDO_32,
9302                                        BFD_RELOC_X86_64_DTPOFF32 },
9303       OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9304     { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
9305                                        _dummy_first_bfd_reloc_code_real },
9306       OPERAND_TYPE_NONE },
9307     { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
9308                                        _dummy_first_bfd_reloc_code_real },
9309       OPERAND_TYPE_NONE },
9310     { STRING_COMMA_LEN ("GOT"),      { BFD_RELOC_386_GOT32,
9311                                        BFD_RELOC_X86_64_GOT32    },
9312       OPERAND_TYPE_IMM32_32S_64_DISP32 },
9313     { STRING_COMMA_LEN ("TLSDESC"),  { BFD_RELOC_386_TLS_GOTDESC,
9314                                        BFD_RELOC_X86_64_GOTPC32_TLSDESC },
9315       OPERAND_TYPE_IMM32_32S_DISP32 },
9316     { STRING_COMMA_LEN ("TLSCALL"),  { BFD_RELOC_386_TLS_DESC_CALL,
9317                                        BFD_RELOC_X86_64_TLSDESC_CALL },
9318       OPERAND_TYPE_IMM32_32S_DISP32 },
9319   };
9320   char *cp;
9321   unsigned int j;
9322
9323 #if defined (OBJ_MAYBE_ELF)
9324   if (!IS_ELF)
9325     return NULL;
9326 #endif
9327
9328   for (cp = input_line_pointer; *cp != '@'; cp++)
9329     if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9330       return NULL;
9331
9332   for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9333     {
9334       int len = gotrel[j].len;
9335       if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9336         {
9337           if (gotrel[j].rel[object_64bit] != 0)
9338             {
9339               int first, second;
9340               char *tmpbuf, *past_reloc;
9341
9342               *rel = gotrel[j].rel[object_64bit];
9343
9344               if (types)
9345                 {
9346                   if (flag_code != CODE_64BIT)
9347                     {
9348                       types->bitfield.imm32 = 1;
9349                       types->bitfield.disp32 = 1;
9350                     }
9351                   else
9352                     *types = gotrel[j].types64;
9353                 }
9354
9355               if (j != 0 && GOT_symbol == NULL)
9356                 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
9357
9358               /* The length of the first part of our input line.  */
9359               first = cp - input_line_pointer;
9360
9361               /* The second part goes from after the reloc token until
9362                  (and including) an end_of_line char or comma.  */
9363               past_reloc = cp + 1 + len;
9364               cp = past_reloc;
9365               while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9366                 ++cp;
9367               second = cp + 1 - past_reloc;
9368
9369               /* Allocate and copy string.  The trailing NUL shouldn't
9370                  be necessary, but be safe.  */
9371               tmpbuf = XNEWVEC (char, first + second + 2);
9372               memcpy (tmpbuf, input_line_pointer, first);
9373               if (second != 0 && *past_reloc != ' ')
9374                 /* Replace the relocation token with ' ', so that
9375                    errors like foo@GOTOFF1 will be detected.  */
9376                 tmpbuf[first++] = ' ';
9377               else
9378                 /* Increment length by 1 if the relocation token is
9379                    removed.  */
9380                 len++;
9381               if (adjust)
9382                 *adjust = len;
9383               memcpy (tmpbuf + first, past_reloc, second);
9384               tmpbuf[first + second] = '\0';
9385               return tmpbuf;
9386             }
9387
9388           as_bad (_("@%s reloc is not supported with %d-bit output format"),
9389                   gotrel[j].str, 1 << (5 + object_64bit));
9390           return NULL;
9391         }
9392     }
9393
9394   /* Might be a symbol version string.  Don't as_bad here.  */
9395   return NULL;
9396 }
9397 #endif
9398
9399 #ifdef TE_PE
9400 #ifdef lex_got
9401 #undef lex_got
9402 #endif
9403 /* Parse operands of the form
9404    <symbol>@SECREL32+<nnn>
9405
9406    If we find one, set up the correct relocation in RELOC and copy the
9407    input string, minus the `@SECREL32' into a malloc'd buffer for
9408    parsing by the calling routine.  Return this buffer, and if ADJUST
9409    is non-null set it to the length of the string we removed from the
9410    input line.  Otherwise return NULL.
9411
9412    This function is copied from the ELF version above adjusted for PE targets.  */
9413
9414 static char *
9415 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
9416          int *adjust ATTRIBUTE_UNUSED,
9417          i386_operand_type *types)
9418 {
9419   static const struct
9420   {
9421     const char *str;
9422     int len;
9423     const enum bfd_reloc_code_real rel[2];
9424     const i386_operand_type types64;
9425   }
9426   gotrel[] =
9427   {
9428     { STRING_COMMA_LEN ("SECREL32"),    { BFD_RELOC_32_SECREL,
9429                                           BFD_RELOC_32_SECREL },
9430       OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9431   };
9432
9433   char *cp;
9434   unsigned j;
9435
9436   for (cp = input_line_pointer; *cp != '@'; cp++)
9437     if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9438       return NULL;
9439
9440   for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9441     {
9442       int len = gotrel[j].len;
9443
9444       if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9445         {
9446           if (gotrel[j].rel[object_64bit] != 0)
9447             {
9448               int first, second;
9449               char *tmpbuf, *past_reloc;
9450
9451               *rel = gotrel[j].rel[object_64bit];
9452               if (adjust)
9453                 *adjust = len;
9454
9455               if (types)
9456                 {
9457                   if (flag_code != CODE_64BIT)
9458                     {
9459                       types->bitfield.imm32 = 1;
9460                       types->bitfield.disp32 = 1;
9461                     }
9462                   else
9463                     *types = gotrel[j].types64;
9464                 }
9465
9466               /* The length of the first part of our input line.  */
9467               first = cp - input_line_pointer;
9468
9469               /* The second part goes from after the reloc token until
9470                  (and including) an end_of_line char or comma.  */
9471               past_reloc = cp + 1 + len;
9472               cp = past_reloc;
9473               while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9474                 ++cp;
9475               second = cp + 1 - past_reloc;
9476
9477               /* Allocate and copy string.  The trailing NUL shouldn't
9478                  be necessary, but be safe.  */
9479               tmpbuf = XNEWVEC (char, first + second + 2);
9480               memcpy (tmpbuf, input_line_pointer, first);
9481               if (second != 0 && *past_reloc != ' ')
9482                 /* Replace the relocation token with ' ', so that
9483                    errors like foo@SECLREL321 will be detected.  */
9484                 tmpbuf[first++] = ' ';
9485               memcpy (tmpbuf + first, past_reloc, second);
9486               tmpbuf[first + second] = '\0';
9487               return tmpbuf;
9488             }
9489
9490           as_bad (_("@%s reloc is not supported with %d-bit output format"),
9491                   gotrel[j].str, 1 << (5 + object_64bit));
9492           return NULL;
9493         }
9494     }
9495
9496   /* Might be a symbol version string.  Don't as_bad here.  */
9497   return NULL;
9498 }
9499
9500 #endif /* TE_PE */
9501
9502 bfd_reloc_code_real_type
9503 x86_cons (expressionS *exp, int size)
9504 {
9505   bfd_reloc_code_real_type got_reloc = NO_RELOC;
9506
9507   intel_syntax = -intel_syntax;
9508
9509   exp->X_md = 0;
9510   if (size == 4 || (object_64bit && size == 8))
9511     {
9512       /* Handle @GOTOFF and the like in an expression.  */
9513       char *save;
9514       char *gotfree_input_line;
9515       int adjust = 0;
9516
9517       save = input_line_pointer;
9518       gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
9519       if (gotfree_input_line)
9520         input_line_pointer = gotfree_input_line;
9521
9522       expression (exp);
9523
9524       if (gotfree_input_line)
9525         {
9526           /* expression () has merrily parsed up to the end of line,
9527              or a comma - in the wrong buffer.  Transfer how far
9528              input_line_pointer has moved to the right buffer.  */
9529           input_line_pointer = (save
9530                                 + (input_line_pointer - gotfree_input_line)
9531                                 + adjust);
9532           free (gotfree_input_line);
9533           if (exp->X_op == O_constant
9534               || exp->X_op == O_absent
9535               || exp->X_op == O_illegal
9536               || exp->X_op == O_register
9537               || exp->X_op == O_big)
9538             {
9539               char c = *input_line_pointer;
9540               *input_line_pointer = 0;
9541               as_bad (_("missing or invalid expression `%s'"), save);
9542               *input_line_pointer = c;
9543             }
9544           else if ((got_reloc == BFD_RELOC_386_PLT32
9545                     || got_reloc == BFD_RELOC_X86_64_PLT32)
9546                    && exp->X_op != O_symbol)
9547             {
9548               char c = *input_line_pointer;
9549               *input_line_pointer = 0;
9550               as_bad (_("invalid PLT expression `%s'"), save);
9551               *input_line_pointer = c;
9552             }
9553         }
9554     }
9555   else
9556     expression (exp);
9557
9558   intel_syntax = -intel_syntax;
9559
9560   if (intel_syntax)
9561     i386_intel_simplify (exp);
9562
9563   return got_reloc;
9564 }
9565
9566 static void
9567 signed_cons (int size)
9568 {
9569   if (flag_code == CODE_64BIT)
9570     cons_sign = 1;
9571   cons (size);
9572   cons_sign = -1;
9573 }
9574
9575 #ifdef TE_PE
9576 static void
9577 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
9578 {
9579   expressionS exp;
9580
9581   do
9582     {
9583       expression (&exp);
9584       if (exp.X_op == O_symbol)
9585         exp.X_op = O_secrel;
9586
9587       emit_expr (&exp, 4);
9588     }
9589   while (*input_line_pointer++ == ',');
9590
9591   input_line_pointer--;
9592   demand_empty_rest_of_line ();
9593 }
9594 #endif
9595
9596 /* Handle Vector operations.  */
9597
9598 static char *
9599 check_VecOperations (char *op_string, char *op_end)
9600 {
9601   const reg_entry *mask;
9602   const char *saved;
9603   char *end_op;
9604
9605   while (*op_string
9606          && (op_end == NULL || op_string < op_end))
9607     {
9608       saved = op_string;
9609       if (*op_string == '{')
9610         {
9611           op_string++;
9612
9613           /* Check broadcasts.  */
9614           if (strncmp (op_string, "1to", 3) == 0)
9615             {
9616               int bcst_type;
9617
9618               if (i.broadcast)
9619                 goto duplicated_vec_op;
9620
9621               op_string += 3;
9622               if (*op_string == '8')
9623                 bcst_type = 8;
9624               else if (*op_string == '4')
9625                 bcst_type = 4;
9626               else if (*op_string == '2')
9627                 bcst_type = 2;
9628               else if (*op_string == '1'
9629                        && *(op_string+1) == '6')
9630                 {
9631                   bcst_type = 16;
9632                   op_string++;
9633                 }
9634               else
9635                 {
9636                   as_bad (_("Unsupported broadcast: `%s'"), saved);
9637                   return NULL;
9638                 }
9639               op_string++;
9640
9641               broadcast_op.type = bcst_type;
9642               broadcast_op.operand = this_operand;
9643               broadcast_op.bytes = 0;
9644               i.broadcast = &broadcast_op;
9645             }
9646           /* Check masking operation.  */
9647           else if ((mask = parse_register (op_string, &end_op)) != NULL)
9648             {
9649               /* k0 can't be used for write mask.  */
9650               if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
9651                 {
9652                   as_bad (_("`%s%s' can't be used for write mask"),
9653                           register_prefix, mask->reg_name);
9654                   return NULL;
9655                 }
9656
9657               if (!i.mask)
9658                 {
9659                   mask_op.mask = mask;
9660                   mask_op.zeroing = 0;
9661                   mask_op.operand = this_operand;
9662                   i.mask = &mask_op;
9663                 }
9664               else
9665                 {
9666                   if (i.mask->mask)
9667                     goto duplicated_vec_op;
9668
9669                   i.mask->mask = mask;
9670
9671                   /* Only "{z}" is allowed here.  No need to check
9672                      zeroing mask explicitly.  */
9673                   if (i.mask->operand != this_operand)
9674                     {
9675                       as_bad (_("invalid write mask `%s'"), saved);
9676                       return NULL;
9677                     }
9678                 }
9679
9680               op_string = end_op;
9681             }
9682           /* Check zeroing-flag for masking operation.  */
9683           else if (*op_string == 'z')
9684             {
9685               if (!i.mask)
9686                 {
9687                   mask_op.mask = NULL;
9688                   mask_op.zeroing = 1;
9689                   mask_op.operand = this_operand;
9690                   i.mask = &mask_op;
9691                 }
9692               else
9693                 {
9694                   if (i.mask->zeroing)
9695                     {
9696                     duplicated_vec_op:
9697                       as_bad (_("duplicated `%s'"), saved);
9698                       return NULL;
9699                     }
9700
9701                   i.mask->zeroing = 1;
9702
9703                   /* Only "{%k}" is allowed here.  No need to check mask
9704                      register explicitly.  */
9705                   if (i.mask->operand != this_operand)
9706                     {
9707                       as_bad (_("invalid zeroing-masking `%s'"),
9708                               saved);
9709                       return NULL;
9710                     }
9711                 }
9712
9713               op_string++;
9714             }
9715           else
9716             goto unknown_vec_op;
9717
9718           if (*op_string != '}')
9719             {
9720               as_bad (_("missing `}' in `%s'"), saved);
9721               return NULL;
9722             }
9723           op_string++;
9724
9725           /* Strip whitespace since the addition of pseudo prefixes
9726              changed how the scrubber treats '{'.  */
9727           if (is_space_char (*op_string))
9728             ++op_string;
9729
9730           continue;
9731         }
9732     unknown_vec_op:
9733       /* We don't know this one.  */
9734       as_bad (_("unknown vector operation: `%s'"), saved);
9735       return NULL;
9736     }
9737
9738   if (i.mask && i.mask->zeroing && !i.mask->mask)
9739     {
9740       as_bad (_("zeroing-masking only allowed with write mask"));
9741       return NULL;
9742     }
9743
9744   return op_string;
9745 }
9746
9747 static int
9748 i386_immediate (char *imm_start)
9749 {
9750   char *save_input_line_pointer;
9751   char *gotfree_input_line;
9752   segT exp_seg = 0;
9753   expressionS *exp;
9754   i386_operand_type types;
9755
9756   operand_type_set (&types, ~0);
9757
9758   if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
9759     {
9760       as_bad (_("at most %d immediate operands are allowed"),
9761               MAX_IMMEDIATE_OPERANDS);
9762       return 0;
9763     }
9764
9765   exp = &im_expressions[i.imm_operands++];
9766   i.op[this_operand].imms = exp;
9767
9768   if (is_space_char (*imm_start))
9769     ++imm_start;
9770
9771   save_input_line_pointer = input_line_pointer;
9772   input_line_pointer = imm_start;
9773
9774   gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
9775   if (gotfree_input_line)
9776     input_line_pointer = gotfree_input_line;
9777
9778   exp_seg = expression (exp);
9779
9780   SKIP_WHITESPACE ();
9781
9782   /* Handle vector operations.  */
9783   if (*input_line_pointer == '{')
9784     {
9785       input_line_pointer = check_VecOperations (input_line_pointer,
9786                                                 NULL);
9787       if (input_line_pointer == NULL)
9788         return 0;
9789     }
9790
9791   if (*input_line_pointer)
9792     as_bad (_("junk `%s' after expression"), input_line_pointer);
9793
9794   input_line_pointer = save_input_line_pointer;
9795   if (gotfree_input_line)
9796     {
9797       free (gotfree_input_line);
9798
9799       if (exp->X_op == O_constant || exp->X_op == O_register)
9800         exp->X_op = O_illegal;
9801     }
9802
9803   return i386_finalize_immediate (exp_seg, exp, types, imm_start);
9804 }
9805
9806 static int
9807 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
9808                          i386_operand_type types, const char *imm_start)
9809 {
9810   if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
9811     {
9812       if (imm_start)
9813         as_bad (_("missing or invalid immediate expression `%s'"),
9814                 imm_start);
9815       return 0;
9816     }
9817   else if (exp->X_op == O_constant)
9818     {
9819       /* Size it properly later.  */
9820       i.types[this_operand].bitfield.imm64 = 1;
9821       /* If not 64bit, sign extend val.  */
9822       if (flag_code != CODE_64BIT
9823           && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
9824         exp->X_add_number
9825           = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
9826     }
9827 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
9828   else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
9829            && exp_seg != absolute_section
9830            && exp_seg != text_section
9831            && exp_seg != data_section
9832            && exp_seg != bss_section
9833            && exp_seg != undefined_section
9834            && !bfd_is_com_section (exp_seg))
9835     {
9836       as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
9837       return 0;
9838     }
9839 #endif
9840   else if (!intel_syntax && exp_seg == reg_section)
9841     {
9842       if (imm_start)
9843         as_bad (_("illegal immediate register operand %s"), imm_start);
9844       return 0;
9845     }
9846   else
9847     {
9848       /* This is an address.  The size of the address will be
9849          determined later, depending on destination register,
9850          suffix, or the default for the section.  */
9851       i.types[this_operand].bitfield.imm8 = 1;
9852       i.types[this_operand].bitfield.imm16 = 1;
9853       i.types[this_operand].bitfield.imm32 = 1;
9854       i.types[this_operand].bitfield.imm32s = 1;
9855       i.types[this_operand].bitfield.imm64 = 1;
9856       i.types[this_operand] = operand_type_and (i.types[this_operand],
9857                                                 types);
9858     }
9859
9860   return 1;
9861 }
9862
9863 static char *
9864 i386_scale (char *scale)
9865 {
9866   offsetT val;
9867   char *save = input_line_pointer;
9868
9869   input_line_pointer = scale;
9870   val = get_absolute_expression ();
9871
9872   switch (val)
9873     {
9874     case 1:
9875       i.log2_scale_factor = 0;
9876       break;
9877     case 2:
9878       i.log2_scale_factor = 1;
9879       break;
9880     case 4:
9881       i.log2_scale_factor = 2;
9882       break;
9883     case 8:
9884       i.log2_scale_factor = 3;
9885       break;
9886     default:
9887       {
9888         char sep = *input_line_pointer;
9889
9890         *input_line_pointer = '\0';
9891         as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
9892                 scale);
9893         *input_line_pointer = sep;
9894         input_line_pointer = save;
9895         return NULL;
9896       }
9897     }
9898   if (i.log2_scale_factor != 0 && i.index_reg == 0)
9899     {
9900       as_warn (_("scale factor of %d without an index register"),
9901                1 << i.log2_scale_factor);
9902       i.log2_scale_factor = 0;
9903     }
9904   scale = input_line_pointer;
9905   input_line_pointer = save;
9906   return scale;
9907 }
9908
9909 static int
9910 i386_displacement (char *disp_start, char *disp_end)
9911 {
9912   expressionS *exp;
9913   segT exp_seg = 0;
9914   char *save_input_line_pointer;
9915   char *gotfree_input_line;
9916   int override;
9917   i386_operand_type bigdisp, types = anydisp;
9918   int ret;
9919
9920   if (i.disp_operands == MAX_MEMORY_OPERANDS)
9921     {
9922       as_bad (_("at most %d displacement operands are allowed"),
9923               MAX_MEMORY_OPERANDS);
9924       return 0;
9925     }
9926
9927   operand_type_set (&bigdisp, 0);
9928   if (i.jumpabsolute
9929       || i.types[this_operand].bitfield.baseindex
9930       || (current_templates->start->opcode_modifier.jump != JUMP
9931           && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
9932     {
9933       i386_addressing_mode ();
9934       override = (i.prefix[ADDR_PREFIX] != 0);
9935       if (flag_code == CODE_64BIT)
9936         {
9937           if (!override)
9938             {
9939               bigdisp.bitfield.disp32s = 1;
9940               bigdisp.bitfield.disp64 = 1;
9941             }
9942           else
9943             bigdisp.bitfield.disp32 = 1;
9944         }
9945       else if ((flag_code == CODE_16BIT) ^ override)
9946           bigdisp.bitfield.disp16 = 1;
9947       else
9948           bigdisp.bitfield.disp32 = 1;
9949     }
9950   else
9951     {
9952       /* For PC-relative branches, the width of the displacement may be
9953          dependent upon data size, but is never dependent upon address size.
9954          Also make sure to not unintentionally match against a non-PC-relative
9955          branch template.  */
9956       static templates aux_templates;
9957       const insn_template *t = current_templates->start;
9958       bfd_boolean has_intel64 = FALSE;
9959
9960       aux_templates.start = t;
9961       while (++t < current_templates->end)
9962         {
9963           if (t->opcode_modifier.jump
9964               != current_templates->start->opcode_modifier.jump)
9965             break;
9966           if (t->opcode_modifier.intel64)
9967             has_intel64 = TRUE;
9968         }
9969       if (t < current_templates->end)
9970         {
9971           aux_templates.end = t;
9972           current_templates = &aux_templates;
9973         }
9974
9975       override = (i.prefix[DATA_PREFIX] != 0);
9976       if (flag_code == CODE_64BIT)
9977         {
9978           if ((override || i.suffix == WORD_MNEM_SUFFIX)
9979               && (!intel64 || !has_intel64))
9980             bigdisp.bitfield.disp16 = 1;
9981           else
9982             bigdisp.bitfield.disp32s = 1;
9983         }
9984       else
9985         {
9986           if (!override)
9987             override = (i.suffix == (flag_code != CODE_16BIT
9988                                      ? WORD_MNEM_SUFFIX
9989                                      : LONG_MNEM_SUFFIX));
9990           bigdisp.bitfield.disp32 = 1;
9991           if ((flag_code == CODE_16BIT) ^ override)
9992             {
9993               bigdisp.bitfield.disp32 = 0;
9994               bigdisp.bitfield.disp16 = 1;
9995             }
9996         }
9997     }
9998   i.types[this_operand] = operand_type_or (i.types[this_operand],
9999                                            bigdisp);
10000
10001   exp = &disp_expressions[i.disp_operands];
10002   i.op[this_operand].disps = exp;
10003   i.disp_operands++;
10004   save_input_line_pointer = input_line_pointer;
10005   input_line_pointer = disp_start;
10006   END_STRING_AND_SAVE (disp_end);
10007
10008 #ifndef GCC_ASM_O_HACK
10009 #define GCC_ASM_O_HACK 0
10010 #endif
10011 #if GCC_ASM_O_HACK
10012   END_STRING_AND_SAVE (disp_end + 1);
10013   if (i.types[this_operand].bitfield.baseIndex
10014       && displacement_string_end[-1] == '+')
10015     {
10016       /* This hack is to avoid a warning when using the "o"
10017          constraint within gcc asm statements.
10018          For instance:
10019
10020          #define _set_tssldt_desc(n,addr,limit,type) \
10021          __asm__ __volatile__ ( \
10022          "movw %w2,%0\n\t" \
10023          "movw %w1,2+%0\n\t" \
10024          "rorl $16,%1\n\t" \
10025          "movb %b1,4+%0\n\t" \
10026          "movb %4,5+%0\n\t" \
10027          "movb $0,6+%0\n\t" \
10028          "movb %h1,7+%0\n\t" \
10029          "rorl $16,%1" \
10030          : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
10031
10032          This works great except that the output assembler ends
10033          up looking a bit weird if it turns out that there is
10034          no offset.  You end up producing code that looks like:
10035
10036          #APP
10037          movw $235,(%eax)
10038          movw %dx,2+(%eax)
10039          rorl $16,%edx
10040          movb %dl,4+(%eax)
10041          movb $137,5+(%eax)
10042          movb $0,6+(%eax)
10043          movb %dh,7+(%eax)
10044          rorl $16,%edx
10045          #NO_APP
10046
10047          So here we provide the missing zero.  */
10048
10049       *displacement_string_end = '0';
10050     }
10051 #endif
10052   gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10053   if (gotfree_input_line)
10054     input_line_pointer = gotfree_input_line;
10055
10056   exp_seg = expression (exp);
10057
10058   SKIP_WHITESPACE ();
10059   if (*input_line_pointer)
10060     as_bad (_("junk `%s' after expression"), input_line_pointer);
10061 #if GCC_ASM_O_HACK
10062   RESTORE_END_STRING (disp_end + 1);
10063 #endif
10064   input_line_pointer = save_input_line_pointer;
10065   if (gotfree_input_line)
10066     {
10067       free (gotfree_input_line);
10068
10069       if (exp->X_op == O_constant || exp->X_op == O_register)
10070         exp->X_op = O_illegal;
10071     }
10072
10073   ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
10074
10075   RESTORE_END_STRING (disp_end);
10076
10077   return ret;
10078 }
10079
10080 static int
10081 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10082                             i386_operand_type types, const char *disp_start)
10083 {
10084   i386_operand_type bigdisp;
10085   int ret = 1;
10086
10087   /* We do this to make sure that the section symbol is in
10088      the symbol table.  We will ultimately change the relocation
10089      to be relative to the beginning of the section.  */
10090   if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
10091       || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
10092       || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10093     {
10094       if (exp->X_op != O_symbol)
10095         goto inv_disp;
10096
10097       if (S_IS_LOCAL (exp->X_add_symbol)
10098           && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
10099           && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
10100         section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
10101       exp->X_op = O_subtract;
10102       exp->X_op_symbol = GOT_symbol;
10103       if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
10104         i.reloc[this_operand] = BFD_RELOC_32_PCREL;
10105       else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10106         i.reloc[this_operand] = BFD_RELOC_64;
10107       else
10108         i.reloc[this_operand] = BFD_RELOC_32;
10109     }
10110
10111   else if (exp->X_op == O_absent
10112            || exp->X_op == O_illegal
10113            || exp->X_op == O_big)
10114     {
10115     inv_disp:
10116       as_bad (_("missing or invalid displacement expression `%s'"),
10117               disp_start);
10118       ret = 0;
10119     }
10120
10121   else if (flag_code == CODE_64BIT
10122            && !i.prefix[ADDR_PREFIX]
10123            && exp->X_op == O_constant)
10124     {
10125       /* Since displacement is signed extended to 64bit, don't allow
10126          disp32 and turn off disp32s if they are out of range.  */
10127       i.types[this_operand].bitfield.disp32 = 0;
10128       if (!fits_in_signed_long (exp->X_add_number))
10129         {
10130           i.types[this_operand].bitfield.disp32s = 0;
10131           if (i.types[this_operand].bitfield.baseindex)
10132             {
10133               as_bad (_("0x%lx out range of signed 32bit displacement"),
10134                       (long) exp->X_add_number);
10135               ret = 0;
10136             }
10137         }
10138     }
10139
10140 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10141   else if (exp->X_op != O_constant
10142            && OUTPUT_FLAVOR == bfd_target_aout_flavour
10143            && exp_seg != absolute_section
10144            && exp_seg != text_section
10145            && exp_seg != data_section
10146            && exp_seg != bss_section
10147            && exp_seg != undefined_section
10148            && !bfd_is_com_section (exp_seg))
10149     {
10150       as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10151       ret = 0;
10152     }
10153 #endif
10154
10155   if (current_templates->start->opcode_modifier.jump == JUMP_BYTE
10156       /* Constants get taken care of by optimize_disp().  */
10157       && exp->X_op != O_constant)
10158     i.types[this_operand].bitfield.disp8 = 1;
10159
10160   /* Check if this is a displacement only operand.  */
10161   bigdisp = i.types[this_operand];
10162   bigdisp.bitfield.disp8 = 0;
10163   bigdisp.bitfield.disp16 = 0;
10164   bigdisp.bitfield.disp32 = 0;
10165   bigdisp.bitfield.disp32s = 0;
10166   bigdisp.bitfield.disp64 = 0;
10167   if (operand_type_all_zero (&bigdisp))
10168     i.types[this_operand] = operand_type_and (i.types[this_operand],
10169                                               types);
10170
10171   return ret;
10172 }
10173
10174 /* Return the active addressing mode, taking address override and
10175    registers forming the address into consideration.  Update the
10176    address override prefix if necessary.  */
10177
10178 static enum flag_code
10179 i386_addressing_mode (void)
10180 {
10181   enum flag_code addr_mode;
10182
10183   if (i.prefix[ADDR_PREFIX])
10184     addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
10185   else
10186     {
10187       addr_mode = flag_code;
10188
10189 #if INFER_ADDR_PREFIX
10190       if (i.mem_operands == 0)
10191         {
10192           /* Infer address prefix from the first memory operand.  */
10193           const reg_entry *addr_reg = i.base_reg;
10194
10195           if (addr_reg == NULL)
10196             addr_reg = i.index_reg;
10197
10198           if (addr_reg)
10199             {
10200               if (addr_reg->reg_type.bitfield.dword)
10201                 addr_mode = CODE_32BIT;
10202               else if (flag_code != CODE_64BIT
10203                        && addr_reg->reg_type.bitfield.word)
10204                 addr_mode = CODE_16BIT;
10205
10206               if (addr_mode != flag_code)
10207                 {
10208                   i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10209                   i.prefixes += 1;
10210                   /* Change the size of any displacement too.  At most one
10211                      of Disp16 or Disp32 is set.
10212                      FIXME.  There doesn't seem to be any real need for
10213                      separate Disp16 and Disp32 flags.  The same goes for
10214                      Imm16 and Imm32.  Removing them would probably clean
10215                      up the code quite a lot.  */
10216                   if (flag_code != CODE_64BIT
10217                       && (i.types[this_operand].bitfield.disp16
10218                           || i.types[this_operand].bitfield.disp32))
10219                     i.types[this_operand]
10220                       = operand_type_xor (i.types[this_operand], disp16_32);
10221                 }
10222             }
10223         }
10224 #endif
10225     }
10226
10227   return addr_mode;
10228 }
10229
10230 /* Make sure the memory operand we've been dealt is valid.
10231    Return 1 on success, 0 on a failure.  */
10232
10233 static int
10234 i386_index_check (const char *operand_string)
10235 {
10236   const char *kind = "base/index";
10237   enum flag_code addr_mode = i386_addressing_mode ();
10238
10239   if (current_templates->start->opcode_modifier.isstring
10240       && !current_templates->start->cpu_flags.bitfield.cpupadlock
10241       && (current_templates->end[-1].opcode_modifier.isstring
10242           || i.mem_operands))
10243     {
10244       /* Memory operands of string insns are special in that they only allow
10245          a single register (rDI, rSI, or rBX) as their memory address.  */
10246       const reg_entry *expected_reg;
10247       static const char *di_si[][2] =
10248         {
10249           { "esi", "edi" },
10250           { "si", "di" },
10251           { "rsi", "rdi" }
10252         };
10253       static const char *bx[] = { "ebx", "bx", "rbx" };
10254
10255       kind = "string address";
10256
10257       if (current_templates->start->opcode_modifier.repprefixok)
10258         {
10259           int es_op = current_templates->end[-1].opcode_modifier.isstring
10260                       - IS_STRING_ES_OP0;
10261           int op = 0;
10262
10263           if (!current_templates->end[-1].operand_types[0].bitfield.baseindex
10264               || ((!i.mem_operands != !intel_syntax)
10265                   && current_templates->end[-1].operand_types[1]
10266                      .bitfield.baseindex))
10267             op = 1;
10268           expected_reg = hash_find (reg_hash, di_si[addr_mode][op == es_op]);
10269         }
10270       else
10271         expected_reg = hash_find (reg_hash, bx[addr_mode]);
10272
10273       if (i.base_reg != expected_reg
10274           || i.index_reg
10275           || operand_type_check (i.types[this_operand], disp))
10276         {
10277           /* The second memory operand must have the same size as
10278              the first one.  */
10279           if (i.mem_operands
10280               && i.base_reg
10281               && !((addr_mode == CODE_64BIT
10282                     && i.base_reg->reg_type.bitfield.qword)
10283                    || (addr_mode == CODE_32BIT
10284                        ? i.base_reg->reg_type.bitfield.dword
10285                        : i.base_reg->reg_type.bitfield.word)))
10286             goto bad_address;
10287
10288           as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
10289                    operand_string,
10290                    intel_syntax ? '[' : '(',
10291                    register_prefix,
10292                    expected_reg->reg_name,
10293                    intel_syntax ? ']' : ')');
10294           return 1;
10295         }
10296       else
10297         return 1;
10298
10299 bad_address:
10300       as_bad (_("`%s' is not a valid %s expression"),
10301               operand_string, kind);
10302       return 0;
10303     }
10304   else
10305     {
10306       if (addr_mode != CODE_16BIT)
10307         {
10308           /* 32-bit/64-bit checks.  */
10309           if ((i.base_reg
10310                && ((addr_mode == CODE_64BIT
10311                     ? !i.base_reg->reg_type.bitfield.qword
10312                     : !i.base_reg->reg_type.bitfield.dword)
10313                    || (i.index_reg && i.base_reg->reg_num == RegIP)
10314                    || i.base_reg->reg_num == RegIZ))
10315               || (i.index_reg
10316                   && !i.index_reg->reg_type.bitfield.xmmword
10317                   && !i.index_reg->reg_type.bitfield.ymmword
10318                   && !i.index_reg->reg_type.bitfield.zmmword
10319                   && ((addr_mode == CODE_64BIT
10320                        ? !i.index_reg->reg_type.bitfield.qword
10321                        : !i.index_reg->reg_type.bitfield.dword)
10322                       || !i.index_reg->reg_type.bitfield.baseindex)))
10323             goto bad_address;
10324
10325           /* bndmk, bndldx, and bndstx have special restrictions. */
10326           if (current_templates->start->base_opcode == 0xf30f1b
10327               || (current_templates->start->base_opcode & ~1) == 0x0f1a)
10328             {
10329               /* They cannot use RIP-relative addressing. */
10330               if (i.base_reg && i.base_reg->reg_num == RegIP)
10331                 {
10332                   as_bad (_("`%s' cannot be used here"), operand_string);
10333                   return 0;
10334                 }
10335
10336               /* bndldx and bndstx ignore their scale factor. */
10337               if (current_templates->start->base_opcode != 0xf30f1b
10338                   && i.log2_scale_factor)
10339                 as_warn (_("register scaling is being ignored here"));
10340             }
10341         }
10342       else
10343         {
10344           /* 16-bit checks.  */
10345           if ((i.base_reg
10346                && (!i.base_reg->reg_type.bitfield.word
10347                    || !i.base_reg->reg_type.bitfield.baseindex))
10348               || (i.index_reg
10349                   && (!i.index_reg->reg_type.bitfield.word
10350                       || !i.index_reg->reg_type.bitfield.baseindex
10351                       || !(i.base_reg
10352                            && i.base_reg->reg_num < 6
10353                            && i.index_reg->reg_num >= 6
10354                            && i.log2_scale_factor == 0))))
10355             goto bad_address;
10356         }
10357     }
10358   return 1;
10359 }
10360
10361 /* Handle vector immediates.  */
10362
10363 static int
10364 RC_SAE_immediate (const char *imm_start)
10365 {
10366   unsigned int match_found, j;
10367   const char *pstr = imm_start;
10368   expressionS *exp;
10369
10370   if (*pstr != '{')
10371     return 0;
10372
10373   pstr++;
10374   match_found = 0;
10375   for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
10376     {
10377       if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
10378         {
10379           if (!i.rounding)
10380             {
10381               rc_op.type = RC_NamesTable[j].type;
10382               rc_op.operand = this_operand;
10383               i.rounding = &rc_op;
10384             }
10385           else
10386             {
10387               as_bad (_("duplicated `%s'"), imm_start);
10388               return 0;
10389             }
10390           pstr += RC_NamesTable[j].len;
10391           match_found = 1;
10392           break;
10393         }
10394     }
10395   if (!match_found)
10396     return 0;
10397
10398   if (*pstr++ != '}')
10399     {
10400       as_bad (_("Missing '}': '%s'"), imm_start);
10401       return 0;
10402     }
10403   /* RC/SAE immediate string should contain nothing more.  */;
10404   if (*pstr != 0)
10405     {
10406       as_bad (_("Junk after '}': '%s'"), imm_start);
10407       return 0;
10408     }
10409
10410   exp = &im_expressions[i.imm_operands++];
10411   i.op[this_operand].imms = exp;
10412
10413   exp->X_op = O_constant;
10414   exp->X_add_number = 0;
10415   exp->X_add_symbol = (symbolS *) 0;
10416   exp->X_op_symbol = (symbolS *) 0;
10417
10418   i.types[this_operand].bitfield.imm8 = 1;
10419   return 1;
10420 }
10421
10422 /* Only string instructions can have a second memory operand, so
10423    reduce current_templates to just those if it contains any.  */
10424 static int
10425 maybe_adjust_templates (void)
10426 {
10427   const insn_template *t;
10428
10429   gas_assert (i.mem_operands == 1);
10430
10431   for (t = current_templates->start; t < current_templates->end; ++t)
10432     if (t->opcode_modifier.isstring)
10433       break;
10434
10435   if (t < current_templates->end)
10436     {
10437       static templates aux_templates;
10438       bfd_boolean recheck;
10439
10440       aux_templates.start = t;
10441       for (; t < current_templates->end; ++t)
10442         if (!t->opcode_modifier.isstring)
10443           break;
10444       aux_templates.end = t;
10445
10446       /* Determine whether to re-check the first memory operand.  */
10447       recheck = (aux_templates.start != current_templates->start
10448                  || t != current_templates->end);
10449
10450       current_templates = &aux_templates;
10451
10452       if (recheck)
10453         {
10454           i.mem_operands = 0;
10455           if (i.memop1_string != NULL
10456               && i386_index_check (i.memop1_string) == 0)
10457             return 0;
10458           i.mem_operands = 1;
10459         }
10460     }
10461
10462   return 1;
10463 }
10464
10465 /* Parse OPERAND_STRING into the i386_insn structure I.  Returns zero
10466    on error.  */
10467
10468 static int
10469 i386_att_operand (char *operand_string)
10470 {
10471   const reg_entry *r;
10472   char *end_op;
10473   char *op_string = operand_string;
10474
10475   if (is_space_char (*op_string))
10476     ++op_string;
10477
10478   /* We check for an absolute prefix (differentiating,
10479      for example, 'jmp pc_relative_label' from 'jmp *absolute_label'.  */
10480   if (*op_string == ABSOLUTE_PREFIX)
10481     {
10482       ++op_string;
10483       if (is_space_char (*op_string))
10484         ++op_string;
10485       i.jumpabsolute = TRUE;
10486     }
10487
10488   /* Check if operand is a register.  */
10489   if ((r = parse_register (op_string, &end_op)) != NULL)
10490     {
10491       i386_operand_type temp;
10492
10493       /* Check for a segment override by searching for ':' after a
10494          segment register.  */
10495       op_string = end_op;
10496       if (is_space_char (*op_string))
10497         ++op_string;
10498       if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
10499         {
10500           switch (r->reg_num)
10501             {
10502             case 0:
10503               i.seg[i.mem_operands] = &es;
10504               break;
10505             case 1:
10506               i.seg[i.mem_operands] = &cs;
10507               break;
10508             case 2:
10509               i.seg[i.mem_operands] = &ss;
10510               break;
10511             case 3:
10512               i.seg[i.mem_operands] = &ds;
10513               break;
10514             case 4:
10515               i.seg[i.mem_operands] = &fs;
10516               break;
10517             case 5:
10518               i.seg[i.mem_operands] = &gs;
10519               break;
10520             }
10521
10522           /* Skip the ':' and whitespace.  */
10523           ++op_string;
10524           if (is_space_char (*op_string))
10525             ++op_string;
10526
10527           if (!is_digit_char (*op_string)
10528               && !is_identifier_char (*op_string)
10529               && *op_string != '('
10530               && *op_string != ABSOLUTE_PREFIX)
10531             {
10532               as_bad (_("bad memory operand `%s'"), op_string);
10533               return 0;
10534             }
10535           /* Handle case of %es:*foo.  */
10536           if (*op_string == ABSOLUTE_PREFIX)
10537             {
10538               ++op_string;
10539               if (is_space_char (*op_string))
10540                 ++op_string;
10541               i.jumpabsolute = TRUE;
10542             }
10543           goto do_memory_reference;
10544         }
10545
10546       /* Handle vector operations.  */
10547       if (*op_string == '{')
10548         {
10549           op_string = check_VecOperations (op_string, NULL);
10550           if (op_string == NULL)
10551             return 0;
10552         }
10553
10554       if (*op_string)
10555         {
10556           as_bad (_("junk `%s' after register"), op_string);
10557           return 0;
10558         }
10559       temp = r->reg_type;
10560       temp.bitfield.baseindex = 0;
10561       i.types[this_operand] = operand_type_or (i.types[this_operand],
10562                                                temp);
10563       i.types[this_operand].bitfield.unspecified = 0;
10564       i.op[this_operand].regs = r;
10565       i.reg_operands++;
10566     }
10567   else if (*op_string == REGISTER_PREFIX)
10568     {
10569       as_bad (_("bad register name `%s'"), op_string);
10570       return 0;
10571     }
10572   else if (*op_string == IMMEDIATE_PREFIX)
10573     {
10574       ++op_string;
10575       if (i.jumpabsolute)
10576         {
10577           as_bad (_("immediate operand illegal with absolute jump"));
10578           return 0;
10579         }
10580       if (!i386_immediate (op_string))
10581         return 0;
10582     }
10583   else if (RC_SAE_immediate (operand_string))
10584     {
10585       /* If it is a RC or SAE immediate, do nothing.  */
10586       ;
10587     }
10588   else if (is_digit_char (*op_string)
10589            || is_identifier_char (*op_string)
10590            || *op_string == '"'
10591            || *op_string == '(')
10592     {
10593       /* This is a memory reference of some sort.  */
10594       char *base_string;
10595
10596       /* Start and end of displacement string expression (if found).  */
10597       char *displacement_string_start;
10598       char *displacement_string_end;
10599       char *vop_start;
10600
10601     do_memory_reference:
10602       if (i.mem_operands == 1 && !maybe_adjust_templates ())
10603         return 0;
10604       if ((i.mem_operands == 1
10605            && !current_templates->start->opcode_modifier.isstring)
10606           || i.mem_operands == 2)
10607         {
10608           as_bad (_("too many memory references for `%s'"),
10609                   current_templates->start->name);
10610           return 0;
10611         }
10612
10613       /* Check for base index form.  We detect the base index form by
10614          looking for an ')' at the end of the operand, searching
10615          for the '(' matching it, and finding a REGISTER_PREFIX or ','
10616          after the '('.  */
10617       base_string = op_string + strlen (op_string);
10618
10619       /* Handle vector operations.  */
10620       vop_start = strchr (op_string, '{');
10621       if (vop_start && vop_start < base_string)
10622         {
10623           if (check_VecOperations (vop_start, base_string) == NULL)
10624             return 0;
10625           base_string = vop_start;
10626         }
10627
10628       --base_string;
10629       if (is_space_char (*base_string))
10630         --base_string;
10631
10632       /* If we only have a displacement, set-up for it to be parsed later.  */
10633       displacement_string_start = op_string;
10634       displacement_string_end = base_string + 1;
10635
10636       if (*base_string == ')')
10637         {
10638           char *temp_string;
10639           unsigned int parens_balanced = 1;
10640           /* We've already checked that the number of left & right ()'s are
10641              equal, so this loop will not be infinite.  */
10642           do
10643             {
10644               base_string--;
10645               if (*base_string == ')')
10646                 parens_balanced++;
10647               if (*base_string == '(')
10648                 parens_balanced--;
10649             }
10650           while (parens_balanced);
10651
10652           temp_string = base_string;
10653
10654           /* Skip past '(' and whitespace.  */
10655           ++base_string;
10656           if (is_space_char (*base_string))
10657             ++base_string;
10658
10659           if (*base_string == ','
10660               || ((i.base_reg = parse_register (base_string, &end_op))
10661                   != NULL))
10662             {
10663               displacement_string_end = temp_string;
10664
10665               i.types[this_operand].bitfield.baseindex = 1;
10666
10667               if (i.base_reg)
10668                 {
10669                   base_string = end_op;
10670                   if (is_space_char (*base_string))
10671                     ++base_string;
10672                 }
10673
10674               /* There may be an index reg or scale factor here.  */
10675               if (*base_string == ',')
10676                 {
10677                   ++base_string;
10678                   if (is_space_char (*base_string))
10679                     ++base_string;
10680
10681                   if ((i.index_reg = parse_register (base_string, &end_op))
10682                       != NULL)
10683                     {
10684                       base_string = end_op;
10685                       if (is_space_char (*base_string))
10686                         ++base_string;
10687                       if (*base_string == ',')
10688                         {
10689                           ++base_string;
10690                           if (is_space_char (*base_string))
10691                             ++base_string;
10692                         }
10693                       else if (*base_string != ')')
10694                         {
10695                           as_bad (_("expecting `,' or `)' "
10696                                     "after index register in `%s'"),
10697                                   operand_string);
10698                           return 0;
10699                         }
10700                     }
10701                   else if (*base_string == REGISTER_PREFIX)
10702                     {
10703                       end_op = strchr (base_string, ',');
10704                       if (end_op)
10705                         *end_op = '\0';
10706                       as_bad (_("bad register name `%s'"), base_string);
10707                       return 0;
10708                     }
10709
10710                   /* Check for scale factor.  */
10711                   if (*base_string != ')')
10712                     {
10713                       char *end_scale = i386_scale (base_string);
10714
10715                       if (!end_scale)
10716                         return 0;
10717
10718                       base_string = end_scale;
10719                       if (is_space_char (*base_string))
10720                         ++base_string;
10721                       if (*base_string != ')')
10722                         {
10723                           as_bad (_("expecting `)' "
10724                                     "after scale factor in `%s'"),
10725                                   operand_string);
10726                           return 0;
10727                         }
10728                     }
10729                   else if (!i.index_reg)
10730                     {
10731                       as_bad (_("expecting index register or scale factor "
10732                                 "after `,'; got '%c'"),
10733                               *base_string);
10734                       return 0;
10735                     }
10736                 }
10737               else if (*base_string != ')')
10738                 {
10739                   as_bad (_("expecting `,' or `)' "
10740                             "after base register in `%s'"),
10741                           operand_string);
10742                   return 0;
10743                 }
10744             }
10745           else if (*base_string == REGISTER_PREFIX)
10746             {
10747               end_op = strchr (base_string, ',');
10748               if (end_op)
10749                 *end_op = '\0';
10750               as_bad (_("bad register name `%s'"), base_string);
10751               return 0;
10752             }
10753         }
10754
10755       /* If there's an expression beginning the operand, parse it,
10756          assuming displacement_string_start and
10757          displacement_string_end are meaningful.  */
10758       if (displacement_string_start != displacement_string_end)
10759         {
10760           if (!i386_displacement (displacement_string_start,
10761                                   displacement_string_end))
10762             return 0;
10763         }
10764
10765       /* Special case for (%dx) while doing input/output op.  */
10766       if (i.base_reg
10767           && i.base_reg->reg_type.bitfield.instance == RegD
10768           && i.base_reg->reg_type.bitfield.word
10769           && i.index_reg == 0
10770           && i.log2_scale_factor == 0
10771           && i.seg[i.mem_operands] == 0
10772           && !operand_type_check (i.types[this_operand], disp))
10773         {
10774           i.types[this_operand] = i.base_reg->reg_type;
10775           return 1;
10776         }
10777
10778       if (i386_index_check (operand_string) == 0)
10779         return 0;
10780       i.flags[this_operand] |= Operand_Mem;
10781       if (i.mem_operands == 0)
10782         i.memop1_string = xstrdup (operand_string);
10783       i.mem_operands++;
10784     }
10785   else
10786     {
10787       /* It's not a memory operand; argh!  */
10788       as_bad (_("invalid char %s beginning operand %d `%s'"),
10789               output_invalid (*op_string),
10790               this_operand + 1,
10791               op_string);
10792       return 0;
10793     }
10794   return 1;                     /* Normal return.  */
10795 }
10796 \f
10797 /* Calculate the maximum variable size (i.e., excluding fr_fix)
10798    that an rs_machine_dependent frag may reach.  */
10799
10800 unsigned int
10801 i386_frag_max_var (fragS *frag)
10802 {
10803   /* The only relaxable frags are for jumps.
10804      Unconditional jumps can grow by 4 bytes and others by 5 bytes.  */
10805   gas_assert (frag->fr_type == rs_machine_dependent);
10806   return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
10807 }
10808
10809 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10810 static int
10811 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
10812 {
10813   /* STT_GNU_IFUNC symbol must go through PLT.  */
10814   if ((symbol_get_bfdsym (fr_symbol)->flags
10815        & BSF_GNU_INDIRECT_FUNCTION) != 0)
10816     return 0;
10817
10818   if (!S_IS_EXTERNAL (fr_symbol))
10819     /* Symbol may be weak or local.  */
10820     return !S_IS_WEAK (fr_symbol);
10821
10822   /* Global symbols with non-default visibility can't be preempted. */
10823   if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
10824     return 1;
10825
10826   if (fr_var != NO_RELOC)
10827     switch ((enum bfd_reloc_code_real) fr_var)
10828       {
10829       case BFD_RELOC_386_PLT32:
10830       case BFD_RELOC_X86_64_PLT32:
10831         /* Symbol with PLT relocation may be preempted. */
10832         return 0;
10833       default:
10834         abort ();
10835       }
10836
10837   /* Global symbols with default visibility in a shared library may be
10838      preempted by another definition.  */
10839   return !shared;
10840 }
10841 #endif
10842
10843 /* Return the next non-empty frag.  */
10844
10845 static fragS *
10846 i386_next_non_empty_frag (fragS *fragP)
10847 {
10848   /* There may be a frag with a ".fill 0" when there is no room in
10849      the current frag for frag_grow in output_insn.  */
10850   for (fragP = fragP->fr_next;
10851        (fragP != NULL
10852         && fragP->fr_type == rs_fill
10853         && fragP->fr_fix == 0);
10854        fragP = fragP->fr_next)
10855     ;
10856   return fragP;
10857 }
10858
10859 /* Return the next jcc frag after BRANCH_PADDING.  */
10860
10861 static fragS *
10862 i386_next_jcc_frag (fragS *fragP)
10863 {
10864   if (!fragP)
10865     return NULL;
10866
10867   if (fragP->fr_type == rs_machine_dependent
10868       && (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
10869           == BRANCH_PADDING))
10870     {
10871       fragP = i386_next_non_empty_frag (fragP);
10872       if (fragP->fr_type != rs_machine_dependent)
10873         return NULL;
10874       if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == COND_JUMP)
10875         return fragP;
10876     }
10877
10878   return NULL;
10879 }
10880
10881 /* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags.  */
10882
10883 static void
10884 i386_classify_machine_dependent_frag (fragS *fragP)
10885 {
10886   fragS *cmp_fragP;
10887   fragS *pad_fragP;
10888   fragS *branch_fragP;
10889   fragS *next_fragP;
10890   unsigned int max_prefix_length;
10891
10892   if (fragP->tc_frag_data.classified)
10893     return;
10894
10895   /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING.  Convert
10896      FUSED_JCC_PADDING and merge BRANCH_PADDING.  */
10897   for (next_fragP = fragP;
10898        next_fragP != NULL;
10899        next_fragP = next_fragP->fr_next)
10900     {
10901       next_fragP->tc_frag_data.classified = 1;
10902       if (next_fragP->fr_type == rs_machine_dependent)
10903         switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
10904           {
10905           case BRANCH_PADDING:
10906             /* The BRANCH_PADDING frag must be followed by a branch
10907                frag.  */
10908             branch_fragP = i386_next_non_empty_frag (next_fragP);
10909             next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
10910             break;
10911           case FUSED_JCC_PADDING:
10912             /* Check if this is a fused jcc:
10913                FUSED_JCC_PADDING
10914                CMP like instruction
10915                BRANCH_PADDING
10916                COND_JUMP
10917                */
10918             cmp_fragP = i386_next_non_empty_frag (next_fragP);
10919             pad_fragP = i386_next_non_empty_frag (cmp_fragP);
10920             branch_fragP = i386_next_jcc_frag (pad_fragP);
10921             if (branch_fragP)
10922               {
10923                 /* The BRANCH_PADDING frag is merged with the
10924                    FUSED_JCC_PADDING frag.  */
10925                 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
10926                 /* CMP like instruction size.  */
10927                 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
10928                 frag_wane (pad_fragP);
10929                 /* Skip to branch_fragP.  */
10930                 next_fragP = branch_fragP;
10931               }
10932             else if (next_fragP->tc_frag_data.max_prefix_length)
10933               {
10934                 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
10935                    a fused jcc.  */
10936                 next_fragP->fr_subtype
10937                   = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
10938                 next_fragP->tc_frag_data.max_bytes
10939                   = next_fragP->tc_frag_data.max_prefix_length;
10940                 /* This will be updated in the BRANCH_PREFIX scan.  */
10941                 next_fragP->tc_frag_data.max_prefix_length = 0;
10942               }
10943             else
10944               frag_wane (next_fragP);
10945             break;
10946           }
10947     }
10948
10949   /* Stop if there is no BRANCH_PREFIX.  */
10950   if (!align_branch_prefix_size)
10951     return;
10952
10953   /* Scan for BRANCH_PREFIX.  */
10954   for (; fragP != NULL; fragP = fragP->fr_next)
10955     {
10956       if (fragP->fr_type != rs_machine_dependent
10957           || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
10958               != BRANCH_PREFIX))
10959         continue;
10960
10961       /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
10962          COND_JUMP_PREFIX.  */
10963       max_prefix_length = 0;
10964       for (next_fragP = fragP;
10965            next_fragP != NULL;
10966            next_fragP = next_fragP->fr_next)
10967         {
10968           if (next_fragP->fr_type == rs_fill)
10969             /* Skip rs_fill frags.  */
10970             continue;
10971           else if (next_fragP->fr_type != rs_machine_dependent)
10972             /* Stop for all other frags.  */
10973             break;
10974
10975           /* rs_machine_dependent frags.  */
10976           if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
10977               == BRANCH_PREFIX)
10978             {
10979               /* Count BRANCH_PREFIX frags.  */
10980               if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
10981                 {
10982                   max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
10983                   frag_wane (next_fragP);
10984                 }
10985               else
10986                 max_prefix_length
10987                   += next_fragP->tc_frag_data.max_bytes;
10988             }
10989           else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
10990                     == BRANCH_PADDING)
10991                    || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
10992                        == FUSED_JCC_PADDING))
10993             {
10994               /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING.  */
10995               fragP->tc_frag_data.u.padding_fragP = next_fragP;
10996               break;
10997             }
10998           else
10999             /* Stop for other rs_machine_dependent frags.  */
11000             break;
11001         }
11002
11003       fragP->tc_frag_data.max_prefix_length = max_prefix_length;
11004
11005       /* Skip to the next frag.  */
11006       fragP = next_fragP;
11007     }
11008 }
11009
11010 /* Compute padding size for
11011
11012         FUSED_JCC_PADDING
11013         CMP like instruction
11014         BRANCH_PADDING
11015         COND_JUMP/UNCOND_JUMP
11016
11017    or
11018
11019         BRANCH_PADDING
11020         COND_JUMP/UNCOND_JUMP
11021  */
11022
11023 static int
11024 i386_branch_padding_size (fragS *fragP, offsetT address)
11025 {
11026   unsigned int offset, size, padding_size;
11027   fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
11028
11029   /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag.  */
11030   if (!address)
11031     address = fragP->fr_address;
11032   address += fragP->fr_fix;
11033
11034   /* CMP like instrunction size.  */
11035   size = fragP->tc_frag_data.cmp_size;
11036
11037   /* The base size of the branch frag.  */
11038   size += branch_fragP->fr_fix;
11039
11040   /* Add opcode and displacement bytes for the rs_machine_dependent
11041      branch frag.  */
11042   if (branch_fragP->fr_type == rs_machine_dependent)
11043     size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
11044
11045   /* Check if branch is within boundary and doesn't end at the last
11046      byte.  */
11047   offset = address & ((1U << align_branch_power) - 1);
11048   if ((offset + size) >= (1U << align_branch_power))
11049     /* Padding needed to avoid crossing boundary.  */
11050     padding_size = (1U << align_branch_power) - offset;
11051   else
11052     /* No padding needed.  */
11053     padding_size = 0;
11054
11055   /* The return value may be saved in tc_frag_data.length which is
11056      unsigned byte.  */
11057   if (!fits_in_unsigned_byte (padding_size))
11058     abort ();
11059
11060   return padding_size;
11061 }
11062
11063 /* i386_generic_table_relax_frag()
11064
11065    Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
11066    grow/shrink padding to align branch frags.  Hand others to
11067    relax_frag().  */
11068
11069 long
11070 i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
11071 {
11072   if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11073       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11074     {
11075       long padding_size = i386_branch_padding_size (fragP, 0);
11076       long grow = padding_size - fragP->tc_frag_data.length;
11077
11078       /* When the BRANCH_PREFIX frag is used, the computed address
11079          must match the actual address and there should be no padding.  */
11080       if (fragP->tc_frag_data.padding_address
11081           && (fragP->tc_frag_data.padding_address != fragP->fr_address
11082               || padding_size))
11083         abort ();
11084
11085       /* Update the padding size.  */
11086       if (grow)
11087         fragP->tc_frag_data.length = padding_size;
11088
11089       return grow;
11090     }
11091   else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11092     {
11093       fragS *padding_fragP, *next_fragP;
11094       long padding_size, left_size, last_size;
11095
11096       padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11097       if (!padding_fragP)
11098         /* Use the padding set by the leading BRANCH_PREFIX frag.  */
11099         return (fragP->tc_frag_data.length
11100                 - fragP->tc_frag_data.last_length);
11101
11102       /* Compute the relative address of the padding frag in the very
11103         first time where the BRANCH_PREFIX frag sizes are zero.  */
11104       if (!fragP->tc_frag_data.padding_address)
11105         fragP->tc_frag_data.padding_address
11106           = padding_fragP->fr_address - (fragP->fr_address - stretch);
11107
11108       /* First update the last length from the previous interation.  */
11109       left_size = fragP->tc_frag_data.prefix_length;
11110       for (next_fragP = fragP;
11111            next_fragP != padding_fragP;
11112            next_fragP = next_fragP->fr_next)
11113         if (next_fragP->fr_type == rs_machine_dependent
11114             && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11115                 == BRANCH_PREFIX))
11116           {
11117             if (left_size)
11118               {
11119                 int max = next_fragP->tc_frag_data.max_bytes;
11120                 if (max)
11121                   {
11122                     int size;
11123                     if (max > left_size)
11124                       size = left_size;
11125                     else
11126                       size = max;
11127                     left_size -= size;
11128                     next_fragP->tc_frag_data.last_length = size;
11129                   }
11130               }
11131             else
11132               next_fragP->tc_frag_data.last_length = 0;
11133           }
11134
11135       /* Check the padding size for the padding frag.  */
11136       padding_size = i386_branch_padding_size
11137         (padding_fragP, (fragP->fr_address
11138                          + fragP->tc_frag_data.padding_address));
11139
11140       last_size = fragP->tc_frag_data.prefix_length;
11141       /* Check if there is change from the last interation.  */
11142       if (padding_size == last_size)
11143         {
11144           /* Update the expected address of the padding frag.  */
11145           padding_fragP->tc_frag_data.padding_address
11146             = (fragP->fr_address + padding_size
11147                + fragP->tc_frag_data.padding_address);
11148           return 0;
11149         }
11150
11151       if (padding_size > fragP->tc_frag_data.max_prefix_length)
11152         {
11153           /* No padding if there is no sufficient room.  Clear the
11154              expected address of the padding frag.  */
11155           padding_fragP->tc_frag_data.padding_address = 0;
11156           padding_size = 0;
11157         }
11158       else
11159         /* Store the expected address of the padding frag.  */
11160         padding_fragP->tc_frag_data.padding_address
11161           = (fragP->fr_address + padding_size
11162              + fragP->tc_frag_data.padding_address);
11163
11164       fragP->tc_frag_data.prefix_length = padding_size;
11165
11166       /* Update the length for the current interation.  */
11167       left_size = padding_size;
11168       for (next_fragP = fragP;
11169            next_fragP != padding_fragP;
11170            next_fragP = next_fragP->fr_next)
11171         if (next_fragP->fr_type == rs_machine_dependent
11172             && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11173                 == BRANCH_PREFIX))
11174           {
11175             if (left_size)
11176               {
11177                 int max = next_fragP->tc_frag_data.max_bytes;
11178                 if (max)
11179                   {
11180                     int size;
11181                     if (max > left_size)
11182                       size = left_size;
11183                     else
11184                       size = max;
11185                     left_size -= size;
11186                     next_fragP->tc_frag_data.length = size;
11187                   }
11188               }
11189             else
11190               next_fragP->tc_frag_data.length = 0;
11191           }
11192
11193       return (fragP->tc_frag_data.length
11194               - fragP->tc_frag_data.last_length);
11195     }
11196   return relax_frag (segment, fragP, stretch);
11197 }
11198
11199 /* md_estimate_size_before_relax()
11200
11201    Called just before relax() for rs_machine_dependent frags.  The x86
11202    assembler uses these frags to handle variable size jump
11203    instructions.
11204
11205    Any symbol that is now undefined will not become defined.
11206    Return the correct fr_subtype in the frag.
11207    Return the initial "guess for variable size of frag" to caller.
11208    The guess is actually the growth beyond the fixed part.  Whatever
11209    we do to grow the fixed or variable part contributes to our
11210    returned value.  */
11211
11212 int
11213 md_estimate_size_before_relax (fragS *fragP, segT segment)
11214 {
11215   if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11216       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
11217       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11218     {
11219       i386_classify_machine_dependent_frag (fragP);
11220       return fragP->tc_frag_data.length;
11221     }
11222
11223   /* We've already got fragP->fr_subtype right;  all we have to do is
11224      check for un-relaxable symbols.  On an ELF system, we can't relax
11225      an externally visible symbol, because it may be overridden by a
11226      shared library.  */
11227   if (S_GET_SEGMENT (fragP->fr_symbol) != segment
11228 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11229       || (IS_ELF
11230           && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
11231                                                 fragP->fr_var))
11232 #endif
11233 #if defined (OBJ_COFF) && defined (TE_PE)
11234       || (OUTPUT_FLAVOR == bfd_target_coff_flavour
11235           && S_IS_WEAK (fragP->fr_symbol))
11236 #endif
11237       )
11238     {
11239       /* Symbol is undefined in this segment, or we need to keep a
11240          reloc so that weak symbols can be overridden.  */
11241       int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
11242       enum bfd_reloc_code_real reloc_type;
11243       unsigned char *opcode;
11244       int old_fr_fix;
11245
11246       if (fragP->fr_var != NO_RELOC)
11247         reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
11248       else if (size == 2)
11249         reloc_type = BFD_RELOC_16_PCREL;
11250 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11251       else if (need_plt32_p (fragP->fr_symbol))
11252         reloc_type = BFD_RELOC_X86_64_PLT32;
11253 #endif
11254       else
11255         reloc_type = BFD_RELOC_32_PCREL;
11256
11257       old_fr_fix = fragP->fr_fix;
11258       opcode = (unsigned char *) fragP->fr_opcode;
11259
11260       switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
11261         {
11262         case UNCOND_JUMP:
11263           /* Make jmp (0xeb) a (d)word displacement jump.  */
11264           opcode[0] = 0xe9;
11265           fragP->fr_fix += size;
11266           fix_new (fragP, old_fr_fix, size,
11267                    fragP->fr_symbol,
11268                    fragP->fr_offset, 1,
11269                    reloc_type);
11270           break;
11271
11272         case COND_JUMP86:
11273           if (size == 2
11274               && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
11275             {
11276               /* Negate the condition, and branch past an
11277                  unconditional jump.  */
11278               opcode[0] ^= 1;
11279               opcode[1] = 3;
11280               /* Insert an unconditional jump.  */
11281               opcode[2] = 0xe9;
11282               /* We added two extra opcode bytes, and have a two byte
11283                  offset.  */
11284               fragP->fr_fix += 2 + 2;
11285               fix_new (fragP, old_fr_fix + 2, 2,
11286                        fragP->fr_symbol,
11287                        fragP->fr_offset, 1,
11288                        reloc_type);
11289               break;
11290             }
11291           /* Fall through.  */
11292
11293         case COND_JUMP:
11294           if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
11295             {
11296               fixS *fixP;
11297
11298               fragP->fr_fix += 1;
11299               fixP = fix_new (fragP, old_fr_fix, 1,
11300                               fragP->fr_symbol,
11301                               fragP->fr_offset, 1,
11302                               BFD_RELOC_8_PCREL);
11303               fixP->fx_signed = 1;
11304               break;
11305             }
11306
11307           /* This changes the byte-displacement jump 0x7N
11308              to the (d)word-displacement jump 0x0f,0x8N.  */
11309           opcode[1] = opcode[0] + 0x10;
11310           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11311           /* We've added an opcode byte.  */
11312           fragP->fr_fix += 1 + size;
11313           fix_new (fragP, old_fr_fix + 1, size,
11314                    fragP->fr_symbol,
11315                    fragP->fr_offset, 1,
11316                    reloc_type);
11317           break;
11318
11319         default:
11320           BAD_CASE (fragP->fr_subtype);
11321           break;
11322         }
11323       frag_wane (fragP);
11324       return fragP->fr_fix - old_fr_fix;
11325     }
11326
11327   /* Guess size depending on current relax state.  Initially the relax
11328      state will correspond to a short jump and we return 1, because
11329      the variable part of the frag (the branch offset) is one byte
11330      long.  However, we can relax a section more than once and in that
11331      case we must either set fr_subtype back to the unrelaxed state,
11332      or return the value for the appropriate branch.  */
11333   return md_relax_table[fragP->fr_subtype].rlx_length;
11334 }
11335
11336 /* Called after relax() is finished.
11337
11338    In:  Address of frag.
11339         fr_type == rs_machine_dependent.
11340         fr_subtype is what the address relaxed to.
11341
11342    Out: Any fixSs and constants are set up.
11343         Caller will turn frag into a ".space 0".  */
11344
11345 void
11346 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
11347                  fragS *fragP)
11348 {
11349   unsigned char *opcode;
11350   unsigned char *where_to_put_displacement = NULL;
11351   offsetT target_address;
11352   offsetT opcode_address;
11353   unsigned int extension = 0;
11354   offsetT displacement_from_opcode_start;
11355
11356   if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11357       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
11358       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11359     {
11360       /* Generate nop padding.  */
11361       unsigned int size = fragP->tc_frag_data.length;
11362       if (size)
11363         {
11364           if (size > fragP->tc_frag_data.max_bytes)
11365             abort ();
11366
11367           if (flag_debug)
11368             {
11369               const char *msg;
11370               const char *branch = "branch";
11371               const char *prefix = "";
11372               fragS *padding_fragP;
11373               if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11374                   == BRANCH_PREFIX)
11375                 {
11376                   padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11377                   switch (fragP->tc_frag_data.default_prefix)
11378                     {
11379                     default:
11380                       abort ();
11381                       break;
11382                     case CS_PREFIX_OPCODE:
11383                       prefix = " cs";
11384                       break;
11385                     case DS_PREFIX_OPCODE:
11386                       prefix = " ds";
11387                       break;
11388                     case ES_PREFIX_OPCODE:
11389                       prefix = " es";
11390                       break;
11391                     case FS_PREFIX_OPCODE:
11392                       prefix = " fs";
11393                       break;
11394                     case GS_PREFIX_OPCODE:
11395                       prefix = " gs";
11396                       break;
11397                     case SS_PREFIX_OPCODE:
11398                       prefix = " ss";
11399                       break;
11400                     }
11401                   if (padding_fragP)
11402                     msg = _("%s:%u: add %d%s at 0x%llx to align "
11403                             "%s within %d-byte boundary\n");
11404                   else
11405                     msg = _("%s:%u: add additional %d%s at 0x%llx to "
11406                             "align %s within %d-byte boundary\n");
11407                 }
11408               else
11409                 {
11410                   padding_fragP = fragP;
11411                   msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
11412                           "%s within %d-byte boundary\n");
11413                 }
11414
11415               if (padding_fragP)
11416                 switch (padding_fragP->tc_frag_data.branch_type)
11417                   {
11418                   case align_branch_jcc:
11419                     branch = "jcc";
11420                     break;
11421                   case align_branch_fused:
11422                     branch = "fused jcc";
11423                     break;
11424                   case align_branch_jmp:
11425                     branch = "jmp";
11426                     break;
11427                   case align_branch_call:
11428                     branch = "call";
11429                     break;
11430                   case align_branch_indirect:
11431                     branch = "indiret branch";
11432                     break;
11433                   case align_branch_ret:
11434                     branch = "ret";
11435                     break;
11436                   default:
11437                     break;
11438                   }
11439
11440               fprintf (stdout, msg,
11441                        fragP->fr_file, fragP->fr_line, size, prefix,
11442                        (long long) fragP->fr_address, branch,
11443                        1 << align_branch_power);
11444             }
11445           if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11446             memset (fragP->fr_opcode,
11447                     fragP->tc_frag_data.default_prefix, size);
11448           else
11449             i386_generate_nops (fragP, (char *) fragP->fr_opcode,
11450                                 size, 0);
11451           fragP->fr_fix += size;
11452         }
11453       return;
11454     }
11455
11456   opcode = (unsigned char *) fragP->fr_opcode;
11457
11458   /* Address we want to reach in file space.  */
11459   target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
11460
11461   /* Address opcode resides at in file space.  */
11462   opcode_address = fragP->fr_address + fragP->fr_fix;
11463
11464   /* Displacement from opcode start to fill into instruction.  */
11465   displacement_from_opcode_start = target_address - opcode_address;
11466
11467   if ((fragP->fr_subtype & BIG) == 0)
11468     {
11469       /* Don't have to change opcode.  */
11470       extension = 1;            /* 1 opcode + 1 displacement  */
11471       where_to_put_displacement = &opcode[1];
11472     }
11473   else
11474     {
11475       if (no_cond_jump_promotion
11476           && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
11477         as_warn_where (fragP->fr_file, fragP->fr_line,
11478                        _("long jump required"));
11479
11480       switch (fragP->fr_subtype)
11481         {
11482         case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
11483           extension = 4;                /* 1 opcode + 4 displacement  */
11484           opcode[0] = 0xe9;
11485           where_to_put_displacement = &opcode[1];
11486           break;
11487
11488         case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
11489           extension = 2;                /* 1 opcode + 2 displacement  */
11490           opcode[0] = 0xe9;
11491           where_to_put_displacement = &opcode[1];
11492           break;
11493
11494         case ENCODE_RELAX_STATE (COND_JUMP, BIG):
11495         case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
11496           extension = 5;                /* 2 opcode + 4 displacement  */
11497           opcode[1] = opcode[0] + 0x10;
11498           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11499           where_to_put_displacement = &opcode[2];
11500           break;
11501
11502         case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
11503           extension = 3;                /* 2 opcode + 2 displacement  */
11504           opcode[1] = opcode[0] + 0x10;
11505           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11506           where_to_put_displacement = &opcode[2];
11507           break;
11508
11509         case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
11510           extension = 4;
11511           opcode[0] ^= 1;
11512           opcode[1] = 3;
11513           opcode[2] = 0xe9;
11514           where_to_put_displacement = &opcode[3];
11515           break;
11516
11517         default:
11518           BAD_CASE (fragP->fr_subtype);
11519           break;
11520         }
11521     }
11522
11523   /* If size if less then four we are sure that the operand fits,
11524      but if it's 4, then it could be that the displacement is larger
11525      then -/+ 2GB.  */
11526   if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
11527       && object_64bit
11528       && ((addressT) (displacement_from_opcode_start - extension
11529                       + ((addressT) 1 << 31))
11530           > (((addressT) 2 << 31) - 1)))
11531     {
11532       as_bad_where (fragP->fr_file, fragP->fr_line,
11533                     _("jump target out of range"));
11534       /* Make us emit 0.  */
11535       displacement_from_opcode_start = extension;
11536     }
11537   /* Now put displacement after opcode.  */
11538   md_number_to_chars ((char *) where_to_put_displacement,
11539                       (valueT) (displacement_from_opcode_start - extension),
11540                       DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
11541   fragP->fr_fix += extension;
11542 }
11543 \f
11544 /* Apply a fixup (fixP) to segment data, once it has been determined
11545    by our caller that we have all the info we need to fix it up.
11546
11547    Parameter valP is the pointer to the value of the bits.
11548
11549    On the 386, immediates, displacements, and data pointers are all in
11550    the same (little-endian) format, so we don't need to care about which
11551    we are handling.  */
11552
11553 void
11554 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
11555 {
11556   char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
11557   valueT value = *valP;
11558
11559 #if !defined (TE_Mach)
11560   if (fixP->fx_pcrel)
11561     {
11562       switch (fixP->fx_r_type)
11563         {
11564         default:
11565           break;
11566
11567         case BFD_RELOC_64:
11568           fixP->fx_r_type = BFD_RELOC_64_PCREL;
11569           break;
11570         case BFD_RELOC_32:
11571         case BFD_RELOC_X86_64_32S:
11572           fixP->fx_r_type = BFD_RELOC_32_PCREL;
11573           break;
11574         case BFD_RELOC_16:
11575           fixP->fx_r_type = BFD_RELOC_16_PCREL;
11576           break;
11577         case BFD_RELOC_8:
11578           fixP->fx_r_type = BFD_RELOC_8_PCREL;
11579           break;
11580         }
11581     }
11582
11583   if (fixP->fx_addsy != NULL
11584       && (fixP->fx_r_type == BFD_RELOC_32_PCREL
11585           || fixP->fx_r_type == BFD_RELOC_64_PCREL
11586           || fixP->fx_r_type == BFD_RELOC_16_PCREL
11587           || fixP->fx_r_type == BFD_RELOC_8_PCREL)
11588       && !use_rela_relocations)
11589     {
11590       /* This is a hack.  There should be a better way to handle this.
11591          This covers for the fact that bfd_install_relocation will
11592          subtract the current location (for partial_inplace, PC relative
11593          relocations); see more below.  */
11594 #ifndef OBJ_AOUT
11595       if (IS_ELF
11596 #ifdef TE_PE
11597           || OUTPUT_FLAVOR == bfd_target_coff_flavour
11598 #endif
11599           )
11600         value += fixP->fx_where + fixP->fx_frag->fr_address;
11601 #endif
11602 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11603       if (IS_ELF)
11604         {
11605           segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
11606
11607           if ((sym_seg == seg
11608                || (symbol_section_p (fixP->fx_addsy)
11609                    && sym_seg != absolute_section))
11610               && !generic_force_reloc (fixP))
11611             {
11612               /* Yes, we add the values in twice.  This is because
11613                  bfd_install_relocation subtracts them out again.  I think
11614                  bfd_install_relocation is broken, but I don't dare change
11615                  it.  FIXME.  */
11616               value += fixP->fx_where + fixP->fx_frag->fr_address;
11617             }
11618         }
11619 #endif
11620 #if defined (OBJ_COFF) && defined (TE_PE)
11621       /* For some reason, the PE format does not store a
11622          section address offset for a PC relative symbol.  */
11623       if (S_GET_SEGMENT (fixP->fx_addsy) != seg
11624           || S_IS_WEAK (fixP->fx_addsy))
11625         value += md_pcrel_from (fixP);
11626 #endif
11627     }
11628 #if defined (OBJ_COFF) && defined (TE_PE)
11629   if (fixP->fx_addsy != NULL
11630       && S_IS_WEAK (fixP->fx_addsy)
11631       /* PR 16858: Do not modify weak function references.  */
11632       && ! fixP->fx_pcrel)
11633     {
11634 #if !defined (TE_PEP)
11635       /* For x86 PE weak function symbols are neither PC-relative
11636          nor do they set S_IS_FUNCTION.  So the only reliable way
11637          to detect them is to check the flags of their containing
11638          section.  */
11639       if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
11640           && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
11641         ;
11642       else
11643 #endif
11644       value -= S_GET_VALUE (fixP->fx_addsy);
11645     }
11646 #endif
11647
11648   /* Fix a few things - the dynamic linker expects certain values here,
11649      and we must not disappoint it.  */
11650 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11651   if (IS_ELF && fixP->fx_addsy)
11652     switch (fixP->fx_r_type)
11653       {
11654       case BFD_RELOC_386_PLT32:
11655       case BFD_RELOC_X86_64_PLT32:
11656         /* Make the jump instruction point to the address of the operand.
11657            At runtime we merely add the offset to the actual PLT entry.
11658            NB: Subtract the offset size only for jump instructions.  */
11659         if (fixP->fx_pcrel)
11660           value = -4;
11661         break;
11662
11663       case BFD_RELOC_386_TLS_GD:
11664       case BFD_RELOC_386_TLS_LDM:
11665       case BFD_RELOC_386_TLS_IE_32:
11666       case BFD_RELOC_386_TLS_IE:
11667       case BFD_RELOC_386_TLS_GOTIE:
11668       case BFD_RELOC_386_TLS_GOTDESC:
11669       case BFD_RELOC_X86_64_TLSGD:
11670       case BFD_RELOC_X86_64_TLSLD:
11671       case BFD_RELOC_X86_64_GOTTPOFF:
11672       case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
11673         value = 0; /* Fully resolved at runtime.  No addend.  */
11674         /* Fallthrough */
11675       case BFD_RELOC_386_TLS_LE:
11676       case BFD_RELOC_386_TLS_LDO_32:
11677       case BFD_RELOC_386_TLS_LE_32:
11678       case BFD_RELOC_X86_64_DTPOFF32:
11679       case BFD_RELOC_X86_64_DTPOFF64:
11680       case BFD_RELOC_X86_64_TPOFF32:
11681       case BFD_RELOC_X86_64_TPOFF64:
11682         S_SET_THREAD_LOCAL (fixP->fx_addsy);
11683         break;
11684
11685       case BFD_RELOC_386_TLS_DESC_CALL:
11686       case BFD_RELOC_X86_64_TLSDESC_CALL:
11687         value = 0; /* Fully resolved at runtime.  No addend.  */
11688         S_SET_THREAD_LOCAL (fixP->fx_addsy);
11689         fixP->fx_done = 0;
11690         return;
11691
11692       case BFD_RELOC_VTABLE_INHERIT:
11693       case BFD_RELOC_VTABLE_ENTRY:
11694         fixP->fx_done = 0;
11695         return;
11696
11697       default:
11698         break;
11699       }
11700 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)  */
11701   *valP = value;
11702 #endif /* !defined (TE_Mach)  */
11703
11704   /* Are we finished with this relocation now?  */
11705   if (fixP->fx_addsy == NULL)
11706     fixP->fx_done = 1;
11707 #if defined (OBJ_COFF) && defined (TE_PE)
11708   else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
11709     {
11710       fixP->fx_done = 0;
11711       /* Remember value for tc_gen_reloc.  */
11712       fixP->fx_addnumber = value;
11713       /* Clear out the frag for now.  */
11714       value = 0;
11715     }
11716 #endif
11717   else if (use_rela_relocations)
11718     {
11719       fixP->fx_no_overflow = 1;
11720       /* Remember value for tc_gen_reloc.  */
11721       fixP->fx_addnumber = value;
11722       value = 0;
11723     }
11724
11725   md_number_to_chars (p, value, fixP->fx_size);
11726 }
11727 \f
11728 const char *
11729 md_atof (int type, char *litP, int *sizeP)
11730 {
11731   /* This outputs the LITTLENUMs in REVERSE order;
11732      in accord with the bigendian 386.  */
11733   return ieee_md_atof (type, litP, sizeP, FALSE);
11734 }
11735 \f
11736 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
11737
11738 static char *
11739 output_invalid (int c)
11740 {
11741   if (ISPRINT (c))
11742     snprintf (output_invalid_buf, sizeof (output_invalid_buf),
11743               "'%c'", c);
11744   else
11745     snprintf (output_invalid_buf, sizeof (output_invalid_buf),
11746               "(0x%x)", (unsigned char) c);
11747   return output_invalid_buf;
11748 }
11749
11750 /* REG_STRING starts *before* REGISTER_PREFIX.  */
11751
11752 static const reg_entry *
11753 parse_real_register (char *reg_string, char **end_op)
11754 {
11755   char *s = reg_string;
11756   char *p;
11757   char reg_name_given[MAX_REG_NAME_SIZE + 1];
11758   const reg_entry *r;
11759
11760   /* Skip possible REGISTER_PREFIX and possible whitespace.  */
11761   if (*s == REGISTER_PREFIX)
11762     ++s;
11763
11764   if (is_space_char (*s))
11765     ++s;
11766
11767   p = reg_name_given;
11768   while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
11769     {
11770       if (p >= reg_name_given + MAX_REG_NAME_SIZE)
11771         return (const reg_entry *) NULL;
11772       s++;
11773     }
11774
11775   /* For naked regs, make sure that we are not dealing with an identifier.
11776      This prevents confusing an identifier like `eax_var' with register
11777      `eax'.  */
11778   if (allow_naked_reg && identifier_chars[(unsigned char) *s])
11779     return (const reg_entry *) NULL;
11780
11781   *end_op = s;
11782
11783   r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
11784
11785   /* Handle floating point regs, allowing spaces in the (i) part.  */
11786   if (r == i386_regtab /* %st is first entry of table  */)
11787     {
11788       if (!cpu_arch_flags.bitfield.cpu8087
11789           && !cpu_arch_flags.bitfield.cpu287
11790           && !cpu_arch_flags.bitfield.cpu387)
11791         return (const reg_entry *) NULL;
11792
11793       if (is_space_char (*s))
11794         ++s;
11795       if (*s == '(')
11796         {
11797           ++s;
11798           if (is_space_char (*s))
11799             ++s;
11800           if (*s >= '0' && *s <= '7')
11801             {
11802               int fpr = *s - '0';
11803               ++s;
11804               if (is_space_char (*s))
11805                 ++s;
11806               if (*s == ')')
11807                 {
11808                   *end_op = s + 1;
11809                   r = (const reg_entry *) hash_find (reg_hash, "st(0)");
11810                   know (r);
11811                   return r + fpr;
11812                 }
11813             }
11814           /* We have "%st(" then garbage.  */
11815           return (const reg_entry *) NULL;
11816         }
11817     }
11818
11819   if (r == NULL || allow_pseudo_reg)
11820     return r;
11821
11822   if (operand_type_all_zero (&r->reg_type))
11823     return (const reg_entry *) NULL;
11824
11825   if ((r->reg_type.bitfield.dword
11826        || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
11827        || r->reg_type.bitfield.class == RegCR
11828        || r->reg_type.bitfield.class == RegDR
11829        || r->reg_type.bitfield.class == RegTR)
11830       && !cpu_arch_flags.bitfield.cpui386)
11831     return (const reg_entry *) NULL;
11832
11833   if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
11834     return (const reg_entry *) NULL;
11835
11836   if (!cpu_arch_flags.bitfield.cpuavx512f)
11837     {
11838       if (r->reg_type.bitfield.zmmword
11839           || r->reg_type.bitfield.class == RegMask)
11840         return (const reg_entry *) NULL;
11841
11842       if (!cpu_arch_flags.bitfield.cpuavx)
11843         {
11844           if (r->reg_type.bitfield.ymmword)
11845             return (const reg_entry *) NULL;
11846
11847           if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
11848             return (const reg_entry *) NULL;
11849         }
11850     }
11851
11852   if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
11853     return (const reg_entry *) NULL;
11854
11855   /* Don't allow fake index register unless allow_index_reg isn't 0. */
11856   if (!allow_index_reg && r->reg_num == RegIZ)
11857     return (const reg_entry *) NULL;
11858
11859   /* Upper 16 vector registers are only available with VREX in 64bit
11860      mode, and require EVEX encoding.  */
11861   if (r->reg_flags & RegVRex)
11862     {
11863       if (!cpu_arch_flags.bitfield.cpuavx512f
11864           || flag_code != CODE_64BIT)
11865         return (const reg_entry *) NULL;
11866
11867       i.vec_encoding = vex_encoding_evex;
11868     }
11869
11870   if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
11871       && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
11872       && flag_code != CODE_64BIT)
11873     return (const reg_entry *) NULL;
11874
11875   if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
11876       && !intel_syntax)
11877     return (const reg_entry *) NULL;
11878
11879   return r;
11880 }
11881
11882 /* REG_STRING starts *before* REGISTER_PREFIX.  */
11883
11884 static const reg_entry *
11885 parse_register (char *reg_string, char **end_op)
11886 {
11887   const reg_entry *r;
11888
11889   if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
11890     r = parse_real_register (reg_string, end_op);
11891   else
11892     r = NULL;
11893   if (!r)
11894     {
11895       char *save = input_line_pointer;
11896       char c;
11897       symbolS *symbolP;
11898
11899       input_line_pointer = reg_string;
11900       c = get_symbol_name (&reg_string);
11901       symbolP = symbol_find (reg_string);
11902       if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
11903         {
11904           const expressionS *e = symbol_get_value_expression (symbolP);
11905
11906           know (e->X_op == O_register);
11907           know (e->X_add_number >= 0
11908                 && (valueT) e->X_add_number < i386_regtab_size);
11909           r = i386_regtab + e->X_add_number;
11910           if ((r->reg_flags & RegVRex))
11911             i.vec_encoding = vex_encoding_evex;
11912           *end_op = input_line_pointer;
11913         }
11914       *input_line_pointer = c;
11915       input_line_pointer = save;
11916     }
11917   return r;
11918 }
11919
11920 int
11921 i386_parse_name (char *name, expressionS *e, char *nextcharP)
11922 {
11923   const reg_entry *r;
11924   char *end = input_line_pointer;
11925
11926   *end = *nextcharP;
11927   r = parse_register (name, &input_line_pointer);
11928   if (r && end <= input_line_pointer)
11929     {
11930       *nextcharP = *input_line_pointer;
11931       *input_line_pointer = 0;
11932       e->X_op = O_register;
11933       e->X_add_number = r - i386_regtab;
11934       return 1;
11935     }
11936   input_line_pointer = end;
11937   *end = 0;
11938   return intel_syntax ? i386_intel_parse_name (name, e) : 0;
11939 }
11940
11941 void
11942 md_operand (expressionS *e)
11943 {
11944   char *end;
11945   const reg_entry *r;
11946
11947   switch (*input_line_pointer)
11948     {
11949     case REGISTER_PREFIX:
11950       r = parse_real_register (input_line_pointer, &end);
11951       if (r)
11952         {
11953           e->X_op = O_register;
11954           e->X_add_number = r - i386_regtab;
11955           input_line_pointer = end;
11956         }
11957       break;
11958
11959     case '[':
11960       gas_assert (intel_syntax);
11961       end = input_line_pointer++;
11962       expression (e);
11963       if (*input_line_pointer == ']')
11964         {
11965           ++input_line_pointer;
11966           e->X_op_symbol = make_expr_symbol (e);
11967           e->X_add_symbol = NULL;
11968           e->X_add_number = 0;
11969           e->X_op = O_index;
11970         }
11971       else
11972         {
11973           e->X_op = O_absent;
11974           input_line_pointer = end;
11975         }
11976       break;
11977     }
11978 }
11979
11980 \f
11981 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11982 const char *md_shortopts = "kVQ:sqnO::";
11983 #else
11984 const char *md_shortopts = "qnO::";
11985 #endif
11986
11987 #define OPTION_32 (OPTION_MD_BASE + 0)
11988 #define OPTION_64 (OPTION_MD_BASE + 1)
11989 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
11990 #define OPTION_MARCH (OPTION_MD_BASE + 3)
11991 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
11992 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
11993 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
11994 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
11995 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
11996 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
11997 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
11998 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
11999 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
12000 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
12001 #define OPTION_X32 (OPTION_MD_BASE + 14)
12002 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
12003 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
12004 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
12005 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
12006 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
12007 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
12008 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
12009 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
12010 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
12011 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
12012 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
12013 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
12014 #define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
12015 #define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
12016 #define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
12017 #define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
12018
12019 struct option md_longopts[] =
12020 {
12021   {"32", no_argument, NULL, OPTION_32},
12022 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12023      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12024   {"64", no_argument, NULL, OPTION_64},
12025 #endif
12026 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12027   {"x32", no_argument, NULL, OPTION_X32},
12028   {"mshared", no_argument, NULL, OPTION_MSHARED},
12029   {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
12030 #endif
12031   {"divide", no_argument, NULL, OPTION_DIVIDE},
12032   {"march", required_argument, NULL, OPTION_MARCH},
12033   {"mtune", required_argument, NULL, OPTION_MTUNE},
12034   {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
12035   {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
12036   {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
12037   {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
12038   {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
12039   {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
12040   {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
12041   {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
12042   {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
12043   {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
12044   {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
12045   {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
12046 # if defined (TE_PE) || defined (TE_PEP)
12047   {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
12048 #endif
12049   {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
12050   {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
12051   {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
12052   {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
12053   {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
12054   {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
12055   {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
12056   {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
12057   {"mamd64", no_argument, NULL, OPTION_MAMD64},
12058   {"mintel64", no_argument, NULL, OPTION_MINTEL64},
12059   {NULL, no_argument, NULL, 0}
12060 };
12061 size_t md_longopts_size = sizeof (md_longopts);
12062
12063 int
12064 md_parse_option (int c, const char *arg)
12065 {
12066   unsigned int j;
12067   char *arch, *next, *saved, *type;
12068
12069   switch (c)
12070     {
12071     case 'n':
12072       optimize_align_code = 0;
12073       break;
12074
12075     case 'q':
12076       quiet_warnings = 1;
12077       break;
12078
12079 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12080       /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
12081          should be emitted or not.  FIXME: Not implemented.  */
12082     case 'Q':
12083       if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
12084         return 0;
12085       break;
12086
12087       /* -V: SVR4 argument to print version ID.  */
12088     case 'V':
12089       print_version_id ();
12090       break;
12091
12092       /* -k: Ignore for FreeBSD compatibility.  */
12093     case 'k':
12094       break;
12095
12096     case 's':
12097       /* -s: On i386 Solaris, this tells the native assembler to use
12098          .stab instead of .stab.excl.  We always use .stab anyhow.  */
12099       break;
12100
12101     case OPTION_MSHARED:
12102       shared = 1;
12103       break;
12104
12105     case OPTION_X86_USED_NOTE:
12106       if (strcasecmp (arg, "yes") == 0)
12107         x86_used_note = 1;
12108       else if (strcasecmp (arg, "no") == 0)
12109         x86_used_note = 0;
12110       else
12111         as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
12112       break;
12113
12114
12115 #endif
12116 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12117      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12118     case OPTION_64:
12119       {
12120         const char **list, **l;
12121
12122         list = bfd_target_list ();
12123         for (l = list; *l != NULL; l++)
12124           if (CONST_STRNEQ (*l, "elf64-x86-64")
12125               || strcmp (*l, "coff-x86-64") == 0
12126               || strcmp (*l, "pe-x86-64") == 0
12127               || strcmp (*l, "pei-x86-64") == 0
12128               || strcmp (*l, "mach-o-x86-64") == 0)
12129             {
12130               default_arch = "x86_64";
12131               break;
12132             }
12133         if (*l == NULL)
12134           as_fatal (_("no compiled in support for x86_64"));
12135         free (list);
12136       }
12137       break;
12138 #endif
12139
12140 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12141     case OPTION_X32:
12142       if (IS_ELF)
12143         {
12144           const char **list, **l;
12145
12146           list = bfd_target_list ();
12147           for (l = list; *l != NULL; l++)
12148             if (CONST_STRNEQ (*l, "elf32-x86-64"))
12149               {
12150                 default_arch = "x86_64:32";
12151                 break;
12152               }
12153           if (*l == NULL)
12154             as_fatal (_("no compiled in support for 32bit x86_64"));
12155           free (list);
12156         }
12157       else
12158         as_fatal (_("32bit x86_64 is only supported for ELF"));
12159       break;
12160 #endif
12161
12162     case OPTION_32:
12163       default_arch = "i386";
12164       break;
12165
12166     case OPTION_DIVIDE:
12167 #ifdef SVR4_COMMENT_CHARS
12168       {
12169         char *n, *t;
12170         const char *s;
12171
12172         n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
12173         t = n;
12174         for (s = i386_comment_chars; *s != '\0'; s++)
12175           if (*s != '/')
12176             *t++ = *s;
12177         *t = '\0';
12178         i386_comment_chars = n;
12179       }
12180 #endif
12181       break;
12182
12183     case OPTION_MARCH:
12184       saved = xstrdup (arg);
12185       arch = saved;
12186       /* Allow -march=+nosse.  */
12187       if (*arch == '+')
12188         arch++;
12189       do
12190         {
12191           if (*arch == '.')
12192             as_fatal (_("invalid -march= option: `%s'"), arg);
12193           next = strchr (arch, '+');
12194           if (next)
12195             *next++ = '\0';
12196           for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12197             {
12198               if (strcmp (arch, cpu_arch [j].name) == 0)
12199                 {
12200                   /* Processor.  */
12201                   if (! cpu_arch[j].flags.bitfield.cpui386)
12202                     continue;
12203
12204                   cpu_arch_name = cpu_arch[j].name;
12205                   cpu_sub_arch_name = NULL;
12206                   cpu_arch_flags = cpu_arch[j].flags;
12207                   cpu_arch_isa = cpu_arch[j].type;
12208                   cpu_arch_isa_flags = cpu_arch[j].flags;
12209                   if (!cpu_arch_tune_set)
12210                     {
12211                       cpu_arch_tune = cpu_arch_isa;
12212                       cpu_arch_tune_flags = cpu_arch_isa_flags;
12213                     }
12214                   break;
12215                 }
12216               else if (*cpu_arch [j].name == '.'
12217                        && strcmp (arch, cpu_arch [j].name + 1) == 0)
12218                 {
12219                   /* ISA extension.  */
12220                   i386_cpu_flags flags;
12221
12222                   flags = cpu_flags_or (cpu_arch_flags,
12223                                         cpu_arch[j].flags);
12224
12225                   if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12226                     {
12227                       if (cpu_sub_arch_name)
12228                         {
12229                           char *name = cpu_sub_arch_name;
12230                           cpu_sub_arch_name = concat (name,
12231                                                       cpu_arch[j].name,
12232                                                       (const char *) NULL);
12233                           free (name);
12234                         }
12235                       else
12236                         cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
12237                       cpu_arch_flags = flags;
12238                       cpu_arch_isa_flags = flags;
12239                     }
12240                   else
12241                     cpu_arch_isa_flags
12242                       = cpu_flags_or (cpu_arch_isa_flags,
12243                                       cpu_arch[j].flags);
12244                   break;
12245                 }
12246             }
12247
12248           if (j >= ARRAY_SIZE (cpu_arch))
12249             {
12250               /* Disable an ISA extension.  */
12251               for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
12252                 if (strcmp (arch, cpu_noarch [j].name) == 0)
12253                   {
12254                     i386_cpu_flags flags;
12255
12256                     flags = cpu_flags_and_not (cpu_arch_flags,
12257                                                cpu_noarch[j].flags);
12258                     if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12259                       {
12260                         if (cpu_sub_arch_name)
12261                           {
12262                             char *name = cpu_sub_arch_name;
12263                             cpu_sub_arch_name = concat (arch,
12264                                                         (const char *) NULL);
12265                             free (name);
12266                           }
12267                         else
12268                           cpu_sub_arch_name = xstrdup (arch);
12269                         cpu_arch_flags = flags;
12270                         cpu_arch_isa_flags = flags;
12271                       }
12272                     break;
12273                   }
12274
12275               if (j >= ARRAY_SIZE (cpu_noarch))
12276                 j = ARRAY_SIZE (cpu_arch);
12277             }
12278
12279           if (j >= ARRAY_SIZE (cpu_arch))
12280             as_fatal (_("invalid -march= option: `%s'"), arg);
12281
12282           arch = next;
12283         }
12284       while (next != NULL);
12285       free (saved);
12286       break;
12287
12288     case OPTION_MTUNE:
12289       if (*arg == '.')
12290         as_fatal (_("invalid -mtune= option: `%s'"), arg);
12291       for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12292         {
12293           if (strcmp (arg, cpu_arch [j].name) == 0)
12294             {
12295               cpu_arch_tune_set = 1;
12296               cpu_arch_tune = cpu_arch [j].type;
12297               cpu_arch_tune_flags = cpu_arch[j].flags;
12298               break;
12299             }
12300         }
12301       if (j >= ARRAY_SIZE (cpu_arch))
12302         as_fatal (_("invalid -mtune= option: `%s'"), arg);
12303       break;
12304
12305     case OPTION_MMNEMONIC:
12306       if (strcasecmp (arg, "att") == 0)
12307         intel_mnemonic = 0;
12308       else if (strcasecmp (arg, "intel") == 0)
12309         intel_mnemonic = 1;
12310       else
12311         as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
12312       break;
12313
12314     case OPTION_MSYNTAX:
12315       if (strcasecmp (arg, "att") == 0)
12316         intel_syntax = 0;
12317       else if (strcasecmp (arg, "intel") == 0)
12318         intel_syntax = 1;
12319       else
12320         as_fatal (_("invalid -msyntax= option: `%s'"), arg);
12321       break;
12322
12323     case OPTION_MINDEX_REG:
12324       allow_index_reg = 1;
12325       break;
12326
12327     case OPTION_MNAKED_REG:
12328       allow_naked_reg = 1;
12329       break;
12330
12331     case OPTION_MSSE2AVX:
12332       sse2avx = 1;
12333       break;
12334
12335     case OPTION_MSSE_CHECK:
12336       if (strcasecmp (arg, "error") == 0)
12337         sse_check = check_error;
12338       else if (strcasecmp (arg, "warning") == 0)
12339         sse_check = check_warning;
12340       else if (strcasecmp (arg, "none") == 0)
12341         sse_check = check_none;
12342       else
12343         as_fatal (_("invalid -msse-check= option: `%s'"), arg);
12344       break;
12345
12346     case OPTION_MOPERAND_CHECK:
12347       if (strcasecmp (arg, "error") == 0)
12348         operand_check = check_error;
12349       else if (strcasecmp (arg, "warning") == 0)
12350         operand_check = check_warning;
12351       else if (strcasecmp (arg, "none") == 0)
12352         operand_check = check_none;
12353       else
12354         as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
12355       break;
12356
12357     case OPTION_MAVXSCALAR:
12358       if (strcasecmp (arg, "128") == 0)
12359         avxscalar = vex128;
12360       else if (strcasecmp (arg, "256") == 0)
12361         avxscalar = vex256;
12362       else
12363         as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
12364       break;
12365
12366     case OPTION_MVEXWIG:
12367       if (strcmp (arg, "0") == 0)
12368         vexwig = vexw0;
12369       else if (strcmp (arg, "1") == 0)
12370         vexwig = vexw1;
12371       else
12372         as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
12373       break;
12374
12375     case OPTION_MADD_BND_PREFIX:
12376       add_bnd_prefix = 1;
12377       break;
12378
12379     case OPTION_MEVEXLIG:
12380       if (strcmp (arg, "128") == 0)
12381         evexlig = evexl128;
12382       else if (strcmp (arg, "256") == 0)
12383         evexlig = evexl256;
12384       else  if (strcmp (arg, "512") == 0)
12385         evexlig = evexl512;
12386       else
12387         as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
12388       break;
12389
12390     case OPTION_MEVEXRCIG:
12391       if (strcmp (arg, "rne") == 0)
12392         evexrcig = rne;
12393       else if (strcmp (arg, "rd") == 0)
12394         evexrcig = rd;
12395       else if (strcmp (arg, "ru") == 0)
12396         evexrcig = ru;
12397       else if (strcmp (arg, "rz") == 0)
12398         evexrcig = rz;
12399       else
12400         as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
12401       break;
12402
12403     case OPTION_MEVEXWIG:
12404       if (strcmp (arg, "0") == 0)
12405         evexwig = evexw0;
12406       else if (strcmp (arg, "1") == 0)
12407         evexwig = evexw1;
12408       else
12409         as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
12410       break;
12411
12412 # if defined (TE_PE) || defined (TE_PEP)
12413     case OPTION_MBIG_OBJ:
12414       use_big_obj = 1;
12415       break;
12416 #endif
12417
12418     case OPTION_MOMIT_LOCK_PREFIX:
12419       if (strcasecmp (arg, "yes") == 0)
12420         omit_lock_prefix = 1;
12421       else if (strcasecmp (arg, "no") == 0)
12422         omit_lock_prefix = 0;
12423       else
12424         as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
12425       break;
12426
12427     case OPTION_MFENCE_AS_LOCK_ADD:
12428       if (strcasecmp (arg, "yes") == 0)
12429         avoid_fence = 1;
12430       else if (strcasecmp (arg, "no") == 0)
12431         avoid_fence = 0;
12432       else
12433         as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
12434       break;
12435
12436     case OPTION_MRELAX_RELOCATIONS:
12437       if (strcasecmp (arg, "yes") == 0)
12438         generate_relax_relocations = 1;
12439       else if (strcasecmp (arg, "no") == 0)
12440         generate_relax_relocations = 0;
12441       else
12442         as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
12443       break;
12444
12445     case OPTION_MALIGN_BRANCH_BOUNDARY:
12446       {
12447         char *end;
12448         long int align = strtoul (arg, &end, 0);
12449         if (*end == '\0')
12450           {
12451             if (align == 0)
12452               {
12453                 align_branch_power = 0;
12454                 break;
12455               }
12456             else if (align >= 16)
12457               {
12458                 int align_power;
12459                 for (align_power = 0;
12460                      (align & 1) == 0;
12461                      align >>= 1, align_power++)
12462                   continue;
12463                 /* Limit alignment power to 31.  */
12464                 if (align == 1 && align_power < 32)
12465                   {
12466                     align_branch_power = align_power;
12467                     break;
12468                   }
12469               }
12470           }
12471         as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
12472       }
12473       break;
12474
12475     case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
12476       {
12477         char *end;
12478         int align = strtoul (arg, &end, 0);
12479         /* Some processors only support 5 prefixes.  */
12480         if (*end == '\0' && align >= 0 && align < 6)
12481           {
12482             align_branch_prefix_size = align;
12483             break;
12484           }
12485         as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
12486                   arg);
12487       }
12488       break;
12489
12490     case OPTION_MALIGN_BRANCH:
12491       align_branch = 0;
12492       saved = xstrdup (arg);
12493       type = saved;
12494       do
12495         {
12496           next = strchr (type, '+');
12497           if (next)
12498             *next++ = '\0';
12499           if (strcasecmp (type, "jcc") == 0)
12500             align_branch |= align_branch_jcc_bit;
12501           else if (strcasecmp (type, "fused") == 0)
12502             align_branch |= align_branch_fused_bit;
12503           else if (strcasecmp (type, "jmp") == 0)
12504             align_branch |= align_branch_jmp_bit;
12505           else if (strcasecmp (type, "call") == 0)
12506             align_branch |= align_branch_call_bit;
12507           else if (strcasecmp (type, "ret") == 0)
12508             align_branch |= align_branch_ret_bit;
12509           else if (strcasecmp (type, "indirect") == 0)
12510             align_branch |= align_branch_indirect_bit;
12511           else
12512             as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
12513           type = next;
12514         }
12515       while (next != NULL);
12516       free (saved);
12517       break;
12518
12519     case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
12520       align_branch_power = 5;
12521       align_branch_prefix_size = 5;
12522       align_branch = (align_branch_jcc_bit
12523                       | align_branch_fused_bit
12524                       | align_branch_jmp_bit);
12525       break;
12526
12527     case OPTION_MAMD64:
12528       intel64 = 0;
12529       break;
12530
12531     case OPTION_MINTEL64:
12532       intel64 = 1;
12533       break;
12534
12535     case 'O':
12536       if (arg == NULL)
12537         {
12538           optimize = 1;
12539           /* Turn off -Os.  */
12540           optimize_for_space = 0;
12541         }
12542       else if (*arg == 's')
12543         {
12544           optimize_for_space = 1;
12545           /* Turn on all encoding optimizations.  */
12546           optimize = INT_MAX;
12547         }
12548       else
12549         {
12550           optimize = atoi (arg);
12551           /* Turn off -Os.  */
12552           optimize_for_space = 0;
12553         }
12554       break;
12555
12556     default:
12557       return 0;
12558     }
12559   return 1;
12560 }
12561
12562 #define MESSAGE_TEMPLATE \
12563 "                                                                                "
12564
12565 static char *
12566 output_message (FILE *stream, char *p, char *message, char *start,
12567                 int *left_p, const char *name, int len)
12568 {
12569   int size = sizeof (MESSAGE_TEMPLATE);
12570   int left = *left_p;
12571
12572   /* Reserve 2 spaces for ", " or ",\0" */
12573   left -= len + 2;
12574
12575   /* Check if there is any room.  */
12576   if (left >= 0)
12577     {
12578       if (p != start)
12579         {
12580           *p++ = ',';
12581           *p++ = ' ';
12582         }
12583       p = mempcpy (p, name, len);
12584     }
12585   else
12586     {
12587       /* Output the current message now and start a new one.  */
12588       *p++ = ',';
12589       *p = '\0';
12590       fprintf (stream, "%s\n", message);
12591       p = start;
12592       left = size - (start - message) - len - 2;
12593
12594       gas_assert (left >= 0);
12595
12596       p = mempcpy (p, name, len);
12597     }
12598
12599   *left_p = left;
12600   return p;
12601 }
12602
12603 static void
12604 show_arch (FILE *stream, int ext, int check)
12605 {
12606   static char message[] = MESSAGE_TEMPLATE;
12607   char *start = message + 27;
12608   char *p;
12609   int size = sizeof (MESSAGE_TEMPLATE);
12610   int left;
12611   const char *name;
12612   int len;
12613   unsigned int j;
12614
12615   p = start;
12616   left = size - (start - message);
12617   for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12618     {
12619       /* Should it be skipped?  */
12620       if (cpu_arch [j].skip)
12621         continue;
12622
12623       name = cpu_arch [j].name;
12624       len = cpu_arch [j].len;
12625       if (*name == '.')
12626         {
12627           /* It is an extension.  Skip if we aren't asked to show it.  */
12628           if (ext)
12629             {
12630               name++;
12631               len--;
12632             }
12633           else
12634             continue;
12635         }
12636       else if (ext)
12637         {
12638           /* It is an processor.  Skip if we show only extension.  */
12639           continue;
12640         }
12641       else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
12642         {
12643           /* It is an impossible processor - skip.  */
12644           continue;
12645         }
12646
12647       p = output_message (stream, p, message, start, &left, name, len);
12648     }
12649
12650   /* Display disabled extensions.  */
12651   if (ext)
12652     for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
12653       {
12654         name = cpu_noarch [j].name;
12655         len = cpu_noarch [j].len;
12656         p = output_message (stream, p, message, start, &left, name,
12657                             len);
12658       }
12659
12660   *p = '\0';
12661   fprintf (stream, "%s\n", message);
12662 }
12663
12664 void
12665 md_show_usage (FILE *stream)
12666 {
12667 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12668   fprintf (stream, _("\
12669   -Qy, -Qn                ignored\n\
12670   -V                      print assembler version number\n\
12671   -k                      ignored\n"));
12672 #endif
12673   fprintf (stream, _("\
12674   -n                      Do not optimize code alignment\n\
12675   -q                      quieten some warnings\n"));
12676 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12677   fprintf (stream, _("\
12678   -s                      ignored\n"));
12679 #endif
12680 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12681                       || defined (TE_PE) || defined (TE_PEP))
12682   fprintf (stream, _("\
12683   --32/--64/--x32         generate 32bit/64bit/x32 code\n"));
12684 #endif
12685 #ifdef SVR4_COMMENT_CHARS
12686   fprintf (stream, _("\
12687   --divide                do not treat `/' as a comment character\n"));
12688 #else
12689   fprintf (stream, _("\
12690   --divide                ignored\n"));
12691 #endif
12692   fprintf (stream, _("\
12693   -march=CPU[,+EXTENSION...]\n\
12694                           generate code for CPU and EXTENSION, CPU is one of:\n"));
12695   show_arch (stream, 0, 1);
12696   fprintf (stream, _("\
12697                           EXTENSION is combination of:\n"));
12698   show_arch (stream, 1, 0);
12699   fprintf (stream, _("\
12700   -mtune=CPU              optimize for CPU, CPU is one of:\n"));
12701   show_arch (stream, 0, 0);
12702   fprintf (stream, _("\
12703   -msse2avx               encode SSE instructions with VEX prefix\n"));
12704   fprintf (stream, _("\
12705   -msse-check=[none|error|warning] (default: warning)\n\
12706                           check SSE instructions\n"));
12707   fprintf (stream, _("\
12708   -moperand-check=[none|error|warning] (default: warning)\n\
12709                           check operand combinations for validity\n"));
12710   fprintf (stream, _("\
12711   -mavxscalar=[128|256] (default: 128)\n\
12712                           encode scalar AVX instructions with specific vector\n\
12713                            length\n"));
12714   fprintf (stream, _("\
12715   -mvexwig=[0|1] (default: 0)\n\
12716                           encode VEX instructions with specific VEX.W value\n\
12717                            for VEX.W bit ignored instructions\n"));
12718   fprintf (stream, _("\
12719   -mevexlig=[128|256|512] (default: 128)\n\
12720                           encode scalar EVEX instructions with specific vector\n\
12721                            length\n"));
12722   fprintf (stream, _("\
12723   -mevexwig=[0|1] (default: 0)\n\
12724                           encode EVEX instructions with specific EVEX.W value\n\
12725                            for EVEX.W bit ignored instructions\n"));
12726   fprintf (stream, _("\
12727   -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
12728                           encode EVEX instructions with specific EVEX.RC value\n\
12729                            for SAE-only ignored instructions\n"));
12730   fprintf (stream, _("\
12731   -mmnemonic=[att|intel] "));
12732   if (SYSV386_COMPAT)
12733     fprintf (stream, _("(default: att)\n"));
12734   else
12735     fprintf (stream, _("(default: intel)\n"));
12736   fprintf (stream, _("\
12737                           use AT&T/Intel mnemonic\n"));
12738   fprintf (stream, _("\
12739   -msyntax=[att|intel] (default: att)\n\
12740                           use AT&T/Intel syntax\n"));
12741   fprintf (stream, _("\
12742   -mindex-reg             support pseudo index registers\n"));
12743   fprintf (stream, _("\
12744   -mnaked-reg             don't require `%%' prefix for registers\n"));
12745   fprintf (stream, _("\
12746   -madd-bnd-prefix        add BND prefix for all valid branches\n"));
12747 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12748   fprintf (stream, _("\
12749   -mshared                disable branch optimization for shared code\n"));
12750   fprintf (stream, _("\
12751   -mx86-used-note=[no|yes] "));
12752   if (DEFAULT_X86_USED_NOTE)
12753     fprintf (stream, _("(default: yes)\n"));
12754   else
12755     fprintf (stream, _("(default: no)\n"));
12756   fprintf (stream, _("\
12757                           generate x86 used ISA and feature properties\n"));
12758 #endif
12759 #if defined (TE_PE) || defined (TE_PEP)
12760   fprintf (stream, _("\
12761   -mbig-obj               generate big object files\n"));
12762 #endif
12763   fprintf (stream, _("\
12764   -momit-lock-prefix=[no|yes] (default: no)\n\
12765                           strip all lock prefixes\n"));
12766   fprintf (stream, _("\
12767   -mfence-as-lock-add=[no|yes] (default: no)\n\
12768                           encode lfence, mfence and sfence as\n\
12769                            lock addl $0x0, (%%{re}sp)\n"));
12770   fprintf (stream, _("\
12771   -mrelax-relocations=[no|yes] "));
12772   if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
12773     fprintf (stream, _("(default: yes)\n"));
12774   else
12775     fprintf (stream, _("(default: no)\n"));
12776   fprintf (stream, _("\
12777                           generate relax relocations\n"));
12778   fprintf (stream, _("\
12779   -malign-branch-boundary=NUM (default: 0)\n\
12780                           align branches within NUM byte boundary\n"));
12781   fprintf (stream, _("\
12782   -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
12783                           TYPE is combination of jcc, fused, jmp, call, ret,\n\
12784                            indirect\n\
12785                           specify types of branches to align\n"));
12786   fprintf (stream, _("\
12787   -malign-branch-prefix-size=NUM (default: 5)\n\
12788                           align branches with NUM prefixes per instruction\n"));
12789   fprintf (stream, _("\
12790   -mbranches-within-32B-boundaries\n\
12791                           align branches within 32 byte boundary\n"));
12792   fprintf (stream, _("\
12793   -mamd64                 accept only AMD64 ISA [default]\n"));
12794   fprintf (stream, _("\
12795   -mintel64               accept only Intel64 ISA\n"));
12796 }
12797
12798 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
12799      || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12800      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12801
12802 /* Pick the target format to use.  */
12803
12804 const char *
12805 i386_target_format (void)
12806 {
12807   if (!strncmp (default_arch, "x86_64", 6))
12808     {
12809       update_code_flag (CODE_64BIT, 1);
12810       if (default_arch[6] == '\0')
12811         x86_elf_abi = X86_64_ABI;
12812       else
12813         x86_elf_abi = X86_64_X32_ABI;
12814     }
12815   else if (!strcmp (default_arch, "i386"))
12816     update_code_flag (CODE_32BIT, 1);
12817   else if (!strcmp (default_arch, "iamcu"))
12818     {
12819       update_code_flag (CODE_32BIT, 1);
12820       if (cpu_arch_isa == PROCESSOR_UNKNOWN)
12821         {
12822           static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
12823           cpu_arch_name = "iamcu";
12824           cpu_sub_arch_name = NULL;
12825           cpu_arch_flags = iamcu_flags;
12826           cpu_arch_isa = PROCESSOR_IAMCU;
12827           cpu_arch_isa_flags = iamcu_flags;
12828           if (!cpu_arch_tune_set)
12829             {
12830               cpu_arch_tune = cpu_arch_isa;
12831               cpu_arch_tune_flags = cpu_arch_isa_flags;
12832             }
12833         }
12834       else if (cpu_arch_isa != PROCESSOR_IAMCU)
12835         as_fatal (_("Intel MCU doesn't support `%s' architecture"),
12836                   cpu_arch_name);
12837     }
12838   else
12839     as_fatal (_("unknown architecture"));
12840
12841   if (cpu_flags_all_zero (&cpu_arch_isa_flags))
12842     cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
12843   if (cpu_flags_all_zero (&cpu_arch_tune_flags))
12844     cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
12845
12846   switch (OUTPUT_FLAVOR)
12847     {
12848 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
12849     case bfd_target_aout_flavour:
12850       return AOUT_TARGET_FORMAT;
12851 #endif
12852 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
12853 # if defined (TE_PE) || defined (TE_PEP)
12854     case bfd_target_coff_flavour:
12855       if (flag_code == CODE_64BIT)
12856         return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
12857       else
12858         return "pe-i386";
12859 # elif defined (TE_GO32)
12860     case bfd_target_coff_flavour:
12861       return "coff-go32";
12862 # else
12863     case bfd_target_coff_flavour:
12864       return "coff-i386";
12865 # endif
12866 #endif
12867 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
12868     case bfd_target_elf_flavour:
12869       {
12870         const char *format;
12871
12872         switch (x86_elf_abi)
12873           {
12874           default:
12875             format = ELF_TARGET_FORMAT;
12876 #ifndef TE_SOLARIS
12877             tls_get_addr = "___tls_get_addr";
12878 #endif
12879             break;
12880           case X86_64_ABI:
12881             use_rela_relocations = 1;
12882             object_64bit = 1;
12883 #ifndef TE_SOLARIS
12884             tls_get_addr = "__tls_get_addr";
12885 #endif
12886             format = ELF_TARGET_FORMAT64;
12887             break;
12888           case X86_64_X32_ABI:
12889             use_rela_relocations = 1;
12890             object_64bit = 1;
12891 #ifndef TE_SOLARIS
12892             tls_get_addr = "__tls_get_addr";
12893 #endif
12894             disallow_64bit_reloc = 1;
12895             format = ELF_TARGET_FORMAT32;
12896             break;
12897           }
12898         if (cpu_arch_isa == PROCESSOR_L1OM)
12899           {
12900             if (x86_elf_abi != X86_64_ABI)
12901               as_fatal (_("Intel L1OM is 64bit only"));
12902             return ELF_TARGET_L1OM_FORMAT;
12903           }
12904         else if (cpu_arch_isa == PROCESSOR_K1OM)
12905           {
12906             if (x86_elf_abi != X86_64_ABI)
12907               as_fatal (_("Intel K1OM is 64bit only"));
12908             return ELF_TARGET_K1OM_FORMAT;
12909           }
12910         else if (cpu_arch_isa == PROCESSOR_IAMCU)
12911           {
12912             if (x86_elf_abi != I386_ABI)
12913               as_fatal (_("Intel MCU is 32bit only"));
12914             return ELF_TARGET_IAMCU_FORMAT;
12915           }
12916         else
12917           return format;
12918       }
12919 #endif
12920 #if defined (OBJ_MACH_O)
12921     case bfd_target_mach_o_flavour:
12922       if (flag_code == CODE_64BIT)
12923         {
12924           use_rela_relocations = 1;
12925           object_64bit = 1;
12926           return "mach-o-x86-64";
12927         }
12928       else
12929         return "mach-o-i386";
12930 #endif
12931     default:
12932       abort ();
12933       return NULL;
12934     }
12935 }
12936
12937 #endif /* OBJ_MAYBE_ more than one  */
12938 \f
12939 symbolS *
12940 md_undefined_symbol (char *name)
12941 {
12942   if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
12943       && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
12944       && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
12945       && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
12946     {
12947       if (!GOT_symbol)
12948         {
12949           if (symbol_find (name))
12950             as_bad (_("GOT already in symbol table"));
12951           GOT_symbol = symbol_new (name, undefined_section,
12952                                    (valueT) 0, &zero_address_frag);
12953         };
12954       return GOT_symbol;
12955     }
12956   return 0;
12957 }
12958
12959 /* Round up a section size to the appropriate boundary.  */
12960
12961 valueT
12962 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
12963 {
12964 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
12965   if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
12966     {
12967       /* For a.out, force the section size to be aligned.  If we don't do
12968          this, BFD will align it for us, but it will not write out the
12969          final bytes of the section.  This may be a bug in BFD, but it is
12970          easier to fix it here since that is how the other a.out targets
12971          work.  */
12972       int align;
12973
12974       align = bfd_section_alignment (segment);
12975       size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
12976     }
12977 #endif
12978
12979   return size;
12980 }
12981
12982 /* On the i386, PC-relative offsets are relative to the start of the
12983    next instruction.  That is, the address of the offset, plus its
12984    size, since the offset is always the last part of the insn.  */
12985
12986 long
12987 md_pcrel_from (fixS *fixP)
12988 {
12989   return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
12990 }
12991
12992 #ifndef I386COFF
12993
12994 static void
12995 s_bss (int ignore ATTRIBUTE_UNUSED)
12996 {
12997   int temp;
12998
12999 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13000   if (IS_ELF)
13001     obj_elf_section_change_hook ();
13002 #endif
13003   temp = get_absolute_expression ();
13004   subseg_set (bss_section, (subsegT) temp);
13005   demand_empty_rest_of_line ();
13006 }
13007
13008 #endif
13009
13010 /* Remember constant directive.  */
13011
13012 void
13013 i386_cons_align (int ignore ATTRIBUTE_UNUSED)
13014 {
13015   if (last_insn.kind != last_insn_directive
13016       && (bfd_section_flags (now_seg) & SEC_CODE))
13017     {
13018       last_insn.seg = now_seg;
13019       last_insn.kind = last_insn_directive;
13020       last_insn.name = "constant directive";
13021       last_insn.file = as_where (&last_insn.line);
13022     }
13023 }
13024
13025 void
13026 i386_validate_fix (fixS *fixp)
13027 {
13028   if (fixp->fx_subsy)
13029     {
13030       if (fixp->fx_subsy == GOT_symbol)
13031         {
13032           if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
13033             {
13034               if (!object_64bit)
13035                 abort ();
13036 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13037               if (fixp->fx_tcbit2)
13038                 fixp->fx_r_type = (fixp->fx_tcbit
13039                                    ? BFD_RELOC_X86_64_REX_GOTPCRELX
13040                                    : BFD_RELOC_X86_64_GOTPCRELX);
13041               else
13042 #endif
13043                 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
13044             }
13045           else
13046             {
13047               if (!object_64bit)
13048                 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
13049               else
13050                 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
13051             }
13052           fixp->fx_subsy = 0;
13053         }
13054     }
13055 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13056   else if (!object_64bit)
13057     {
13058       if (fixp->fx_r_type == BFD_RELOC_386_GOT32
13059           && fixp->fx_tcbit2)
13060         fixp->fx_r_type = BFD_RELOC_386_GOT32X;
13061     }
13062 #endif
13063 }
13064
13065 arelent *
13066 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
13067 {
13068   arelent *rel;
13069   bfd_reloc_code_real_type code;
13070
13071   switch (fixp->fx_r_type)
13072     {
13073 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13074     case BFD_RELOC_SIZE32:
13075     case BFD_RELOC_SIZE64:
13076       if (S_IS_DEFINED (fixp->fx_addsy)
13077           && !S_IS_EXTERNAL (fixp->fx_addsy))
13078         {
13079           /* Resolve size relocation against local symbol to size of
13080              the symbol plus addend.  */
13081           valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
13082           if (fixp->fx_r_type == BFD_RELOC_SIZE32
13083               && !fits_in_unsigned_long (value))
13084             as_bad_where (fixp->fx_file, fixp->fx_line,
13085                           _("symbol size computation overflow"));
13086           fixp->fx_addsy = NULL;
13087           fixp->fx_subsy = NULL;
13088           md_apply_fix (fixp, (valueT *) &value, NULL);
13089           return NULL;
13090         }
13091 #endif
13092       /* Fall through.  */
13093
13094     case BFD_RELOC_X86_64_PLT32:
13095     case BFD_RELOC_X86_64_GOT32:
13096     case BFD_RELOC_X86_64_GOTPCREL:
13097     case BFD_RELOC_X86_64_GOTPCRELX:
13098     case BFD_RELOC_X86_64_REX_GOTPCRELX:
13099     case BFD_RELOC_386_PLT32:
13100     case BFD_RELOC_386_GOT32:
13101     case BFD_RELOC_386_GOT32X:
13102     case BFD_RELOC_386_GOTOFF:
13103     case BFD_RELOC_386_GOTPC:
13104     case BFD_RELOC_386_TLS_GD:
13105     case BFD_RELOC_386_TLS_LDM:
13106     case BFD_RELOC_386_TLS_LDO_32:
13107     case BFD_RELOC_386_TLS_IE_32:
13108     case BFD_RELOC_386_TLS_IE:
13109     case BFD_RELOC_386_TLS_GOTIE:
13110     case BFD_RELOC_386_TLS_LE_32:
13111     case BFD_RELOC_386_TLS_LE:
13112     case BFD_RELOC_386_TLS_GOTDESC:
13113     case BFD_RELOC_386_TLS_DESC_CALL:
13114     case BFD_RELOC_X86_64_TLSGD:
13115     case BFD_RELOC_X86_64_TLSLD:
13116     case BFD_RELOC_X86_64_DTPOFF32:
13117     case BFD_RELOC_X86_64_DTPOFF64:
13118     case BFD_RELOC_X86_64_GOTTPOFF:
13119     case BFD_RELOC_X86_64_TPOFF32:
13120     case BFD_RELOC_X86_64_TPOFF64:
13121     case BFD_RELOC_X86_64_GOTOFF64:
13122     case BFD_RELOC_X86_64_GOTPC32:
13123     case BFD_RELOC_X86_64_GOT64:
13124     case BFD_RELOC_X86_64_GOTPCREL64:
13125     case BFD_RELOC_X86_64_GOTPC64:
13126     case BFD_RELOC_X86_64_GOTPLT64:
13127     case BFD_RELOC_X86_64_PLTOFF64:
13128     case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13129     case BFD_RELOC_X86_64_TLSDESC_CALL:
13130     case BFD_RELOC_RVA:
13131     case BFD_RELOC_VTABLE_ENTRY:
13132     case BFD_RELOC_VTABLE_INHERIT:
13133 #ifdef TE_PE
13134     case BFD_RELOC_32_SECREL:
13135 #endif
13136       code = fixp->fx_r_type;
13137       break;
13138     case BFD_RELOC_X86_64_32S:
13139       if (!fixp->fx_pcrel)
13140         {
13141           /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32.  */
13142           code = fixp->fx_r_type;
13143           break;
13144         }
13145       /* Fall through.  */
13146     default:
13147       if (fixp->fx_pcrel)
13148         {
13149           switch (fixp->fx_size)
13150             {
13151             default:
13152               as_bad_where (fixp->fx_file, fixp->fx_line,
13153                             _("can not do %d byte pc-relative relocation"),
13154                             fixp->fx_size);
13155               code = BFD_RELOC_32_PCREL;
13156               break;
13157             case 1: code = BFD_RELOC_8_PCREL;  break;
13158             case 2: code = BFD_RELOC_16_PCREL; break;
13159             case 4: code = BFD_RELOC_32_PCREL; break;
13160 #ifdef BFD64
13161             case 8: code = BFD_RELOC_64_PCREL; break;
13162 #endif
13163             }
13164         }
13165       else
13166         {
13167           switch (fixp->fx_size)
13168             {
13169             default:
13170               as_bad_where (fixp->fx_file, fixp->fx_line,
13171                             _("can not do %d byte relocation"),
13172                             fixp->fx_size);
13173               code = BFD_RELOC_32;
13174               break;
13175             case 1: code = BFD_RELOC_8;  break;
13176             case 2: code = BFD_RELOC_16; break;
13177             case 4: code = BFD_RELOC_32; break;
13178 #ifdef BFD64
13179             case 8: code = BFD_RELOC_64; break;
13180 #endif
13181             }
13182         }
13183       break;
13184     }
13185
13186   if ((code == BFD_RELOC_32
13187        || code == BFD_RELOC_32_PCREL
13188        || code == BFD_RELOC_X86_64_32S)
13189       && GOT_symbol
13190       && fixp->fx_addsy == GOT_symbol)
13191     {
13192       if (!object_64bit)
13193         code = BFD_RELOC_386_GOTPC;
13194       else
13195         code = BFD_RELOC_X86_64_GOTPC32;
13196     }
13197   if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
13198       && GOT_symbol
13199       && fixp->fx_addsy == GOT_symbol)
13200     {
13201       code = BFD_RELOC_X86_64_GOTPC64;
13202     }
13203
13204   rel = XNEW (arelent);
13205   rel->sym_ptr_ptr = XNEW (asymbol *);
13206   *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
13207
13208   rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
13209
13210   if (!use_rela_relocations)
13211     {
13212       /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
13213          vtable entry to be used in the relocation's section offset.  */
13214       if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
13215         rel->address = fixp->fx_offset;
13216 #if defined (OBJ_COFF) && defined (TE_PE)
13217       else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
13218         rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
13219       else
13220 #endif
13221       rel->addend = 0;
13222     }
13223   /* Use the rela in 64bit mode.  */
13224   else
13225     {
13226       if (disallow_64bit_reloc)
13227         switch (code)
13228           {
13229           case BFD_RELOC_X86_64_DTPOFF64:
13230           case BFD_RELOC_X86_64_TPOFF64:
13231           case BFD_RELOC_64_PCREL:
13232           case BFD_RELOC_X86_64_GOTOFF64:
13233           case BFD_RELOC_X86_64_GOT64:
13234           case BFD_RELOC_X86_64_GOTPCREL64:
13235           case BFD_RELOC_X86_64_GOTPC64:
13236           case BFD_RELOC_X86_64_GOTPLT64:
13237           case BFD_RELOC_X86_64_PLTOFF64:
13238             as_bad_where (fixp->fx_file, fixp->fx_line,
13239                           _("cannot represent relocation type %s in x32 mode"),
13240                           bfd_get_reloc_code_name (code));
13241             break;
13242           default:
13243             break;
13244           }
13245
13246       if (!fixp->fx_pcrel)
13247         rel->addend = fixp->fx_offset;
13248       else
13249         switch (code)
13250           {
13251           case BFD_RELOC_X86_64_PLT32:
13252           case BFD_RELOC_X86_64_GOT32:
13253           case BFD_RELOC_X86_64_GOTPCREL:
13254           case BFD_RELOC_X86_64_GOTPCRELX:
13255           case BFD_RELOC_X86_64_REX_GOTPCRELX:
13256           case BFD_RELOC_X86_64_TLSGD:
13257           case BFD_RELOC_X86_64_TLSLD:
13258           case BFD_RELOC_X86_64_GOTTPOFF:
13259           case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13260           case BFD_RELOC_X86_64_TLSDESC_CALL:
13261             rel->addend = fixp->fx_offset - fixp->fx_size;
13262             break;
13263           default:
13264             rel->addend = (section->vma
13265                            - fixp->fx_size
13266                            + fixp->fx_addnumber
13267                            + md_pcrel_from (fixp));
13268             break;
13269           }
13270     }
13271
13272   rel->howto = bfd_reloc_type_lookup (stdoutput, code);
13273   if (rel->howto == NULL)
13274     {
13275       as_bad_where (fixp->fx_file, fixp->fx_line,
13276                     _("cannot represent relocation type %s"),
13277                     bfd_get_reloc_code_name (code));
13278       /* Set howto to a garbage value so that we can keep going.  */
13279       rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
13280       gas_assert (rel->howto != NULL);
13281     }
13282
13283   return rel;
13284 }
13285
13286 #include "tc-i386-intel.c"
13287
13288 void
13289 tc_x86_parse_to_dw2regnum (expressionS *exp)
13290 {
13291   int saved_naked_reg;
13292   char saved_register_dot;
13293
13294   saved_naked_reg = allow_naked_reg;
13295   allow_naked_reg = 1;
13296   saved_register_dot = register_chars['.'];
13297   register_chars['.'] = '.';
13298   allow_pseudo_reg = 1;
13299   expression_and_evaluate (exp);
13300   allow_pseudo_reg = 0;
13301   register_chars['.'] = saved_register_dot;
13302   allow_naked_reg = saved_naked_reg;
13303
13304   if (exp->X_op == O_register && exp->X_add_number >= 0)
13305     {
13306       if ((addressT) exp->X_add_number < i386_regtab_size)
13307         {
13308           exp->X_op = O_constant;
13309           exp->X_add_number = i386_regtab[exp->X_add_number]
13310                               .dw2_regnum[flag_code >> 1];
13311         }
13312       else
13313         exp->X_op = O_illegal;
13314     }
13315 }
13316
13317 void
13318 tc_x86_frame_initial_instructions (void)
13319 {
13320   static unsigned int sp_regno[2];
13321
13322   if (!sp_regno[flag_code >> 1])
13323     {
13324       char *saved_input = input_line_pointer;
13325       char sp[][4] = {"esp", "rsp"};
13326       expressionS exp;
13327
13328       input_line_pointer = sp[flag_code >> 1];
13329       tc_x86_parse_to_dw2regnum (&exp);
13330       gas_assert (exp.X_op == O_constant);
13331       sp_regno[flag_code >> 1] = exp.X_add_number;
13332       input_line_pointer = saved_input;
13333     }
13334
13335   cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
13336   cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
13337 }
13338
13339 int
13340 x86_dwarf2_addr_size (void)
13341 {
13342 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
13343   if (x86_elf_abi == X86_64_X32_ABI)
13344     return 4;
13345 #endif
13346   return bfd_arch_bits_per_address (stdoutput) / 8;
13347 }
13348
13349 int
13350 i386_elf_section_type (const char *str, size_t len)
13351 {
13352   if (flag_code == CODE_64BIT
13353       && len == sizeof ("unwind") - 1
13354       && strncmp (str, "unwind", 6) == 0)
13355     return SHT_X86_64_UNWIND;
13356
13357   return -1;
13358 }
13359
13360 #ifdef TE_SOLARIS
13361 void
13362 i386_solaris_fix_up_eh_frame (segT sec)
13363 {
13364   if (flag_code == CODE_64BIT)
13365     elf_section_type (sec) = SHT_X86_64_UNWIND;
13366 }
13367 #endif
13368
13369 #ifdef TE_PE
13370 void
13371 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
13372 {
13373   expressionS exp;
13374
13375   exp.X_op = O_secrel;
13376   exp.X_add_symbol = symbol;
13377   exp.X_add_number = 0;
13378   emit_expr (&exp, size);
13379 }
13380 #endif
13381
13382 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13383 /* For ELF on x86-64, add support for SHF_X86_64_LARGE.  */
13384
13385 bfd_vma
13386 x86_64_section_letter (int letter, const char **ptr_msg)
13387 {
13388   if (flag_code == CODE_64BIT)
13389     {
13390       if (letter == 'l')
13391         return SHF_X86_64_LARGE;
13392
13393       *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
13394     }
13395   else
13396     *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
13397   return -1;
13398 }
13399
13400 bfd_vma
13401 x86_64_section_word (char *str, size_t len)
13402 {
13403   if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
13404     return SHF_X86_64_LARGE;
13405
13406   return -1;
13407 }
13408
13409 static void
13410 handle_large_common (int small ATTRIBUTE_UNUSED)
13411 {
13412   if (flag_code != CODE_64BIT)
13413     {
13414       s_comm_internal (0, elf_common_parse);
13415       as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
13416     }
13417   else
13418     {
13419       static segT lbss_section;
13420       asection *saved_com_section_ptr = elf_com_section_ptr;
13421       asection *saved_bss_section = bss_section;
13422
13423       if (lbss_section == NULL)
13424         {
13425           flagword applicable;
13426           segT seg = now_seg;
13427           subsegT subseg = now_subseg;
13428
13429           /* The .lbss section is for local .largecomm symbols.  */
13430           lbss_section = subseg_new (".lbss", 0);
13431           applicable = bfd_applicable_section_flags (stdoutput);
13432           bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
13433           seg_info (lbss_section)->bss = 1;
13434
13435           subseg_set (seg, subseg);
13436         }
13437
13438       elf_com_section_ptr = &_bfd_elf_large_com_section;
13439       bss_section = lbss_section;
13440
13441       s_comm_internal (0, elf_common_parse);
13442
13443       elf_com_section_ptr = saved_com_section_ptr;
13444       bss_section = saved_bss_section;
13445     }
13446 }
13447 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */