]> git.ipfire.org Git - thirdparty/binutils-gdb.git/blame - gas/config/tc-i386.c
Changed ld and gas BPF tests
[thirdparty/binutils-gdb.git] / gas / config / tc-i386.c
CommitLineData
b534c6d3 1/* tc-i386.c -- Assemble code for the Intel 80386
d87bef3a 2 Copyright (C) 1989-2023 Free Software Foundation, Inc.
252b5132
RH
3
4 This file is part of GAS, the GNU Assembler.
5
6 GAS is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
ec2655a6 8 the Free Software Foundation; either version 3, or (at your option)
252b5132
RH
9 any later version.
10
11 GAS is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GAS; see the file COPYING. If not, write to the Free
4b4da160
NC
18 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
19 02110-1301, USA. */
252b5132 20
47926f60
KH
21/* Intel 80386 machine specific gas.
22 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
3e73aa7c 23 x86_64 support by Jan Hubicka (jh@suse.cz)
0f10071e 24 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
47926f60
KH
25 Bugs & suggestions are completely welcome. This is free software.
26 Please help us make it better. */
252b5132 27
252b5132 28#include "as.h"
3882b010 29#include "safe-ctype.h"
252b5132 30#include "subsegs.h"
316e2c05 31#include "dwarf2dbg.h"
54cfded0 32#include "dw2gencfi.h"
b52c4ee4
IB
33#include "gen-sframe.h"
34#include "sframe.h"
d2b2c203 35#include "elf/x86-64.h"
40fb9820 36#include "opcodes/i386-init.h"
5c139202 37#include "opcodes/i386-mnem.h"
41fd2579 38#include <limits.h>
41fd2579 39
c3332e24 40#ifndef INFER_ADDR_PREFIX
eecb386c 41#define INFER_ADDR_PREFIX 1
c3332e24
AM
42#endif
43
29b0f896
AM
44#ifndef DEFAULT_ARCH
45#define DEFAULT_ARCH "i386"
246fcdee 46#endif
252b5132 47
edde18a5
AM
48#ifndef INLINE
49#if __GNUC__ >= 2
50#define INLINE __inline__
51#else
52#define INLINE
53#endif
54#endif
55
6305a203
L
56/* Prefixes will be emitted in the order defined below.
57 WAIT_PREFIX must be the first prefix since FWAIT is really is an
58 instruction, and so must come before any prefixes.
59 The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
42164a71 60 REP_PREFIX/HLE_PREFIX, LOCK_PREFIX. */
6305a203
L
61#define WAIT_PREFIX 0
62#define SEG_PREFIX 1
63#define ADDR_PREFIX 2
64#define DATA_PREFIX 3
c32fa91d 65#define REP_PREFIX 4
42164a71 66#define HLE_PREFIX REP_PREFIX
7e8b059b 67#define BND_PREFIX REP_PREFIX
c32fa91d 68#define LOCK_PREFIX 5
4e9ac44a
L
69#define REX_PREFIX 6 /* must come last. */
70#define MAX_PREFIXES 7 /* max prefixes per opcode */
6305a203
L
71
72/* we define the syntax here (modulo base,index,scale syntax) */
73#define REGISTER_PREFIX '%'
74#define IMMEDIATE_PREFIX '$'
75#define ABSOLUTE_PREFIX '*'
76
77/* these are the instruction mnemonic suffixes in AT&T syntax or
78 memory operand size in Intel syntax. */
79#define WORD_MNEM_SUFFIX 'w'
80#define BYTE_MNEM_SUFFIX 'b'
81#define SHORT_MNEM_SUFFIX 's'
82#define LONG_MNEM_SUFFIX 'l'
83#define QWORD_MNEM_SUFFIX 'q'
6305a203
L
84
85#define END_OF_INSN '\0'
86
05909f23
JB
87#define OPERAND_TYPE_NONE { .bitfield = { .class = ClassNone } }
88
79dec6b7
JB
89/* This matches the C -> StaticRounding alias in the opcode table. */
90#define commutative staticrounding
91
6305a203
L
92/*
93 'templates' is for grouping together 'template' structures for opcodes
94 of the same name. This is only used for storing the insns in the grand
95 ole hash table of insns.
96 The templates themselves start at START and range up to (but not including)
97 END.
98 */
99typedef struct
100{
d3ce72d0
NC
101 const insn_template *start;
102 const insn_template *end;
6305a203
L
103}
104templates;
105
106/* 386 operand encoding bytes: see 386 book for details of this. */
107typedef struct
108{
109 unsigned int regmem; /* codes register or memory operand */
110 unsigned int reg; /* codes register operand (or extended opcode) */
111 unsigned int mode; /* how to interpret regmem & reg */
112}
113modrm_byte;
114
115/* x86-64 extension prefix. */
116typedef int rex_byte;
117
6305a203
L
118/* 386 opcode byte to code indirect addressing. */
119typedef struct
120{
121 unsigned base;
122 unsigned index;
123 unsigned scale;
124}
125sib_byte;
126
6305a203
L
127/* x86 arch names, types and features */
128typedef struct
129{
130 const char *name; /* arch name */
6ceeed25
JB
131 unsigned int len:8; /* arch string length */
132 bool skip:1; /* show_arch should skip this. */
6305a203 133 enum processor_type type; /* arch type */
ae89daec
JB
134 i386_cpu_flags enable; /* cpu feature enable flags */
135 i386_cpu_flags disable; /* cpu feature disable flags */
6305a203
L
136}
137arch_entry;
138
78f12dd3 139static void update_code_flag (int, int);
e3bb37b5
L
140static void set_code_flag (int);
141static void set_16bit_gcc_code_flag (int);
142static void set_intel_syntax (int);
1efbbeb4 143static void set_intel_mnemonic (int);
db51cc60 144static void set_allow_index_reg (int);
7bab8ab5 145static void set_check (int);
e3bb37b5 146static void set_cpu_arch (int);
6482c264 147#ifdef TE_PE
e3bb37b5 148static void pe_directive_secrel (int);
145667f8 149static void pe_directive_secidx (int);
6482c264 150#endif
e3bb37b5
L
151static void signed_cons (int);
152static char *output_invalid (int c);
ee86248c
JB
153static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
154 const char *);
155static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
156 const char *);
a7619375 157static int i386_att_operand (char *);
e3bb37b5 158static int i386_intel_operand (char *, int);
ee86248c
JB
159static int i386_intel_simplify (expressionS *);
160static int i386_intel_parse_name (const char *, expressionS *);
e3bb37b5 161static const reg_entry *parse_register (char *, char **);
5317ad2c 162static const char *parse_insn (const char *, char *);
e3bb37b5
L
163static char *parse_operands (char *, const char *);
164static void swap_operands (void);
783c187b 165static void swap_2_operands (unsigned int, unsigned int);
48bcea9f 166static enum flag_code i386_addressing_mode (void);
e3bb37b5 167static void optimize_imm (void);
0de704b9 168static bool optimize_disp (const insn_template *t);
83b16ac6 169static const insn_template *match_template (char);
e3bb37b5
L
170static int check_string (void);
171static int process_suffix (void);
172static int check_byte_reg (void);
173static int check_long_reg (void);
174static int check_qword_reg (void);
175static int check_word_reg (void);
176static int finalize_imm (void);
177static int process_operands (void);
5e042380 178static const reg_entry *build_modrm_byte (void);
e3bb37b5
L
179static void output_insn (void);
180static void output_imm (fragS *, offsetT);
181static void output_disp (fragS *, offsetT);
29b0f896 182#ifndef I386COFF
e3bb37b5 183static void s_bss (int);
252b5132 184#endif
17d4e2a2
L
185#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
186static void handle_large_common (int small ATTRIBUTE_UNUSED);
b4a3a7b4
L
187
188/* GNU_PROPERTY_X86_ISA_1_USED. */
189static unsigned int x86_isa_1_used;
190/* GNU_PROPERTY_X86_FEATURE_2_USED. */
191static unsigned int x86_feature_2_used;
192/* Generate x86 used ISA and feature properties. */
193static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
17d4e2a2 194#endif
252b5132 195
a847613f 196static const char *default_arch = DEFAULT_ARCH;
3e73aa7c 197
8a6fb3f9
JB
198/* parse_register() returns this when a register alias cannot be used. */
199static const reg_entry bad_reg = { "<bad>", OPERAND_TYPE_NONE, 0, 0,
200 { Dw2Inval, Dw2Inval } };
201
34684862 202static const reg_entry *reg_eax;
5e042380
JB
203static const reg_entry *reg_ds;
204static const reg_entry *reg_es;
205static const reg_entry *reg_ss;
6288d05f 206static const reg_entry *reg_st0;
6225c532
JB
207static const reg_entry *reg_k0;
208
c0f3af97
L
209/* VEX prefix. */
210typedef struct
211{
43234a1e
L
212 /* VEX prefix is either 2 byte or 3 byte. EVEX is 4 byte. */
213 unsigned char bytes[4];
c0f3af97
L
214 unsigned int length;
215 /* Destination or source register specifier. */
216 const reg_entry *register_specifier;
217} vex_prefix;
218
252b5132 219/* 'md_assemble ()' gathers together information and puts it into a
47926f60 220 i386_insn. */
252b5132 221
520dc8e8
AM
222union i386_op
223 {
224 expressionS *disps;
225 expressionS *imms;
226 const reg_entry *regs;
227 };
228
a65babc9
L
229enum i386_error
230 {
b4d65f2d 231 no_error, /* Must be first. */
86e026a4 232 operand_size_mismatch,
a65babc9
L
233 operand_type_mismatch,
234 register_type_mismatch,
235 number_of_operands_mismatch,
236 invalid_instruction_suffix,
237 bad_imm4,
a65babc9
L
238 unsupported_with_intel_mnemonic,
239 unsupported_syntax,
6c30d220 240 unsupported,
9db83a32
JB
241 unsupported_on_arch,
242 unsupported_64bit,
260cd341 243 invalid_sib_address,
6c30d220 244 invalid_vsib_address,
7bab8ab5 245 invalid_vector_register_set,
260cd341 246 invalid_tmm_register_set,
0cc78721 247 invalid_dest_and_src_register_set,
43234a1e
L
248 unsupported_vector_index_register,
249 unsupported_broadcast,
43234a1e
L
250 broadcast_needed,
251 unsupported_masking,
252 mask_not_on_destination,
253 no_default_mask,
254 unsupported_rc_sae,
43234a1e 255 invalid_register_operand,
a65babc9
L
256 };
257
252b5132
RH
258struct _i386_insn
259 {
47926f60 260 /* TM holds the template for the insn were currently assembling. */
d3ce72d0 261 insn_template tm;
252b5132 262
7d5e4556
L
263 /* SUFFIX holds the instruction size suffix for byte, word, dword
264 or qword, if given. */
252b5132
RH
265 char suffix;
266
9a182d04
JB
267 /* OPCODE_LENGTH holds the number of base opcode bytes. */
268 unsigned char opcode_length;
269
47926f60 270 /* OPERANDS gives the number of given operands. */
252b5132
RH
271 unsigned int operands;
272
273 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
274 of given register, displacement, memory operands and immediate
47926f60 275 operands. */
252b5132
RH
276 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
277
278 /* TYPES [i] is the type (see above #defines) which tells us how to
520dc8e8 279 use OP[i] for the corresponding operand. */
40fb9820 280 i386_operand_type types[MAX_OPERANDS];
252b5132 281
520dc8e8
AM
282 /* Displacement expression, immediate expression, or register for each
283 operand. */
284 union i386_op op[MAX_OPERANDS];
252b5132 285
3e73aa7c
JH
286 /* Flags for operands. */
287 unsigned int flags[MAX_OPERANDS];
288#define Operand_PCrel 1
c48dadc9 289#define Operand_Mem 2
3e73aa7c 290
252b5132 291 /* Relocation type for operand */
f86103b7 292 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
252b5132 293
252b5132
RH
294 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
295 the base index byte below. */
296 const reg_entry *base_reg;
297 const reg_entry *index_reg;
298 unsigned int log2_scale_factor;
299
300 /* SEG gives the seg_entries of this insn. They are zero unless
47926f60 301 explicit segment overrides are given. */
5e042380 302 const reg_entry *seg[2];
252b5132
RH
303
304 /* PREFIX holds all the given prefix opcodes (usually null).
305 PREFIXES is the number of prefix opcodes. */
306 unsigned int prefixes;
307 unsigned char prefix[MAX_PREFIXES];
308
50128d0c 309 /* Register is in low 3 bits of opcode. */
5b7c81bd 310 bool short_form;
50128d0c 311
6f2f06be 312 /* The operand to a branch insn indicates an absolute branch. */
5b7c81bd 313 bool jumpabsolute;
6f2f06be 314
a4d3acd2
JB
315 /* The operand to a branch insn indicates a far branch. */
316 bool far_branch;
317
9373f275
L
318 /* There is a memory operand of (%dx) which should be only used
319 with input/output instructions. */
320 bool input_output_operand;
321
921eafea
L
322 /* Extended states. */
323 enum
324 {
325 /* Use MMX state. */
326 xstate_mmx = 1 << 0,
327 /* Use XMM state. */
328 xstate_xmm = 1 << 1,
329 /* Use YMM state. */
330 xstate_ymm = 1 << 2 | xstate_xmm,
331 /* Use ZMM state. */
332 xstate_zmm = 1 << 3 | xstate_ymm,
333 /* Use TMM state. */
32930e4e
L
334 xstate_tmm = 1 << 4,
335 /* Use MASK state. */
336 xstate_mask = 1 << 5
921eafea 337 } xstate;
260cd341 338
e379e5f3 339 /* Has GOTPC or TLS relocation. */
5b7c81bd 340 bool has_gotpc_tls_reloc;
e379e5f3 341
252b5132 342 /* RM and SIB are the modrm byte and the sib byte where the
c1e679ec 343 addressing modes of this insn are encoded. */
252b5132 344 modrm_byte rm;
3e73aa7c 345 rex_byte rex;
43234a1e 346 rex_byte vrex;
252b5132 347 sib_byte sib;
c0f3af97 348 vex_prefix vex;
b6169b20 349
6225c532
JB
350 /* Masking attributes.
351
352 The struct describes masking, applied to OPERAND in the instruction.
353 REG is a pointer to the corresponding mask register. ZEROING tells
354 whether merging or zeroing mask is used. */
355 struct Mask_Operation
356 {
357 const reg_entry *reg;
358 unsigned int zeroing;
359 /* The operand where this operation is associated. */
360 unsigned int operand;
361 } mask;
43234a1e
L
362
363 /* Rounding control and SAE attributes. */
ca5312a2
JB
364 struct RC_Operation
365 {
366 enum rc_type
367 {
368 rc_none = -1,
369 rne,
370 rd,
371 ru,
372 rz,
373 saeonly
374 } type;
7063667e
JB
375 /* In Intel syntax the operand modifier form is supposed to be used, but
376 we continue to accept the immediate forms as well. */
377 bool modifier;
ca5312a2 378 } rounding;
43234a1e 379
5273a3cd
JB
380 /* Broadcasting attributes.
381
382 The struct describes broadcasting, applied to OPERAND. TYPE is
383 expresses the broadcast factor. */
384 struct Broadcast_Operation
385 {
0cc78721 386 /* Type of broadcast: {1to2}, {1to4}, {1to8}, {1to16} or {1to32}. */
5273a3cd
JB
387 unsigned int type;
388
389 /* Index of broadcasted operand. */
390 unsigned int operand;
391
392 /* Number of bytes to broadcast. */
393 unsigned int bytes;
394 } broadcast;
43234a1e
L
395
396 /* Compressed disp8*N attribute. */
397 unsigned int memshift;
398
86fa6981
L
399 /* Prefer load or store in encoding. */
400 enum
401 {
402 dir_encoding_default = 0,
403 dir_encoding_load,
64c49ab3
JB
404 dir_encoding_store,
405 dir_encoding_swap
86fa6981 406 } dir_encoding;
891edac4 407
41eb8e88 408 /* Prefer 8bit, 16bit, 32bit displacement in encoding. */
a501d77e
L
409 enum
410 {
411 disp_encoding_default = 0,
412 disp_encoding_8bit,
41eb8e88 413 disp_encoding_16bit,
a501d77e
L
414 disp_encoding_32bit
415 } disp_encoding;
f8a5c266 416
6b6b6807 417 /* Prefer the REX byte in encoding. */
5b7c81bd 418 bool rex_encoding;
6b6b6807 419
b6f8c7c4 420 /* Disable instruction size optimization. */
5b7c81bd 421 bool no_optimize;
b6f8c7c4 422
86fa6981
L
423 /* How to encode vector instructions. */
424 enum
425 {
426 vex_encoding_default = 0,
42e04b36 427 vex_encoding_vex,
86fa6981 428 vex_encoding_vex3,
da4977e0
JB
429 vex_encoding_evex,
430 vex_encoding_error
86fa6981
L
431 } vec_encoding;
432
d5de92cf
L
433 /* REP prefix. */
434 const char *rep_prefix;
435
165de32a
L
436 /* HLE prefix. */
437 const char *hle_prefix;
42164a71 438
7e8b059b
L
439 /* Have BND prefix. */
440 const char *bnd_prefix;
441
04ef582a
L
442 /* Have NOTRACK prefix. */
443 const char *notrack_prefix;
444
891edac4 445 /* Error message. */
a65babc9 446 enum i386_error error;
252b5132
RH
447 };
448
449typedef struct _i386_insn i386_insn;
450
43234a1e
L
451/* Link RC type with corresponding string, that'll be looked for in
452 asm. */
453struct RC_name
454{
455 enum rc_type type;
456 const char *name;
457 unsigned int len;
458};
459
460static const struct RC_name RC_NamesTable[] =
461{
462 { rne, STRING_COMMA_LEN ("rn-sae") },
463 { rd, STRING_COMMA_LEN ("rd-sae") },
464 { ru, STRING_COMMA_LEN ("ru-sae") },
465 { rz, STRING_COMMA_LEN ("rz-sae") },
466 { saeonly, STRING_COMMA_LEN ("sae") },
467};
468
3bfea8ba
L
469/* To be indexed by segment register number. */
470static const unsigned char i386_seg_prefixes[] = {
471 ES_PREFIX_OPCODE,
472 CS_PREFIX_OPCODE,
473 SS_PREFIX_OPCODE,
474 DS_PREFIX_OPCODE,
475 FS_PREFIX_OPCODE,
476 GS_PREFIX_OPCODE
477};
478
252b5132
RH
479/* List of chars besides those in app.c:symbol_chars that can start an
480 operand. Used to prevent the scrubber eating vital white-space. */
86fa6981 481const char extra_symbol_chars[] = "*%-([{}"
252b5132 482#ifdef LEX_AT
32137342
NC
483 "@"
484#endif
485#ifdef LEX_QM
486 "?"
252b5132 487#endif
32137342 488 ;
252b5132 489
b3983e5f
JB
490#if ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
491 && !defined (TE_GNU) \
492 && !defined (TE_LINUX) \
d85e70a3 493 && !defined (TE_Haiku) \
b3983e5f
JB
494 && !defined (TE_FreeBSD) \
495 && !defined (TE_DragonFly) \
496 && !defined (TE_NetBSD))
252b5132 497/* This array holds the chars that always start a comment. If the
b3b91714
AM
498 pre-processor is disabled, these aren't very useful. The option
499 --divide will remove '/' from this list. */
500const char *i386_comment_chars = "#/";
501#define SVR4_COMMENT_CHARS 1
252b5132 502#define PREFIX_SEPARATOR '\\'
252b5132 503
b3b91714
AM
504#else
505const char *i386_comment_chars = "#";
506#define PREFIX_SEPARATOR '/'
507#endif
508
252b5132
RH
509/* This array holds the chars that only start a comment at the beginning of
510 a line. If the line seems to have the form '# 123 filename'
ce8a8b2f
AM
511 .line and .file directives will appear in the pre-processed output.
512 Note that input_file.c hand checks for '#' at the beginning of the
252b5132 513 first line of the input file. This is because the compiler outputs
ce8a8b2f
AM
514 #NO_APP at the beginning of its output.
515 Also note that comments started like this one will always work if
252b5132 516 '/' isn't otherwise defined. */
b3b91714 517const char line_comment_chars[] = "#/";
252b5132 518
63a0b638 519const char line_separator_chars[] = ";";
252b5132 520
ce8a8b2f
AM
521/* Chars that can be used to separate mant from exp in floating point
522 nums. */
252b5132
RH
523const char EXP_CHARS[] = "eE";
524
ce8a8b2f
AM
525/* Chars that mean this number is a floating point constant
526 As in 0f12.456
527 or 0d1.2345e12. */
de133cf9 528const char FLT_CHARS[] = "fFdDxXhHbB";
252b5132 529
ce8a8b2f 530/* Tables for lexical analysis. */
252b5132
RH
531static char mnemonic_chars[256];
532static char register_chars[256];
533static char operand_chars[256];
534static char identifier_chars[256];
252b5132 535
ce8a8b2f 536/* Lexical macros. */
252b5132
RH
537#define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
538#define is_operand_char(x) (operand_chars[(unsigned char) x])
539#define is_register_char(x) (register_chars[(unsigned char) x])
540#define is_space_char(x) ((x) == ' ')
541#define is_identifier_char(x) (identifier_chars[(unsigned char) x])
252b5132 542
0234cb7c 543/* All non-digit non-letter characters that may occur in an operand. */
252b5132
RH
544static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
545
546/* md_assemble() always leaves the strings it's passed unaltered. To
547 effect this we maintain a stack of saved characters that we've smashed
548 with '\0's (indicating end of strings for various sub-fields of the
47926f60 549 assembler instruction). */
252b5132 550static char save_stack[32];
ce8a8b2f 551static char *save_stack_p;
252b5132
RH
552#define END_STRING_AND_SAVE(s) \
553 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
554#define RESTORE_END_STRING(s) \
555 do { *(s) = *--save_stack_p; } while (0)
556
47926f60 557/* The instruction we're assembling. */
252b5132
RH
558static i386_insn i;
559
560/* Possible templates for current insn. */
561static const templates *current_templates;
562
31b2323c
L
563/* Per instruction expressionS buffers: max displacements & immediates. */
564static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
565static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
252b5132 566
47926f60 567/* Current operand we are working on. */
ee86248c 568static int this_operand = -1;
252b5132 569
3e73aa7c
JH
570/* We support four different modes. FLAG_CODE variable is used to distinguish
571 these. */
572
573enum flag_code {
574 CODE_32BIT,
575 CODE_16BIT,
576 CODE_64BIT };
577
578static enum flag_code flag_code;
4fa24527 579static unsigned int object_64bit;
862be3fb 580static unsigned int disallow_64bit_reloc;
3e73aa7c 581static int use_rela_relocations = 0;
e379e5f3
L
582/* __tls_get_addr/___tls_get_addr symbol for TLS. */
583static const char *tls_get_addr;
3e73aa7c 584
7af8ed2d
NC
585#if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
586 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
587 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
588
351f65ca
L
589/* The ELF ABI to use. */
590enum x86_elf_abi
591{
592 I386_ABI,
7f56bc95
L
593 X86_64_ABI,
594 X86_64_X32_ABI
351f65ca
L
595};
596
597static enum x86_elf_abi x86_elf_abi = I386_ABI;
7af8ed2d 598#endif
351f65ca 599
167ad85b
TG
600#if defined (TE_PE) || defined (TE_PEP)
601/* Use big object file format. */
602static int use_big_obj = 0;
603#endif
604
8dcea932
L
605#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
606/* 1 if generating code for a shared library. */
607static int shared = 0;
b52c4ee4
IB
608
609unsigned int x86_sframe_cfa_sp_reg;
3e3e792a 610/* The other CFA base register for SFrame stack trace info. */
b52c4ee4
IB
611unsigned int x86_sframe_cfa_fp_reg;
612unsigned int x86_sframe_cfa_ra_reg;
613
8dcea932
L
614#endif
615
47926f60
KH
616/* 1 for intel syntax,
617 0 if att syntax. */
618static int intel_syntax = 0;
252b5132 619
4b5aaf5f
L
620static enum x86_64_isa
621{
622 amd64 = 1, /* AMD64 ISA. */
623 intel64 /* Intel64 ISA. */
624} isa64;
e89c5eaa 625
1efbbeb4
L
626/* 1 for intel mnemonic,
627 0 if att mnemonic. */
628static int intel_mnemonic = !SYSV386_COMPAT;
629
a60de03c
JB
630/* 1 if pseudo registers are permitted. */
631static int allow_pseudo_reg = 0;
632
47926f60
KH
633/* 1 if register prefix % not required. */
634static int allow_naked_reg = 0;
252b5132 635
33eaf5de 636/* 1 if the assembler should add BND prefix for all control-transferring
7e8b059b
L
637 instructions supporting it, even if this prefix wasn't specified
638 explicitly. */
639static int add_bnd_prefix = 0;
640
ba104c83 641/* 1 if pseudo index register, eiz/riz, is allowed . */
db51cc60
L
642static int allow_index_reg = 0;
643
d022bddd
IT
644/* 1 if the assembler should ignore LOCK prefix, even if it was
645 specified explicitly. */
646static int omit_lock_prefix = 0;
647
e4e00185
AS
648/* 1 if the assembler should encode lfence, mfence, and sfence as
649 "lock addl $0, (%{re}sp)". */
650static int avoid_fence = 0;
651
ae531041
L
652/* 1 if lfence should be inserted after every load. */
653static int lfence_after_load = 0;
654
655/* Non-zero if lfence should be inserted before indirect branch. */
656static enum lfence_before_indirect_branch_kind
657 {
658 lfence_branch_none = 0,
659 lfence_branch_register,
660 lfence_branch_memory,
661 lfence_branch_all
662 }
663lfence_before_indirect_branch;
664
665/* Non-zero if lfence should be inserted before ret. */
666static enum lfence_before_ret_kind
667 {
668 lfence_before_ret_none = 0,
669 lfence_before_ret_not,
a09f656b 670 lfence_before_ret_or,
671 lfence_before_ret_shl
ae531041
L
672 }
673lfence_before_ret;
674
675/* Types of previous instruction is .byte or prefix. */
e379e5f3
L
676static struct
677 {
678 segT seg;
679 const char *file;
680 const char *name;
681 unsigned int line;
682 enum last_insn_kind
683 {
684 last_insn_other = 0,
685 last_insn_directive,
686 last_insn_prefix
687 } kind;
688 } last_insn;
689
0cb4071e
L
690/* 1 if the assembler should generate relax relocations. */
691
692static int generate_relax_relocations
693 = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
694
7bab8ab5 695static enum check_kind
daf50ae7 696 {
7bab8ab5
JB
697 check_none = 0,
698 check_warning,
699 check_error
daf50ae7 700 }
7bab8ab5 701sse_check, operand_check = check_warning;
daf50ae7 702
e379e5f3
L
703/* Non-zero if branches should be aligned within power of 2 boundary. */
704static int align_branch_power = 0;
705
706/* Types of branches to align. */
707enum align_branch_kind
708 {
709 align_branch_none = 0,
710 align_branch_jcc = 1,
711 align_branch_fused = 2,
712 align_branch_jmp = 3,
713 align_branch_call = 4,
714 align_branch_indirect = 5,
715 align_branch_ret = 6
716 };
717
718/* Type bits of branches to align. */
719enum align_branch_bit
720 {
721 align_branch_jcc_bit = 1 << align_branch_jcc,
722 align_branch_fused_bit = 1 << align_branch_fused,
723 align_branch_jmp_bit = 1 << align_branch_jmp,
724 align_branch_call_bit = 1 << align_branch_call,
725 align_branch_indirect_bit = 1 << align_branch_indirect,
726 align_branch_ret_bit = 1 << align_branch_ret
727 };
728
729static unsigned int align_branch = (align_branch_jcc_bit
730 | align_branch_fused_bit
731 | align_branch_jmp_bit);
732
79d72f45
HL
733/* Types of condition jump used by macro-fusion. */
734enum mf_jcc_kind
735 {
736 mf_jcc_jo = 0, /* base opcode 0x70 */
737 mf_jcc_jc, /* base opcode 0x72 */
738 mf_jcc_je, /* base opcode 0x74 */
739 mf_jcc_jna, /* base opcode 0x76 */
740 mf_jcc_js, /* base opcode 0x78 */
741 mf_jcc_jp, /* base opcode 0x7a */
742 mf_jcc_jl, /* base opcode 0x7c */
743 mf_jcc_jle, /* base opcode 0x7e */
744 };
745
746/* Types of compare flag-modifying insntructions used by macro-fusion. */
747enum mf_cmp_kind
748 {
749 mf_cmp_test_and, /* test/cmp */
750 mf_cmp_alu_cmp, /* add/sub/cmp */
751 mf_cmp_incdec /* inc/dec */
752 };
753
e379e5f3
L
754/* The maximum padding size for fused jcc. CMP like instruction can
755 be 9 bytes and jcc can be 6 bytes. Leave room just in case for
756 prefixes. */
757#define MAX_FUSED_JCC_PADDING_SIZE 20
758
759/* The maximum number of prefixes added for an instruction. */
760static unsigned int align_branch_prefix_size = 5;
761
b6f8c7c4
L
762/* Optimization:
763 1. Clear the REX_W bit with register operand if possible.
764 2. Above plus use 128bit vector instruction to clear the full vector
765 register.
766 */
767static int optimize = 0;
768
769/* Optimization:
770 1. Clear the REX_W bit with register operand if possible.
771 2. Above plus use 128bit vector instruction to clear the full vector
772 register.
773 3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
774 "testb $imm7,%r8".
775 */
776static int optimize_for_space = 0;
777
2ca3ace5
L
778/* Register prefix used for error message. */
779static const char *register_prefix = "%";
780
47926f60
KH
781/* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
782 leave, push, and pop instructions so that gcc has the same stack
783 frame as in 32 bit mode. */
784static char stackop_size = '\0';
eecb386c 785
12b55ccc
L
786/* Non-zero to optimize code alignment. */
787int optimize_align_code = 1;
788
47926f60
KH
789/* Non-zero to quieten some warnings. */
790static int quiet_warnings = 0;
a38cf1db 791
d59a54c2
JB
792/* Guard to avoid repeated warnings about non-16-bit code on 16-bit CPUs. */
793static bool pre_386_16bit_warned;
794
47926f60
KH
795/* CPU name. */
796static const char *cpu_arch_name = NULL;
6305a203 797static char *cpu_sub_arch_name = NULL;
a38cf1db 798
47926f60 799/* CPU feature flags. */
40fb9820
L
800static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
801
ccc9c027
L
802/* If we have selected a cpu we are generating instructions for. */
803static int cpu_arch_tune_set = 0;
804
9103f4f4 805/* Cpu we are generating instructions for. */
fbf3f584 806enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
9103f4f4
L
807
808/* CPU feature flags of cpu we are generating instructions for. */
40fb9820 809static i386_cpu_flags cpu_arch_tune_flags;
9103f4f4 810
ccc9c027 811/* CPU instruction set architecture used. */
fbf3f584 812enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
ccc9c027 813
9103f4f4 814/* CPU feature flags of instruction set architecture used. */
fbf3f584 815i386_cpu_flags cpu_arch_isa_flags;
9103f4f4 816
fddf5b5b
AM
817/* If set, conditional jumps are not automatically promoted to handle
818 larger than a byte offset. */
f68697e8 819static bool no_cond_jump_promotion = false;
fddf5b5b 820
c0f3af97
L
821/* Encode SSE instructions with VEX prefix. */
822static unsigned int sse2avx;
823
c8480b58
L
824/* Encode aligned vector move as unaligned vector move. */
825static unsigned int use_unaligned_vector_move;
826
539f890d
L
827/* Encode scalar AVX instructions with specific vector length. */
828static enum
829 {
830 vex128 = 0,
831 vex256
832 } avxscalar;
833
03751133
L
834/* Encode VEX WIG instructions with specific vex.w. */
835static enum
836 {
837 vexw0 = 0,
838 vexw1
839 } vexwig;
840
43234a1e
L
841/* Encode scalar EVEX LIG instructions with specific vector length. */
842static enum
843 {
844 evexl128 = 0,
845 evexl256,
846 evexl512
847 } evexlig;
848
849/* Encode EVEX WIG instructions with specific evex.w. */
850static enum
851 {
852 evexw0 = 0,
853 evexw1
854 } evexwig;
855
d3d3c6db
IT
856/* Value to encode in EVEX RC bits, for SAE-only instructions. */
857static enum rc_type evexrcig = rne;
858
29b0f896 859/* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
87c245cc 860static symbolS *GOT_symbol;
29b0f896 861
a4447b93
RH
862/* The dwarf2 return column, adjusted for 32 or 64 bit. */
863unsigned int x86_dwarf2_return_column;
864
865/* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
866int x86_cie_data_alignment;
867
252b5132 868/* Interface to relax_segment.
fddf5b5b
AM
869 There are 3 major relax states for 386 jump insns because the
870 different types of jumps add different sizes to frags when we're
e379e5f3
L
871 figuring out what sort of jump to choose to reach a given label.
872
873 BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
874 branches which are handled by md_estimate_size_before_relax() and
875 i386_generic_table_relax_frag(). */
252b5132 876
47926f60 877/* Types. */
93c2a809
AM
878#define UNCOND_JUMP 0
879#define COND_JUMP 1
880#define COND_JUMP86 2
e379e5f3
L
881#define BRANCH_PADDING 3
882#define BRANCH_PREFIX 4
883#define FUSED_JCC_PADDING 5
fddf5b5b 884
47926f60 885/* Sizes. */
252b5132
RH
886#define CODE16 1
887#define SMALL 0
29b0f896 888#define SMALL16 (SMALL | CODE16)
252b5132 889#define BIG 2
29b0f896 890#define BIG16 (BIG | CODE16)
252b5132
RH
891
892#ifndef INLINE
893#ifdef __GNUC__
894#define INLINE __inline__
895#else
896#define INLINE
897#endif
898#endif
899
fddf5b5b
AM
900#define ENCODE_RELAX_STATE(type, size) \
901 ((relax_substateT) (((type) << 2) | (size)))
902#define TYPE_FROM_RELAX_STATE(s) \
903 ((s) >> 2)
904#define DISP_SIZE_FROM_RELAX_STATE(s) \
905 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
252b5132
RH
906
907/* This table is used by relax_frag to promote short jumps to long
908 ones where necessary. SMALL (short) jumps may be promoted to BIG
909 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
910 don't allow a short jump in a 32 bit code segment to be promoted to
911 a 16 bit offset jump because it's slower (requires data size
912 prefix), and doesn't work, unless the destination is in the bottom
913 64k of the code segment (The top 16 bits of eip are zeroed). */
914
915const relax_typeS md_relax_table[] =
916{
24eab124
AM
917 /* The fields are:
918 1) most positive reach of this state,
919 2) most negative reach of this state,
93c2a809 920 3) how many bytes this mode will have in the variable part of the frag
ce8a8b2f 921 4) which index into the table to try if we can't fit into this one. */
252b5132 922
fddf5b5b 923 /* UNCOND_JUMP states. */
93c2a809
AM
924 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
925 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
926 /* dword jmp adds 4 bytes to frag:
927 0 extra opcode bytes, 4 displacement bytes. */
252b5132 928 {0, 0, 4, 0},
93c2a809
AM
929 /* word jmp adds 2 byte2 to frag:
930 0 extra opcode bytes, 2 displacement bytes. */
252b5132
RH
931 {0, 0, 2, 0},
932
93c2a809
AM
933 /* COND_JUMP states. */
934 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
935 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
936 /* dword conditionals adds 5 bytes to frag:
937 1 extra opcode byte, 4 displacement bytes. */
938 {0, 0, 5, 0},
fddf5b5b 939 /* word conditionals add 3 bytes to frag:
93c2a809
AM
940 1 extra opcode byte, 2 displacement bytes. */
941 {0, 0, 3, 0},
942
943 /* COND_JUMP86 states. */
944 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
945 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
946 /* dword conditionals adds 5 bytes to frag:
947 1 extra opcode byte, 4 displacement bytes. */
948 {0, 0, 5, 0},
949 /* word conditionals add 4 bytes to frag:
950 1 displacement byte and a 3 byte long branch insn. */
951 {0, 0, 4, 0}
252b5132
RH
952};
953
6ceeed25 954#define ARCH(n, t, f, s) \
ae89daec
JB
955 { STRING_COMMA_LEN (#n), s, PROCESSOR_ ## t, CPU_ ## f ## _FLAGS, \
956 CPU_NONE_FLAGS }
957#define SUBARCH(n, e, d, s) \
958 { STRING_COMMA_LEN (#n), s, PROCESSOR_NONE, CPU_ ## e ## _FLAGS, \
959 CPU_ ## d ## _FLAGS }
6ceeed25 960
9103f4f4
L
961static const arch_entry cpu_arch[] =
962{
3ce2ebcf
JB
963 /* Do not replace the first two entries - i386_target_format() and
964 set_cpu_arch() rely on them being there in this order. */
6ceeed25
JB
965 ARCH (generic32, GENERIC32, GENERIC32, false),
966 ARCH (generic64, GENERIC64, GENERIC64, false),
967 ARCH (i8086, UNKNOWN, NONE, false),
4d97c5c8
JB
968 ARCH (i186, UNKNOWN, 186, false),
969 ARCH (i286, UNKNOWN, 286, false),
970 ARCH (i386, I386, 386, false),
971 ARCH (i486, I486, 486, false),
972 ARCH (i586, PENTIUM, 586, false),
973 ARCH (i686, PENTIUMPRO, 686, false),
974 ARCH (pentium, PENTIUM, 586, false),
6ceeed25
JB
975 ARCH (pentiumpro, PENTIUMPRO, PENTIUMPRO, false),
976 ARCH (pentiumii, PENTIUMPRO, P2, false),
977 ARCH (pentiumiii, PENTIUMPRO, P3, false),
978 ARCH (pentium4, PENTIUM4, P4, false),
979 ARCH (prescott, NOCONA, CORE, false),
980 ARCH (nocona, NOCONA, NOCONA, false),
981 ARCH (yonah, CORE, CORE, true),
982 ARCH (core, CORE, CORE, false),
983 ARCH (merom, CORE2, CORE2, true),
984 ARCH (core2, CORE2, CORE2, false),
985 ARCH (corei7, COREI7, COREI7, false),
986 ARCH (iamcu, IAMCU, IAMCU, false),
987 ARCH (k6, K6, K6, false),
988 ARCH (k6_2, K6, K6_2, false),
989 ARCH (athlon, ATHLON, ATHLON, false),
990 ARCH (sledgehammer, K8, K8, true),
991 ARCH (opteron, K8, K8, false),
992 ARCH (k8, K8, K8, false),
993 ARCH (amdfam10, AMDFAM10, AMDFAM10, false),
994 ARCH (bdver1, BD, BDVER1, false),
995 ARCH (bdver2, BD, BDVER2, false),
996 ARCH (bdver3, BD, BDVER3, false),
997 ARCH (bdver4, BD, BDVER4, false),
998 ARCH (znver1, ZNVER, ZNVER1, false),
999 ARCH (znver2, ZNVER, ZNVER2, false),
1000 ARCH (znver3, ZNVER, ZNVER3, false),
b0e8fa7f 1001 ARCH (znver4, ZNVER, ZNVER4, false),
6ceeed25
JB
1002 ARCH (btver1, BT, BTVER1, false),
1003 ARCH (btver2, BT, BTVER2, false),
1004
4d97c5c8
JB
1005 SUBARCH (8087, 8087, ANY_8087, false),
1006 SUBARCH (87, NONE, ANY_8087, false), /* Disable only! */
ae89daec
JB
1007 SUBARCH (287, 287, ANY_287, false),
1008 SUBARCH (387, 387, ANY_387, false),
1009 SUBARCH (687, 687, ANY_687, false),
4d97c5c8 1010 SUBARCH (cmov, CMOV, CMOV, false),
88bd2203 1011 SUBARCH (fxsr, FXSR, ANY_FXSR, false),
ae89daec
JB
1012 SUBARCH (mmx, MMX, ANY_MMX, false),
1013 SUBARCH (sse, SSE, ANY_SSE, false),
1014 SUBARCH (sse2, SSE2, ANY_SSE2, false),
1015 SUBARCH (sse3, SSE3, ANY_SSE3, false),
1016 SUBARCH (sse4a, SSE4A, ANY_SSE4A, false),
1017 SUBARCH (ssse3, SSSE3, ANY_SSSE3, false),
1018 SUBARCH (sse4.1, SSE4_1, ANY_SSE4_1, false),
1019 SUBARCH (sse4.2, SSE4_2, ANY_SSE4_2, false),
1020 SUBARCH (sse4, SSE4_2, ANY_SSE4_1, false),
1021 SUBARCH (avx, AVX, ANY_AVX, false),
1022 SUBARCH (avx2, AVX2, ANY_AVX2, false),
1023 SUBARCH (avx512f, AVX512F, ANY_AVX512F, false),
1024 SUBARCH (avx512cd, AVX512CD, ANY_AVX512CD, false),
1025 SUBARCH (avx512er, AVX512ER, ANY_AVX512ER, false),
1026 SUBARCH (avx512pf, AVX512PF, ANY_AVX512PF, false),
1027 SUBARCH (avx512dq, AVX512DQ, ANY_AVX512DQ, false),
1028 SUBARCH (avx512bw, AVX512BW, ANY_AVX512BW, false),
1029 SUBARCH (avx512vl, AVX512VL, ANY_AVX512VL, false),
cafa5ef7 1030 SUBARCH (monitor, MONITOR, MONITOR, false),
25626f79
JB
1031 SUBARCH (vmx, VMX, ANY_VMX, false),
1032 SUBARCH (vmfunc, VMFUNC, ANY_VMFUNC, false),
ae89daec 1033 SUBARCH (smx, SMX, SMX, false),
5091b9ee
JB
1034 SUBARCH (xsave, XSAVE, ANY_XSAVE, false),
1035 SUBARCH (xsaveopt, XSAVEOPT, ANY_XSAVEOPT, false),
1036 SUBARCH (xsavec, XSAVEC, ANY_XSAVEC, false),
1037 SUBARCH (xsaves, XSAVES, ANY_XSAVES, false),
1038 SUBARCH (aes, AES, ANY_AES, false),
1039 SUBARCH (pclmul, PCLMUL, ANY_PCLMUL, false),
1040 SUBARCH (clmul, PCLMUL, ANY_PCLMUL, true),
ae89daec
JB
1041 SUBARCH (fsgsbase, FSGSBASE, FSGSBASE, false),
1042 SUBARCH (rdrnd, RDRND, RDRND, false),
5091b9ee 1043 SUBARCH (f16c, F16C, ANY_F16C, false),
ae89daec 1044 SUBARCH (bmi2, BMI2, BMI2, false),
5091b9ee
JB
1045 SUBARCH (fma, FMA, ANY_FMA, false),
1046 SUBARCH (fma4, FMA4, ANY_FMA4, false),
1047 SUBARCH (xop, XOP, ANY_XOP, false),
1048 SUBARCH (lwp, LWP, ANY_LWP, false),
ae89daec
JB
1049 SUBARCH (movbe, MOVBE, MOVBE, false),
1050 SUBARCH (cx16, CX16, CX16, false),
c3bb24f5 1051 SUBARCH (lahf_sahf, LAHF_SAHF, LAHF_SAHF, false),
25626f79 1052 SUBARCH (ept, EPT, ANY_EPT, false),
ae89daec
JB
1053 SUBARCH (lzcnt, LZCNT, LZCNT, false),
1054 SUBARCH (popcnt, POPCNT, POPCNT, false),
1055 SUBARCH (hle, HLE, HLE, false),
760ab3d0
JB
1056 SUBARCH (rtm, RTM, ANY_RTM, false),
1057 SUBARCH (tsx, TSX, TSX, false),
ae89daec
JB
1058 SUBARCH (invpcid, INVPCID, INVPCID, false),
1059 SUBARCH (clflush, CLFLUSH, CLFLUSH, false),
1060 SUBARCH (nop, NOP, NOP, false),
1061 SUBARCH (syscall, SYSCALL, SYSCALL, false),
1062 SUBARCH (rdtscp, RDTSCP, RDTSCP, false),
5091b9ee
JB
1063 SUBARCH (3dnow, 3DNOW, ANY_3DNOW, false),
1064 SUBARCH (3dnowa, 3DNOWA, ANY_3DNOWA, false),
ae89daec 1065 SUBARCH (padlock, PADLOCK, PADLOCK, false),
0919e770
JB
1066 SUBARCH (pacifica, SVME, ANY_SVME, true),
1067 SUBARCH (svme, SVME, ANY_SVME, false),
ae89daec
JB
1068 SUBARCH (abm, ABM, ABM, false),
1069 SUBARCH (bmi, BMI, BMI, false),
1070 SUBARCH (tbm, TBM, TBM, false),
1071 SUBARCH (adx, ADX, ADX, false),
1072 SUBARCH (rdseed, RDSEED, RDSEED, false),
1073 SUBARCH (prfchw, PRFCHW, PRFCHW, false),
1074 SUBARCH (smap, SMAP, SMAP, false),
5091b9ee
JB
1075 SUBARCH (mpx, MPX, ANY_MPX, false),
1076 SUBARCH (sha, SHA, ANY_SHA, false),
ae89daec
JB
1077 SUBARCH (clflushopt, CLFLUSHOPT, CLFLUSHOPT, false),
1078 SUBARCH (prefetchwt1, PREFETCHWT1, PREFETCHWT1, false),
1079 SUBARCH (se1, SE1, SE1, false),
1080 SUBARCH (clwb, CLWB, CLWB, false),
1081 SUBARCH (avx512ifma, AVX512IFMA, ANY_AVX512IFMA, false),
1082 SUBARCH (avx512vbmi, AVX512VBMI, ANY_AVX512VBMI, false),
1083 SUBARCH (avx512_4fmaps, AVX512_4FMAPS, ANY_AVX512_4FMAPS, false),
1084 SUBARCH (avx512_4vnniw, AVX512_4VNNIW, ANY_AVX512_4VNNIW, false),
1085 SUBARCH (avx512_vpopcntdq, AVX512_VPOPCNTDQ, ANY_AVX512_VPOPCNTDQ, false),
1086 SUBARCH (avx512_vbmi2, AVX512_VBMI2, ANY_AVX512_VBMI2, false),
1087 SUBARCH (avx512_vnni, AVX512_VNNI, ANY_AVX512_VNNI, false),
1088 SUBARCH (avx512_bitalg, AVX512_BITALG, ANY_AVX512_BITALG, false),
1089 SUBARCH (avx_vnni, AVX_VNNI, ANY_AVX_VNNI, false),
1090 SUBARCH (clzero, CLZERO, CLZERO, false),
1091 SUBARCH (mwaitx, MWAITX, MWAITX, false),
5091b9ee 1092 SUBARCH (ospke, OSPKE, ANY_OSPKE, false),
ae89daec
JB
1093 SUBARCH (rdpid, RDPID, RDPID, false),
1094 SUBARCH (ptwrite, PTWRITE, PTWRITE, false),
4d97c5c8
JB
1095 SUBARCH (ibt, IBT, IBT, false),
1096 SUBARCH (shstk, SHSTK, SHSTK, false),
88bd2203 1097 SUBARCH (gfni, GFNI, ANY_GFNI, false),
b20f4261
JB
1098 SUBARCH (vaes, VAES, ANY_VAES, false),
1099 SUBARCH (vpclmulqdq, VPCLMULQDQ, ANY_VPCLMULQDQ, false),
ae89daec
JB
1100 SUBARCH (wbnoinvd, WBNOINVD, WBNOINVD, false),
1101 SUBARCH (pconfig, PCONFIG, PCONFIG, false),
1102 SUBARCH (waitpkg, WAITPKG, WAITPKG, false),
1103 SUBARCH (cldemote, CLDEMOTE, CLDEMOTE, false),
1104 SUBARCH (amx_int8, AMX_INT8, ANY_AMX_INT8, false),
1105 SUBARCH (amx_bf16, AMX_BF16, ANY_AMX_BF16, false),
5091b9ee 1106 SUBARCH (amx_fp16, AMX_FP16, ANY_AMX_FP16, false),
ae89daec 1107 SUBARCH (amx_tile, AMX_TILE, ANY_AMX_TILE, false),
4d97c5c8
JB
1108 SUBARCH (movdiri, MOVDIRI, MOVDIRI, false),
1109 SUBARCH (movdir64b, MOVDIR64B, MOVDIR64B, false),
ae89daec
JB
1110 SUBARCH (avx512_bf16, AVX512_BF16, ANY_AVX512_BF16, false),
1111 SUBARCH (avx512_vp2intersect, AVX512_VP2INTERSECT,
1112 ANY_AVX512_VP2INTERSECT, false),
4d97c5c8
JB
1113 SUBARCH (tdx, TDX, TDX, false),
1114 SUBARCH (enqcmd, ENQCMD, ENQCMD, false),
1115 SUBARCH (serialize, SERIALIZE, SERIALIZE, false),
ae89daec
JB
1116 SUBARCH (rdpru, RDPRU, RDPRU, false),
1117 SUBARCH (mcommit, MCOMMIT, MCOMMIT, false),
0919e770 1118 SUBARCH (sev_es, SEV_ES, ANY_SEV_ES, false),
760ab3d0 1119 SUBARCH (tsxldtrk, TSXLDTRK, ANY_TSXLDTRK, false),
88bd2203
JB
1120 SUBARCH (kl, KL, ANY_KL, false),
1121 SUBARCH (widekl, WIDEKL, ANY_WIDEKL, false),
4d97c5c8
JB
1122 SUBARCH (uintr, UINTR, UINTR, false),
1123 SUBARCH (hreset, HRESET, HRESET, false),
ae89daec 1124 SUBARCH (avx512_fp16, AVX512_FP16, ANY_AVX512_FP16, false),
ef07be45 1125 SUBARCH (prefetchi, PREFETCHI, PREFETCHI, false),
4321af3e 1126 SUBARCH (avx_ifma, AVX_IFMA, ANY_AVX_IFMA, false),
23ae61ad 1127 SUBARCH (avx_vnni_int8, AVX_VNNI_INT8, ANY_AVX_VNNI_INT8, false),
4d97c5c8
JB
1128 SUBARCH (cmpccxadd, CMPCCXADD, CMPCCXADD, false),
1129 SUBARCH (wrmsrns, WRMSRNS, WRMSRNS, false),
1130 SUBARCH (msrlist, MSRLIST, MSRLIST, false),
01d8ce74 1131 SUBARCH (avx_ne_convert, AVX_NE_CONVERT, ANY_AVX_NE_CONVERT, false),
4d97c5c8 1132 SUBARCH (rao_int, RAO_INT, RAO_INT, false),
0919e770 1133 SUBARCH (rmpquery, RMPQUERY, ANY_RMPQUERY, false),
293f5f65
L
1134};
1135
6ceeed25
JB
1136#undef SUBARCH
1137#undef ARCH
1138
704209c0 1139#ifdef I386COFF
a6c24e68
NC
1140/* Like s_lcomm_internal in gas/read.c but the alignment string
1141 is allowed to be optional. */
1142
1143static symbolS *
1144pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1145{
1146 addressT align = 0;
1147
1148 SKIP_WHITESPACE ();
1149
7ab9ffdd 1150 if (needs_align
a6c24e68
NC
1151 && *input_line_pointer == ',')
1152 {
1153 align = parse_align (needs_align - 1);
7ab9ffdd 1154
a6c24e68
NC
1155 if (align == (addressT) -1)
1156 return NULL;
1157 }
1158 else
1159 {
1160 if (size >= 8)
1161 align = 3;
1162 else if (size >= 4)
1163 align = 2;
1164 else if (size >= 2)
1165 align = 1;
1166 else
1167 align = 0;
1168 }
1169
1170 bss_alloc (symbolP, size, align);
1171 return symbolP;
1172}
1173
704209c0 1174static void
a6c24e68
NC
1175pe_lcomm (int needs_align)
1176{
1177 s_comm_internal (needs_align * 2, pe_lcomm_internal);
1178}
704209c0 1179#endif
a6c24e68 1180
29b0f896
AM
1181const pseudo_typeS md_pseudo_table[] =
1182{
1183#if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1184 {"align", s_align_bytes, 0},
1185#else
1186 {"align", s_align_ptwo, 0},
1187#endif
1188 {"arch", set_cpu_arch, 0},
1189#ifndef I386COFF
1190 {"bss", s_bss, 0},
a6c24e68
NC
1191#else
1192 {"lcomm", pe_lcomm, 1},
29b0f896
AM
1193#endif
1194 {"ffloat", float_cons, 'f'},
1195 {"dfloat", float_cons, 'd'},
1196 {"tfloat", float_cons, 'x'},
7d19d096 1197 {"hfloat", float_cons, 'h'},
de133cf9 1198 {"bfloat16", float_cons, 'b'},
29b0f896 1199 {"value", cons, 2},
d182319b 1200 {"slong", signed_cons, 4},
29b0f896
AM
1201 {"noopt", s_ignore, 0},
1202 {"optim", s_ignore, 0},
1203 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1204 {"code16", set_code_flag, CODE_16BIT},
1205 {"code32", set_code_flag, CODE_32BIT},
da5f19a2 1206#ifdef BFD64
29b0f896 1207 {"code64", set_code_flag, CODE_64BIT},
da5f19a2 1208#endif
29b0f896
AM
1209 {"intel_syntax", set_intel_syntax, 1},
1210 {"att_syntax", set_intel_syntax, 0},
1efbbeb4
L
1211 {"intel_mnemonic", set_intel_mnemonic, 1},
1212 {"att_mnemonic", set_intel_mnemonic, 0},
db51cc60
L
1213 {"allow_index_reg", set_allow_index_reg, 1},
1214 {"disallow_index_reg", set_allow_index_reg, 0},
7bab8ab5
JB
1215 {"sse_check", set_check, 0},
1216 {"operand_check", set_check, 1},
3b22753a
L
1217#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1218 {"largecomm", handle_large_common, 0},
07a53e5c 1219#else
68d20676 1220 {"file", dwarf2_directive_file, 0},
07a53e5c
RH
1221 {"loc", dwarf2_directive_loc, 0},
1222 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
3b22753a 1223#endif
6482c264
NC
1224#ifdef TE_PE
1225 {"secrel32", pe_directive_secrel, 0},
145667f8 1226 {"secidx", pe_directive_secidx, 0},
6482c264 1227#endif
29b0f896
AM
1228 {0, 0, 0}
1229};
1230
1231/* For interface with expression (). */
1232extern char *input_line_pointer;
1233
1234/* Hash table for instruction mnemonic lookup. */
629310ab 1235static htab_t op_hash;
29b0f896
AM
1236
1237/* Hash table for register lookup. */
629310ab 1238static htab_t reg_hash;
29b0f896 1239\f
ce8a8b2f
AM
1240 /* Various efficient no-op patterns for aligning code labels.
1241 Note: Don't try to assemble the instructions in the comments.
1242 0L and 0w are not legal. */
62a02d25
L
1243static const unsigned char f32_1[] =
1244 {0x90}; /* nop */
1245static const unsigned char f32_2[] =
1246 {0x66,0x90}; /* xchg %ax,%ax */
1247static const unsigned char f32_3[] =
1248 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
1249static const unsigned char f32_4[] =
1250 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
62a02d25
L
1251static const unsigned char f32_6[] =
1252 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
1253static const unsigned char f32_7[] =
1254 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
62a02d25 1255static const unsigned char f16_3[] =
3ae729d5 1256 {0x8d,0x74,0x00}; /* lea 0(%si),%si */
62a02d25 1257static const unsigned char f16_4[] =
3ae729d5
L
1258 {0x8d,0xb4,0x00,0x00}; /* lea 0W(%si),%si */
1259static const unsigned char jump_disp8[] =
1260 {0xeb}; /* jmp disp8 */
1261static const unsigned char jump32_disp32[] =
1262 {0xe9}; /* jmp disp32 */
1263static const unsigned char jump16_disp32[] =
1264 {0x66,0xe9}; /* jmp disp32 */
62a02d25
L
1265/* 32-bit NOPs patterns. */
1266static const unsigned char *const f32_patt[] = {
3ae729d5 1267 f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
62a02d25
L
1268};
1269/* 16-bit NOPs patterns. */
1270static const unsigned char *const f16_patt[] = {
3ae729d5 1271 f32_1, f32_2, f16_3, f16_4
62a02d25
L
1272};
1273/* nopl (%[re]ax) */
1274static const unsigned char alt_3[] =
1275 {0x0f,0x1f,0x00};
1276/* nopl 0(%[re]ax) */
1277static const unsigned char alt_4[] =
1278 {0x0f,0x1f,0x40,0x00};
1279/* nopl 0(%[re]ax,%[re]ax,1) */
1280static const unsigned char alt_5[] =
1281 {0x0f,0x1f,0x44,0x00,0x00};
1282/* nopw 0(%[re]ax,%[re]ax,1) */
1283static const unsigned char alt_6[] =
1284 {0x66,0x0f,0x1f,0x44,0x00,0x00};
1285/* nopl 0L(%[re]ax) */
1286static const unsigned char alt_7[] =
1287 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1288/* nopl 0L(%[re]ax,%[re]ax,1) */
1289static const unsigned char alt_8[] =
1290 {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1291/* nopw 0L(%[re]ax,%[re]ax,1) */
1292static const unsigned char alt_9[] =
1293 {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1294/* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1295static const unsigned char alt_10[] =
1296 {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
3ae729d5
L
1297/* data16 nopw %cs:0L(%eax,%eax,1) */
1298static const unsigned char alt_11[] =
1299 {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
62a02d25
L
1300/* 32-bit and 64-bit NOPs patterns. */
1301static const unsigned char *const alt_patt[] = {
1302 f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
3ae729d5 1303 alt_9, alt_10, alt_11
62a02d25
L
1304};
1305
1306/* Genenerate COUNT bytes of NOPs to WHERE from PATT with the maximum
1307 size of a single NOP instruction MAX_SINGLE_NOP_SIZE. */
1308
1309static void
1310i386_output_nops (char *where, const unsigned char *const *patt,
1311 int count, int max_single_nop_size)
1312
1313{
3ae729d5
L
1314 /* Place the longer NOP first. */
1315 int last;
1316 int offset;
3076e594
NC
1317 const unsigned char *nops;
1318
1319 if (max_single_nop_size < 1)
1320 {
1321 as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1322 max_single_nop_size);
1323 return;
1324 }
1325
1326 nops = patt[max_single_nop_size - 1];
3ae729d5
L
1327
1328 /* Use the smaller one if the requsted one isn't available. */
1329 if (nops == NULL)
62a02d25 1330 {
3ae729d5
L
1331 max_single_nop_size--;
1332 nops = patt[max_single_nop_size - 1];
62a02d25
L
1333 }
1334
3ae729d5
L
1335 last = count % max_single_nop_size;
1336
1337 count -= last;
1338 for (offset = 0; offset < count; offset += max_single_nop_size)
1339 memcpy (where + offset, nops, max_single_nop_size);
1340
1341 if (last)
1342 {
1343 nops = patt[last - 1];
1344 if (nops == NULL)
1345 {
1346 /* Use the smaller one plus one-byte NOP if the needed one
1347 isn't available. */
1348 last--;
1349 nops = patt[last - 1];
1350 memcpy (where + offset, nops, last);
1351 where[offset + last] = *patt[0];
1352 }
1353 else
1354 memcpy (where + offset, nops, last);
1355 }
62a02d25
L
1356}
1357
3ae729d5
L
1358static INLINE int
1359fits_in_imm7 (offsetT num)
1360{
1361 return (num & 0x7f) == num;
1362}
1363
1364static INLINE int
1365fits_in_imm31 (offsetT num)
1366{
1367 return (num & 0x7fffffff) == num;
1368}
62a02d25
L
1369
1370/* Genenerate COUNT bytes of NOPs to WHERE with the maximum size of a
1371 single NOP instruction LIMIT. */
1372
1373void
3ae729d5 1374i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
62a02d25 1375{
3ae729d5 1376 const unsigned char *const *patt = NULL;
62a02d25 1377 int max_single_nop_size;
3ae729d5
L
1378 /* Maximum number of NOPs before switching to jump over NOPs. */
1379 int max_number_of_nops;
62a02d25 1380
3ae729d5 1381 switch (fragP->fr_type)
62a02d25 1382 {
3ae729d5
L
1383 case rs_fill_nop:
1384 case rs_align_code:
1385 break;
e379e5f3
L
1386 case rs_machine_dependent:
1387 /* Allow NOP padding for jumps and calls. */
1388 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
1389 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
1390 break;
1391 /* Fall through. */
3ae729d5 1392 default:
62a02d25
L
1393 return;
1394 }
1395
ccc9c027
L
1396 /* We need to decide which NOP sequence to use for 32bit and
1397 64bit. When -mtune= is used:
4eed87de 1398
76bc74dc
L
1399 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1400 PROCESSOR_GENERIC32, f32_patt will be used.
80b8656c
L
1401 2. For the rest, alt_patt will be used.
1402
1403 When -mtune= isn't used, alt_patt will be used if
22109423 1404 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
76bc74dc 1405 be used.
ccc9c027
L
1406
1407 When -march= or .arch is used, we can't use anything beyond
1408 cpu_arch_isa_flags. */
1409
1410 if (flag_code == CODE_16BIT)
1411 {
3ae729d5
L
1412 patt = f16_patt;
1413 max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1414 /* Limit number of NOPs to 2 in 16-bit mode. */
1415 max_number_of_nops = 2;
252b5132 1416 }
33fef721 1417 else
ccc9c027 1418 {
fbf3f584 1419 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
ccc9c027
L
1420 {
1421 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1422 switch (cpu_arch_tune)
1423 {
1424 case PROCESSOR_UNKNOWN:
1425 /* We use cpu_arch_isa_flags to check if we SHOULD
22109423
L
1426 optimize with nops. */
1427 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
80b8656c 1428 patt = alt_patt;
ccc9c027
L
1429 else
1430 patt = f32_patt;
1431 break;
ccc9c027
L
1432 case PROCESSOR_PENTIUM4:
1433 case PROCESSOR_NOCONA:
ef05d495 1434 case PROCESSOR_CORE:
76bc74dc 1435 case PROCESSOR_CORE2:
bd5295b2 1436 case PROCESSOR_COREI7:
76bc74dc 1437 case PROCESSOR_GENERIC64:
ccc9c027
L
1438 case PROCESSOR_K6:
1439 case PROCESSOR_ATHLON:
1440 case PROCESSOR_K8:
4eed87de 1441 case PROCESSOR_AMDFAM10:
8aedb9fe 1442 case PROCESSOR_BD:
029f3522 1443 case PROCESSOR_ZNVER:
7b458c12 1444 case PROCESSOR_BT:
80b8656c 1445 patt = alt_patt;
ccc9c027 1446 break;
76bc74dc 1447 case PROCESSOR_I386:
ccc9c027
L
1448 case PROCESSOR_I486:
1449 case PROCESSOR_PENTIUM:
2dde1948 1450 case PROCESSOR_PENTIUMPRO:
81486035 1451 case PROCESSOR_IAMCU:
ccc9c027
L
1452 case PROCESSOR_GENERIC32:
1453 patt = f32_patt;
1454 break;
c368d2a8
JB
1455 case PROCESSOR_NONE:
1456 abort ();
4eed87de 1457 }
ccc9c027
L
1458 }
1459 else
1460 {
fbf3f584 1461 switch (fragP->tc_frag_data.tune)
ccc9c027
L
1462 {
1463 case PROCESSOR_UNKNOWN:
e6a14101 1464 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
ccc9c027
L
1465 PROCESSOR_UNKNOWN. */
1466 abort ();
1467 break;
1468
76bc74dc 1469 case PROCESSOR_I386:
ccc9c027
L
1470 case PROCESSOR_I486:
1471 case PROCESSOR_PENTIUM:
81486035 1472 case PROCESSOR_IAMCU:
ccc9c027
L
1473 case PROCESSOR_K6:
1474 case PROCESSOR_ATHLON:
1475 case PROCESSOR_K8:
4eed87de 1476 case PROCESSOR_AMDFAM10:
8aedb9fe 1477 case PROCESSOR_BD:
029f3522 1478 case PROCESSOR_ZNVER:
7b458c12 1479 case PROCESSOR_BT:
ccc9c027
L
1480 case PROCESSOR_GENERIC32:
1481 /* We use cpu_arch_isa_flags to check if we CAN optimize
22109423
L
1482 with nops. */
1483 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
80b8656c 1484 patt = alt_patt;
ccc9c027
L
1485 else
1486 patt = f32_patt;
1487 break;
76bc74dc
L
1488 case PROCESSOR_PENTIUMPRO:
1489 case PROCESSOR_PENTIUM4:
1490 case PROCESSOR_NOCONA:
1491 case PROCESSOR_CORE:
ef05d495 1492 case PROCESSOR_CORE2:
bd5295b2 1493 case PROCESSOR_COREI7:
22109423 1494 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
80b8656c 1495 patt = alt_patt;
ccc9c027
L
1496 else
1497 patt = f32_patt;
1498 break;
1499 case PROCESSOR_GENERIC64:
80b8656c 1500 patt = alt_patt;
ccc9c027 1501 break;
c368d2a8
JB
1502 case PROCESSOR_NONE:
1503 abort ();
4eed87de 1504 }
ccc9c027
L
1505 }
1506
76bc74dc
L
1507 if (patt == f32_patt)
1508 {
3ae729d5
L
1509 max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1510 /* Limit number of NOPs to 2 for older processors. */
1511 max_number_of_nops = 2;
76bc74dc
L
1512 }
1513 else
1514 {
3ae729d5
L
1515 max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1516 /* Limit number of NOPs to 7 for newer processors. */
1517 max_number_of_nops = 7;
1518 }
1519 }
1520
1521 if (limit == 0)
1522 limit = max_single_nop_size;
1523
1524 if (fragP->fr_type == rs_fill_nop)
1525 {
1526 /* Output NOPs for .nop directive. */
1527 if (limit > max_single_nop_size)
1528 {
1529 as_bad_where (fragP->fr_file, fragP->fr_line,
1530 _("invalid single nop size: %d "
1531 "(expect within [0, %d])"),
1532 limit, max_single_nop_size);
1533 return;
1534 }
1535 }
e379e5f3 1536 else if (fragP->fr_type != rs_machine_dependent)
3ae729d5
L
1537 fragP->fr_var = count;
1538
1539 if ((count / max_single_nop_size) > max_number_of_nops)
1540 {
1541 /* Generate jump over NOPs. */
1542 offsetT disp = count - 2;
1543 if (fits_in_imm7 (disp))
1544 {
1545 /* Use "jmp disp8" if possible. */
1546 count = disp;
1547 where[0] = jump_disp8[0];
1548 where[1] = count;
1549 where += 2;
1550 }
1551 else
1552 {
1553 unsigned int size_of_jump;
1554
1555 if (flag_code == CODE_16BIT)
1556 {
1557 where[0] = jump16_disp32[0];
1558 where[1] = jump16_disp32[1];
1559 size_of_jump = 2;
1560 }
1561 else
1562 {
1563 where[0] = jump32_disp32[0];
1564 size_of_jump = 1;
1565 }
1566
1567 count -= size_of_jump + 4;
1568 if (!fits_in_imm31 (count))
1569 {
1570 as_bad_where (fragP->fr_file, fragP->fr_line,
1571 _("jump over nop padding out of range"));
1572 return;
1573 }
1574
1575 md_number_to_chars (where + size_of_jump, count, 4);
1576 where += size_of_jump + 4;
76bc74dc 1577 }
ccc9c027 1578 }
3ae729d5
L
1579
1580 /* Generate multiple NOPs. */
1581 i386_output_nops (where, patt, count, limit);
252b5132
RH
1582}
1583
c6fb90c8 1584static INLINE int
0dfbf9d7 1585operand_type_all_zero (const union i386_operand_type *x)
40fb9820 1586{
0dfbf9d7 1587 switch (ARRAY_SIZE(x->array))
c6fb90c8
L
1588 {
1589 case 3:
0dfbf9d7 1590 if (x->array[2])
c6fb90c8 1591 return 0;
1a0670f3 1592 /* Fall through. */
c6fb90c8 1593 case 2:
0dfbf9d7 1594 if (x->array[1])
c6fb90c8 1595 return 0;
1a0670f3 1596 /* Fall through. */
c6fb90c8 1597 case 1:
0dfbf9d7 1598 return !x->array[0];
c6fb90c8
L
1599 default:
1600 abort ();
1601 }
40fb9820
L
1602}
1603
c6fb90c8 1604static INLINE void
0dfbf9d7 1605operand_type_set (union i386_operand_type *x, unsigned int v)
40fb9820 1606{
0dfbf9d7 1607 switch (ARRAY_SIZE(x->array))
c6fb90c8
L
1608 {
1609 case 3:
0dfbf9d7 1610 x->array[2] = v;
1a0670f3 1611 /* Fall through. */
c6fb90c8 1612 case 2:
0dfbf9d7 1613 x->array[1] = v;
1a0670f3 1614 /* Fall through. */
c6fb90c8 1615 case 1:
0dfbf9d7 1616 x->array[0] = v;
1a0670f3 1617 /* Fall through. */
c6fb90c8
L
1618 break;
1619 default:
1620 abort ();
1621 }
bab6aec1
JB
1622
1623 x->bitfield.class = ClassNone;
75e5731b 1624 x->bitfield.instance = InstanceNone;
c6fb90c8 1625}
40fb9820 1626
c6fb90c8 1627static INLINE int
0dfbf9d7
L
1628operand_type_equal (const union i386_operand_type *x,
1629 const union i386_operand_type *y)
c6fb90c8 1630{
0dfbf9d7 1631 switch (ARRAY_SIZE(x->array))
c6fb90c8
L
1632 {
1633 case 3:
0dfbf9d7 1634 if (x->array[2] != y->array[2])
c6fb90c8 1635 return 0;
1a0670f3 1636 /* Fall through. */
c6fb90c8 1637 case 2:
0dfbf9d7 1638 if (x->array[1] != y->array[1])
c6fb90c8 1639 return 0;
1a0670f3 1640 /* Fall through. */
c6fb90c8 1641 case 1:
0dfbf9d7 1642 return x->array[0] == y->array[0];
c6fb90c8
L
1643 break;
1644 default:
1645 abort ();
1646 }
1647}
40fb9820 1648
0dfbf9d7
L
1649static INLINE int
1650cpu_flags_all_zero (const union i386_cpu_flags *x)
1651{
1652 switch (ARRAY_SIZE(x->array))
1653 {
75f8266a
KL
1654 case 5:
1655 if (x->array[4])
1656 return 0;
1657 /* Fall through. */
53467f57
IT
1658 case 4:
1659 if (x->array[3])
1660 return 0;
1661 /* Fall through. */
0dfbf9d7
L
1662 case 3:
1663 if (x->array[2])
1664 return 0;
1a0670f3 1665 /* Fall through. */
0dfbf9d7
L
1666 case 2:
1667 if (x->array[1])
1668 return 0;
1a0670f3 1669 /* Fall through. */
0dfbf9d7
L
1670 case 1:
1671 return !x->array[0];
1672 default:
1673 abort ();
1674 }
1675}
1676
0dfbf9d7
L
1677static INLINE int
1678cpu_flags_equal (const union i386_cpu_flags *x,
1679 const union i386_cpu_flags *y)
1680{
1681 switch (ARRAY_SIZE(x->array))
1682 {
75f8266a
KL
1683 case 5:
1684 if (x->array[4] != y->array[4])
1685 return 0;
1686 /* Fall through. */
53467f57
IT
1687 case 4:
1688 if (x->array[3] != y->array[3])
1689 return 0;
1690 /* Fall through. */
0dfbf9d7
L
1691 case 3:
1692 if (x->array[2] != y->array[2])
1693 return 0;
1a0670f3 1694 /* Fall through. */
0dfbf9d7
L
1695 case 2:
1696 if (x->array[1] != y->array[1])
1697 return 0;
1a0670f3 1698 /* Fall through. */
0dfbf9d7
L
1699 case 1:
1700 return x->array[0] == y->array[0];
1701 break;
1702 default:
1703 abort ();
1704 }
1705}
c6fb90c8
L
1706
1707static INLINE int
1708cpu_flags_check_cpu64 (i386_cpu_flags f)
1709{
1710 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1711 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
40fb9820
L
1712}
1713
c6fb90c8
L
1714static INLINE i386_cpu_flags
1715cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
40fb9820 1716{
c6fb90c8
L
1717 switch (ARRAY_SIZE (x.array))
1718 {
75f8266a
KL
1719 case 5:
1720 x.array [4] &= y.array [4];
1721 /* Fall through. */
53467f57
IT
1722 case 4:
1723 x.array [3] &= y.array [3];
1724 /* Fall through. */
c6fb90c8
L
1725 case 3:
1726 x.array [2] &= y.array [2];
1a0670f3 1727 /* Fall through. */
c6fb90c8
L
1728 case 2:
1729 x.array [1] &= y.array [1];
1a0670f3 1730 /* Fall through. */
c6fb90c8
L
1731 case 1:
1732 x.array [0] &= y.array [0];
1733 break;
1734 default:
1735 abort ();
1736 }
1737 return x;
1738}
40fb9820 1739
c6fb90c8
L
1740static INLINE i386_cpu_flags
1741cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
40fb9820 1742{
c6fb90c8 1743 switch (ARRAY_SIZE (x.array))
40fb9820 1744 {
75f8266a
KL
1745 case 5:
1746 x.array [4] |= y.array [4];
1747 /* Fall through. */
53467f57
IT
1748 case 4:
1749 x.array [3] |= y.array [3];
1750 /* Fall through. */
c6fb90c8
L
1751 case 3:
1752 x.array [2] |= y.array [2];
1a0670f3 1753 /* Fall through. */
c6fb90c8
L
1754 case 2:
1755 x.array [1] |= y.array [1];
1a0670f3 1756 /* Fall through. */
c6fb90c8
L
1757 case 1:
1758 x.array [0] |= y.array [0];
40fb9820
L
1759 break;
1760 default:
1761 abort ();
1762 }
40fb9820
L
1763 return x;
1764}
1765
309d3373
JB
1766static INLINE i386_cpu_flags
1767cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1768{
1769 switch (ARRAY_SIZE (x.array))
1770 {
75f8266a
KL
1771 case 5:
1772 x.array [4] &= ~y.array [4];
1773 /* Fall through. */
53467f57
IT
1774 case 4:
1775 x.array [3] &= ~y.array [3];
1776 /* Fall through. */
309d3373
JB
1777 case 3:
1778 x.array [2] &= ~y.array [2];
1a0670f3 1779 /* Fall through. */
309d3373
JB
1780 case 2:
1781 x.array [1] &= ~y.array [1];
1a0670f3 1782 /* Fall through. */
309d3373
JB
1783 case 1:
1784 x.array [0] &= ~y.array [0];
1785 break;
1786 default:
1787 abort ();
1788 }
1789 return x;
1790}
1791
6c0946d0
JB
1792static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
1793
c0f3af97
L
1794#define CPU_FLAGS_ARCH_MATCH 0x1
1795#define CPU_FLAGS_64BIT_MATCH 0x2
1796
c0f3af97 1797#define CPU_FLAGS_PERFECT_MATCH \
db12e14e 1798 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
c0f3af97
L
1799
1800/* Return CPU flags match bits. */
3629bb00 1801
40fb9820 1802static int
d3ce72d0 1803cpu_flags_match (const insn_template *t)
40fb9820 1804{
c0f3af97
L
1805 i386_cpu_flags x = t->cpu_flags;
1806 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
40fb9820
L
1807
1808 x.bitfield.cpu64 = 0;
1809 x.bitfield.cpuno64 = 0;
1810
0dfbf9d7 1811 if (cpu_flags_all_zero (&x))
c0f3af97
L
1812 {
1813 /* This instruction is available on all archs. */
db12e14e 1814 match |= CPU_FLAGS_ARCH_MATCH;
c0f3af97 1815 }
3629bb00
L
1816 else
1817 {
c0f3af97 1818 /* This instruction is available only on some archs. */
3629bb00
L
1819 i386_cpu_flags cpu = cpu_arch_flags;
1820
ab592e75
JB
1821 /* AVX512VL is no standalone feature - match it and then strip it. */
1822 if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1823 return match;
1824 x.bitfield.cpuavx512vl = 0;
1825
22c36940
JB
1826 /* AVX and AVX2 present at the same time express an operand size
1827 dependency - strip AVX2 for the purposes here. The operand size
1828 dependent check occurs in check_vecOperands(). */
1829 if (x.bitfield.cpuavx && x.bitfield.cpuavx2)
1830 x.bitfield.cpuavx2 = 0;
1831
3629bb00 1832 cpu = cpu_flags_and (x, cpu);
c0f3af97
L
1833 if (!cpu_flags_all_zero (&cpu))
1834 {
57392598 1835 if (x.bitfield.cpuavx)
a5ff0eb2 1836 {
929f69fa 1837 /* We need to check a few extra flags with AVX. */
b9d49817 1838 if (cpu.bitfield.cpuavx
40d231b4
JB
1839 && (!t->opcode_modifier.sse2avx
1840 || (sse2avx && !i.prefix[DATA_PREFIX]))
b9d49817 1841 && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
929f69fa 1842 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
b9d49817
JB
1843 && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1844 match |= CPU_FLAGS_ARCH_MATCH;
a5ff0eb2 1845 }
929f69fa
JB
1846 else if (x.bitfield.cpuavx512f)
1847 {
1848 /* We need to check a few extra flags with AVX512F. */
1849 if (cpu.bitfield.cpuavx512f
1850 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1851 && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1852 && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1853 match |= CPU_FLAGS_ARCH_MATCH;
1854 }
a5ff0eb2 1855 else
db12e14e 1856 match |= CPU_FLAGS_ARCH_MATCH;
c0f3af97 1857 }
3629bb00 1858 }
c0f3af97 1859 return match;
40fb9820
L
1860}
1861
c6fb90c8
L
1862static INLINE i386_operand_type
1863operand_type_and (i386_operand_type x, i386_operand_type y)
40fb9820 1864{
bab6aec1
JB
1865 if (x.bitfield.class != y.bitfield.class)
1866 x.bitfield.class = ClassNone;
75e5731b
JB
1867 if (x.bitfield.instance != y.bitfield.instance)
1868 x.bitfield.instance = InstanceNone;
bab6aec1 1869
c6fb90c8
L
1870 switch (ARRAY_SIZE (x.array))
1871 {
1872 case 3:
1873 x.array [2] &= y.array [2];
1a0670f3 1874 /* Fall through. */
c6fb90c8
L
1875 case 2:
1876 x.array [1] &= y.array [1];
1a0670f3 1877 /* Fall through. */
c6fb90c8
L
1878 case 1:
1879 x.array [0] &= y.array [0];
1880 break;
1881 default:
1882 abort ();
1883 }
1884 return x;
40fb9820
L
1885}
1886
73053c1f
JB
1887static INLINE i386_operand_type
1888operand_type_and_not (i386_operand_type x, i386_operand_type y)
1889{
bab6aec1 1890 gas_assert (y.bitfield.class == ClassNone);
75e5731b 1891 gas_assert (y.bitfield.instance == InstanceNone);
bab6aec1 1892
73053c1f
JB
1893 switch (ARRAY_SIZE (x.array))
1894 {
1895 case 3:
1896 x.array [2] &= ~y.array [2];
1897 /* Fall through. */
1898 case 2:
1899 x.array [1] &= ~y.array [1];
1900 /* Fall through. */
1901 case 1:
1902 x.array [0] &= ~y.array [0];
1903 break;
1904 default:
1905 abort ();
1906 }
1907 return x;
1908}
1909
c6fb90c8
L
1910static INLINE i386_operand_type
1911operand_type_or (i386_operand_type x, i386_operand_type y)
40fb9820 1912{
bab6aec1
JB
1913 gas_assert (x.bitfield.class == ClassNone ||
1914 y.bitfield.class == ClassNone ||
1915 x.bitfield.class == y.bitfield.class);
75e5731b
JB
1916 gas_assert (x.bitfield.instance == InstanceNone ||
1917 y.bitfield.instance == InstanceNone ||
1918 x.bitfield.instance == y.bitfield.instance);
bab6aec1 1919
c6fb90c8 1920 switch (ARRAY_SIZE (x.array))
40fb9820 1921 {
c6fb90c8
L
1922 case 3:
1923 x.array [2] |= y.array [2];
1a0670f3 1924 /* Fall through. */
c6fb90c8
L
1925 case 2:
1926 x.array [1] |= y.array [1];
1a0670f3 1927 /* Fall through. */
c6fb90c8
L
1928 case 1:
1929 x.array [0] |= y.array [0];
40fb9820
L
1930 break;
1931 default:
1932 abort ();
1933 }
c6fb90c8
L
1934 return x;
1935}
40fb9820 1936
c6fb90c8
L
1937static INLINE i386_operand_type
1938operand_type_xor (i386_operand_type x, i386_operand_type y)
1939{
bab6aec1 1940 gas_assert (y.bitfield.class == ClassNone);
75e5731b 1941 gas_assert (y.bitfield.instance == InstanceNone);
bab6aec1 1942
c6fb90c8
L
1943 switch (ARRAY_SIZE (x.array))
1944 {
1945 case 3:
1946 x.array [2] ^= y.array [2];
1a0670f3 1947 /* Fall through. */
c6fb90c8
L
1948 case 2:
1949 x.array [1] ^= y.array [1];
1a0670f3 1950 /* Fall through. */
c6fb90c8
L
1951 case 1:
1952 x.array [0] ^= y.array [0];
1953 break;
1954 default:
1955 abort ();
1956 }
40fb9820
L
1957 return x;
1958}
1959
05909f23
JB
1960static const i386_operand_type anydisp = {
1961 .bitfield = { .disp8 = 1, .disp16 = 1, .disp32 = 1, .disp64 = 1 }
1962};
40fb9820
L
1963
1964enum operand_type
1965{
1966 reg,
40fb9820
L
1967 imm,
1968 disp,
1969 anymem
1970};
1971
c6fb90c8 1972static INLINE int
40fb9820
L
1973operand_type_check (i386_operand_type t, enum operand_type c)
1974{
1975 switch (c)
1976 {
1977 case reg:
bab6aec1 1978 return t.bitfield.class == Reg;
40fb9820 1979
40fb9820
L
1980 case imm:
1981 return (t.bitfield.imm8
1982 || t.bitfield.imm8s
1983 || t.bitfield.imm16
1984 || t.bitfield.imm32
1985 || t.bitfield.imm32s
1986 || t.bitfield.imm64);
1987
1988 case disp:
1989 return (t.bitfield.disp8
1990 || t.bitfield.disp16
1991 || t.bitfield.disp32
40fb9820
L
1992 || t.bitfield.disp64);
1993
1994 case anymem:
1995 return (t.bitfield.disp8
1996 || t.bitfield.disp16
1997 || t.bitfield.disp32
40fb9820
L
1998 || t.bitfield.disp64
1999 || t.bitfield.baseindex);
2000
2001 default:
2002 abort ();
2003 }
2cfe26b6
AM
2004
2005 return 0;
40fb9820
L
2006}
2007
7a54636a
L
2008/* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2009 between operand GIVEN and opeand WANTED for instruction template T. */
5c07affc
L
2010
2011static INLINE int
7a54636a
L
2012match_operand_size (const insn_template *t, unsigned int wanted,
2013 unsigned int given)
5c07affc 2014{
3ac21baa
JB
2015 return !((i.types[given].bitfield.byte
2016 && !t->operand_types[wanted].bitfield.byte)
2017 || (i.types[given].bitfield.word
2018 && !t->operand_types[wanted].bitfield.word)
2019 || (i.types[given].bitfield.dword
2020 && !t->operand_types[wanted].bitfield.dword)
2021 || (i.types[given].bitfield.qword
9db83a32
JB
2022 && (!t->operand_types[wanted].bitfield.qword
2023 /* Don't allow 64-bit (memory) operands outside of 64-bit
2024 mode, when they're used where a 64-bit GPR could also
2025 be used. Checking is needed for Intel Syntax only. */
2026 || (intel_syntax
2027 && flag_code != CODE_64BIT
2028 && (t->operand_types[wanted].bitfield.class == Reg
2029 || t->operand_types[wanted].bitfield.class == Accum
2030 || t->opcode_modifier.isstring))))
3ac21baa
JB
2031 || (i.types[given].bitfield.tbyte
2032 && !t->operand_types[wanted].bitfield.tbyte));
5c07affc
L
2033}
2034
dd40ce22
L
2035/* Return 1 if there is no conflict in SIMD register between operand
2036 GIVEN and opeand WANTED for instruction template T. */
1b54b8d7
JB
2037
2038static INLINE int
dd40ce22
L
2039match_simd_size (const insn_template *t, unsigned int wanted,
2040 unsigned int given)
1b54b8d7 2041{
3ac21baa
JB
2042 return !((i.types[given].bitfield.xmmword
2043 && !t->operand_types[wanted].bitfield.xmmword)
2044 || (i.types[given].bitfield.ymmword
2045 && !t->operand_types[wanted].bitfield.ymmword)
2046 || (i.types[given].bitfield.zmmword
260cd341
LC
2047 && !t->operand_types[wanted].bitfield.zmmword)
2048 || (i.types[given].bitfield.tmmword
2049 && !t->operand_types[wanted].bitfield.tmmword));
1b54b8d7
JB
2050}
2051
7a54636a
L
2052/* Return 1 if there is no conflict in any size between operand GIVEN
2053 and opeand WANTED for instruction template T. */
5c07affc
L
2054
2055static INLINE int
dd40ce22
L
2056match_mem_size (const insn_template *t, unsigned int wanted,
2057 unsigned int given)
5c07affc 2058{
7a54636a 2059 return (match_operand_size (t, wanted, given)
3ac21baa 2060 && !((i.types[given].bitfield.unspecified
5273a3cd 2061 && !i.broadcast.type
a5748e0d 2062 && !i.broadcast.bytes
3ac21baa
JB
2063 && !t->operand_types[wanted].bitfield.unspecified)
2064 || (i.types[given].bitfield.fword
2065 && !t->operand_types[wanted].bitfield.fword)
1b54b8d7
JB
2066 /* For scalar opcode templates to allow register and memory
2067 operands at the same time, some special casing is needed
d6793fa1
JB
2068 here. Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2069 down-conversion vpmov*. */
3528c362 2070 || ((t->operand_types[wanted].bitfield.class == RegSIMD
bc49bfd8
JB
2071 && t->operand_types[wanted].bitfield.byte
2072 + t->operand_types[wanted].bitfield.word
2073 + t->operand_types[wanted].bitfield.dword
2074 + t->operand_types[wanted].bitfield.qword
2075 > !!t->opcode_modifier.broadcast)
3ac21baa
JB
2076 ? (i.types[given].bitfield.xmmword
2077 || i.types[given].bitfield.ymmword
2078 || i.types[given].bitfield.zmmword)
2079 : !match_simd_size(t, wanted, given))));
5c07affc
L
2080}
2081
3ac21baa
JB
2082/* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2083 operands for instruction template T, and it has MATCH_REVERSE set if there
2084 is no size conflict on any operands for the template with operands reversed
2085 (and the template allows for reversing in the first place). */
5c07affc 2086
3ac21baa
JB
2087#define MATCH_STRAIGHT 1
2088#define MATCH_REVERSE 2
2089
2090static INLINE unsigned int
d3ce72d0 2091operand_size_match (const insn_template *t)
5c07affc 2092{
3ac21baa 2093 unsigned int j, match = MATCH_STRAIGHT;
5c07affc 2094
0cfa3eb3 2095 /* Don't check non-absolute jump instructions. */
5c07affc 2096 if (t->opcode_modifier.jump
0cfa3eb3 2097 && t->opcode_modifier.jump != JUMP_ABSOLUTE)
5c07affc
L
2098 return match;
2099
2100 /* Check memory and accumulator operand size. */
2101 for (j = 0; j < i.operands; j++)
2102 {
3528c362
JB
2103 if (i.types[j].bitfield.class != Reg
2104 && i.types[j].bitfield.class != RegSIMD
255571cd 2105 && t->opcode_modifier.operandconstraint == ANY_SIZE)
5c07affc
L
2106 continue;
2107
bab6aec1 2108 if (t->operand_types[j].bitfield.class == Reg
7a54636a 2109 && !match_operand_size (t, j, j))
5c07affc
L
2110 {
2111 match = 0;
2112 break;
2113 }
2114
3528c362 2115 if (t->operand_types[j].bitfield.class == RegSIMD
3ac21baa 2116 && !match_simd_size (t, j, j))
1b54b8d7
JB
2117 {
2118 match = 0;
2119 break;
2120 }
2121
75e5731b 2122 if (t->operand_types[j].bitfield.instance == Accum
7a54636a 2123 && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
1b54b8d7
JB
2124 {
2125 match = 0;
2126 break;
2127 }
2128
c48dadc9 2129 if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
5c07affc
L
2130 {
2131 match = 0;
2132 break;
2133 }
2134 }
2135
3ac21baa 2136 if (!t->opcode_modifier.d)
7b94647a 2137 return match;
5c07affc
L
2138
2139 /* Check reverse. */
aa180741 2140 gas_assert (i.operands >= 2);
5c07affc 2141
f5eb1d70 2142 for (j = 0; j < i.operands; j++)
5c07affc 2143 {
f5eb1d70
JB
2144 unsigned int given = i.operands - j - 1;
2145
aa180741 2146 /* For FMA4 and XOP insns VEX.W controls just the first two
8bd915b7 2147 register operands. */
aa180741 2148 if (t->cpu_flags.bitfield.cpufma4 || t->cpu_flags.bitfield.cpuxop)
8bd915b7
JB
2149 given = j < 2 ? 1 - j : j;
2150
bab6aec1 2151 if (t->operand_types[j].bitfield.class == Reg
f5eb1d70 2152 && !match_operand_size (t, j, given))
7b94647a 2153 return match;
5c07affc 2154
3528c362 2155 if (t->operand_types[j].bitfield.class == RegSIMD
f5eb1d70 2156 && !match_simd_size (t, j, given))
7b94647a 2157 return match;
dbbc8b7e 2158
75e5731b 2159 if (t->operand_types[j].bitfield.instance == Accum
f5eb1d70
JB
2160 && (!match_operand_size (t, j, given)
2161 || !match_simd_size (t, j, given)))
7b94647a 2162 return match;
dbbc8b7e 2163
f5eb1d70 2164 if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
7b94647a 2165 return match;
5c07affc
L
2166 }
2167
3ac21baa 2168 return match | MATCH_REVERSE;
5c07affc
L
2169}
2170
c6fb90c8 2171static INLINE int
40fb9820
L
2172operand_type_match (i386_operand_type overlap,
2173 i386_operand_type given)
2174{
2175 i386_operand_type temp = overlap;
2176
7d5e4556 2177 temp.bitfield.unspecified = 0;
5c07affc
L
2178 temp.bitfield.byte = 0;
2179 temp.bitfield.word = 0;
2180 temp.bitfield.dword = 0;
2181 temp.bitfield.fword = 0;
2182 temp.bitfield.qword = 0;
2183 temp.bitfield.tbyte = 0;
2184 temp.bitfield.xmmword = 0;
c0f3af97 2185 temp.bitfield.ymmword = 0;
43234a1e 2186 temp.bitfield.zmmword = 0;
260cd341 2187 temp.bitfield.tmmword = 0;
0dfbf9d7 2188 if (operand_type_all_zero (&temp))
891edac4 2189 goto mismatch;
40fb9820 2190
6f2f06be 2191 if (given.bitfield.baseindex == overlap.bitfield.baseindex)
891edac4
L
2192 return 1;
2193
dc1e8a47 2194 mismatch:
a65babc9 2195 i.error = operand_type_mismatch;
891edac4 2196 return 0;
40fb9820
L
2197}
2198
7d5e4556 2199/* If given types g0 and g1 are registers they must be of the same type
10c17abd 2200 unless the expected operand type register overlap is null.
8ee52bcf 2201 Intel syntax sized memory operands are also checked here. */
40fb9820 2202
c6fb90c8 2203static INLINE int
dc821c5f 2204operand_type_register_match (i386_operand_type g0,
40fb9820 2205 i386_operand_type t0,
40fb9820
L
2206 i386_operand_type g1,
2207 i386_operand_type t1)
2208{
bab6aec1 2209 if (g0.bitfield.class != Reg
3528c362 2210 && g0.bitfield.class != RegSIMD
8ee52bcf
JB
2211 && (g0.bitfield.unspecified
2212 || !operand_type_check (g0, anymem)))
40fb9820
L
2213 return 1;
2214
bab6aec1 2215 if (g1.bitfield.class != Reg
3528c362 2216 && g1.bitfield.class != RegSIMD
8ee52bcf
JB
2217 && (g1.bitfield.unspecified
2218 || !operand_type_check (g1, anymem)))
40fb9820
L
2219 return 1;
2220
dc821c5f
JB
2221 if (g0.bitfield.byte == g1.bitfield.byte
2222 && g0.bitfield.word == g1.bitfield.word
2223 && g0.bitfield.dword == g1.bitfield.dword
10c17abd
JB
2224 && g0.bitfield.qword == g1.bitfield.qword
2225 && g0.bitfield.xmmword == g1.bitfield.xmmword
2226 && g0.bitfield.ymmword == g1.bitfield.ymmword
2227 && g0.bitfield.zmmword == g1.bitfield.zmmword)
40fb9820
L
2228 return 1;
2229
c4d09633
JB
2230 /* If expectations overlap in no more than a single size, all is fine. */
2231 g0 = operand_type_and (t0, t1);
2232 if (g0.bitfield.byte
2233 + g0.bitfield.word
2234 + g0.bitfield.dword
2235 + g0.bitfield.qword
2236 + g0.bitfield.xmmword
2237 + g0.bitfield.ymmword
2238 + g0.bitfield.zmmword <= 1)
891edac4
L
2239 return 1;
2240
a65babc9 2241 i.error = register_type_mismatch;
891edac4
L
2242
2243 return 0;
40fb9820
L
2244}
2245
4c692bc7
JB
2246static INLINE unsigned int
2247register_number (const reg_entry *r)
2248{
2249 unsigned int nr = r->reg_num;
2250
2251 if (r->reg_flags & RegRex)
2252 nr += 8;
2253
200cbe0f
L
2254 if (r->reg_flags & RegVRex)
2255 nr += 16;
2256
4c692bc7
JB
2257 return nr;
2258}
2259
252b5132 2260static INLINE unsigned int
40fb9820 2261mode_from_disp_size (i386_operand_type t)
252b5132 2262{
b5014f7a 2263 if (t.bitfield.disp8)
40fb9820
L
2264 return 1;
2265 else if (t.bitfield.disp16
a775efc8 2266 || t.bitfield.disp32)
40fb9820
L
2267 return 2;
2268 else
2269 return 0;
252b5132
RH
2270}
2271
2272static INLINE int
65879393 2273fits_in_signed_byte (addressT num)
252b5132 2274{
65879393 2275 return num + 0x80 <= 0xff;
47926f60 2276}
252b5132
RH
2277
2278static INLINE int
65879393 2279fits_in_unsigned_byte (addressT num)
252b5132 2280{
65879393 2281 return num <= 0xff;
47926f60 2282}
252b5132
RH
2283
2284static INLINE int
65879393 2285fits_in_unsigned_word (addressT num)
252b5132 2286{
65879393 2287 return num <= 0xffff;
47926f60 2288}
252b5132
RH
2289
2290static INLINE int
65879393 2291fits_in_signed_word (addressT num)
252b5132 2292{
65879393 2293 return num + 0x8000 <= 0xffff;
47926f60 2294}
2a962e6d 2295
3e73aa7c 2296static INLINE int
65879393 2297fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
3e73aa7c
JH
2298{
2299#ifndef BFD64
2300 return 1;
2301#else
65879393 2302 return num + 0x80000000 <= 0xffffffff;
3e73aa7c
JH
2303#endif
2304} /* fits_in_signed_long() */
2a962e6d 2305
3e73aa7c 2306static INLINE int
65879393 2307fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
3e73aa7c
JH
2308{
2309#ifndef BFD64
2310 return 1;
2311#else
65879393 2312 return num <= 0xffffffff;
3e73aa7c
JH
2313#endif
2314} /* fits_in_unsigned_long() */
252b5132 2315
a442cac5
JB
2316static INLINE valueT extend_to_32bit_address (addressT num)
2317{
2318#ifdef BFD64
2319 if (fits_in_unsigned_long(num))
2320 return (num ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2321
2322 if (!fits_in_signed_long (num))
2323 return num & 0xffffffff;
2324#endif
2325
2326 return num;
2327}
2328
43234a1e 2329static INLINE int
b5014f7a 2330fits_in_disp8 (offsetT num)
43234a1e
L
2331{
2332 int shift = i.memshift;
2333 unsigned int mask;
2334
2335 if (shift == -1)
2336 abort ();
2337
2338 mask = (1 << shift) - 1;
2339
2340 /* Return 0 if NUM isn't properly aligned. */
2341 if ((num & mask))
2342 return 0;
2343
2344 /* Check if NUM will fit in 8bit after shift. */
2345 return fits_in_signed_byte (num >> shift);
2346}
2347
a683cc34
SP
2348static INLINE int
2349fits_in_imm4 (offsetT num)
2350{
2351 return (num & 0xf) == num;
2352}
2353
40fb9820 2354static i386_operand_type
e3bb37b5 2355smallest_imm_type (offsetT num)
252b5132 2356{
40fb9820 2357 i386_operand_type t;
7ab9ffdd 2358
0dfbf9d7 2359 operand_type_set (&t, 0);
40fb9820
L
2360 t.bitfield.imm64 = 1;
2361
2362 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
e413e4e9
AM
2363 {
2364 /* This code is disabled on the 486 because all the Imm1 forms
2365 in the opcode table are slower on the i486. They're the
2366 versions with the implicitly specified single-position
2367 displacement, which has another syntax if you really want to
2368 use that form. */
40fb9820
L
2369 t.bitfield.imm1 = 1;
2370 t.bitfield.imm8 = 1;
2371 t.bitfield.imm8s = 1;
2372 t.bitfield.imm16 = 1;
2373 t.bitfield.imm32 = 1;
2374 t.bitfield.imm32s = 1;
2375 }
2376 else if (fits_in_signed_byte (num))
2377 {
c34d1cc9
JB
2378 if (fits_in_unsigned_byte (num))
2379 t.bitfield.imm8 = 1;
40fb9820
L
2380 t.bitfield.imm8s = 1;
2381 t.bitfield.imm16 = 1;
2382 t.bitfield.imm32 = 1;
2383 t.bitfield.imm32s = 1;
2384 }
2385 else if (fits_in_unsigned_byte (num))
2386 {
2387 t.bitfield.imm8 = 1;
2388 t.bitfield.imm16 = 1;
2389 t.bitfield.imm32 = 1;
2390 t.bitfield.imm32s = 1;
2391 }
2392 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2393 {
2394 t.bitfield.imm16 = 1;
2395 t.bitfield.imm32 = 1;
2396 t.bitfield.imm32s = 1;
2397 }
2398 else if (fits_in_signed_long (num))
2399 {
2400 t.bitfield.imm32 = 1;
2401 t.bitfield.imm32s = 1;
2402 }
2403 else if (fits_in_unsigned_long (num))
2404 t.bitfield.imm32 = 1;
2405
2406 return t;
47926f60 2407}
252b5132 2408
847f7ad4 2409static offsetT
e3bb37b5 2410offset_in_range (offsetT val, int size)
847f7ad4 2411{
508866be 2412 addressT mask;
ba2adb93 2413
847f7ad4
AM
2414 switch (size)
2415 {
508866be
L
2416 case 1: mask = ((addressT) 1 << 8) - 1; break;
2417 case 2: mask = ((addressT) 1 << 16) - 1; break;
3e73aa7c 2418#ifdef BFD64
64965897 2419 case 4: mask = ((addressT) 1 << 32) - 1; break;
3e73aa7c 2420#endif
64965897 2421 case sizeof (val): return val;
47926f60 2422 default: abort ();
847f7ad4
AM
2423 }
2424
4fe51f7d 2425 if ((val & ~mask) != 0 && (-val & ~mask) != 0)
f493c217
AM
2426 as_warn (_("0x%" PRIx64 " shortened to 0x%" PRIx64),
2427 (uint64_t) val, (uint64_t) (val & mask));
847f7ad4 2428
847f7ad4
AM
2429 return val & mask;
2430}
2431
76d3f746
JB
2432static INLINE const char *insn_name (const insn_template *t)
2433{
5c139202 2434 return &i386_mnemonics[t->mnem_off];
76d3f746
JB
2435}
2436
c32fa91d
L
2437enum PREFIX_GROUP
2438{
2439 PREFIX_EXIST = 0,
2440 PREFIX_LOCK,
2441 PREFIX_REP,
04ef582a 2442 PREFIX_DS,
c32fa91d
L
2443 PREFIX_OTHER
2444};
2445
2446/* Returns
2447 a. PREFIX_EXIST if attempting to add a prefix where one from the
2448 same class already exists.
2449 b. PREFIX_LOCK if lock prefix is added.
2450 c. PREFIX_REP if rep/repne prefix is added.
04ef582a
L
2451 d. PREFIX_DS if ds prefix is added.
2452 e. PREFIX_OTHER if other prefix is added.
c32fa91d
L
2453 */
2454
2455static enum PREFIX_GROUP
e3bb37b5 2456add_prefix (unsigned int prefix)
252b5132 2457{
c32fa91d 2458 enum PREFIX_GROUP ret = PREFIX_OTHER;
b1905489 2459 unsigned int q;
252b5132 2460
29b0f896
AM
2461 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2462 && flag_code == CODE_64BIT)
b1905489 2463 {
161a04f6 2464 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
44846f29
JB
2465 || (i.prefix[REX_PREFIX] & prefix & REX_R)
2466 || (i.prefix[REX_PREFIX] & prefix & REX_X)
2467 || (i.prefix[REX_PREFIX] & prefix & REX_B))
c32fa91d 2468 ret = PREFIX_EXIST;
b1905489
JB
2469 q = REX_PREFIX;
2470 }
3e73aa7c 2471 else
b1905489
JB
2472 {
2473 switch (prefix)
2474 {
2475 default:
2476 abort ();
2477
b1905489 2478 case DS_PREFIX_OPCODE:
04ef582a
L
2479 ret = PREFIX_DS;
2480 /* Fall through. */
2481 case CS_PREFIX_OPCODE:
b1905489
JB
2482 case ES_PREFIX_OPCODE:
2483 case FS_PREFIX_OPCODE:
2484 case GS_PREFIX_OPCODE:
2485 case SS_PREFIX_OPCODE:
2486 q = SEG_PREFIX;
2487 break;
2488
2489 case REPNE_PREFIX_OPCODE:
2490 case REPE_PREFIX_OPCODE:
c32fa91d
L
2491 q = REP_PREFIX;
2492 ret = PREFIX_REP;
2493 break;
2494
b1905489 2495 case LOCK_PREFIX_OPCODE:
c32fa91d
L
2496 q = LOCK_PREFIX;
2497 ret = PREFIX_LOCK;
b1905489
JB
2498 break;
2499
2500 case FWAIT_OPCODE:
2501 q = WAIT_PREFIX;
2502 break;
2503
2504 case ADDR_PREFIX_OPCODE:
2505 q = ADDR_PREFIX;
2506 break;
2507
2508 case DATA_PREFIX_OPCODE:
2509 q = DATA_PREFIX;
2510 break;
2511 }
2512 if (i.prefix[q] != 0)
c32fa91d 2513 ret = PREFIX_EXIST;
b1905489 2514 }
252b5132 2515
b1905489 2516 if (ret)
252b5132 2517 {
b1905489
JB
2518 if (!i.prefix[q])
2519 ++i.prefixes;
2520 i.prefix[q] |= prefix;
252b5132 2521 }
b1905489
JB
2522 else
2523 as_bad (_("same type of prefix used twice"));
252b5132 2524
252b5132
RH
2525 return ret;
2526}
2527
2528static void
78f12dd3 2529update_code_flag (int value, int check)
eecb386c 2530{
78f12dd3
L
2531 PRINTF_LIKE ((*as_error));
2532
1e9cc1c2 2533 flag_code = (enum flag_code) value;
40fb9820
L
2534 if (flag_code == CODE_64BIT)
2535 {
2536 cpu_arch_flags.bitfield.cpu64 = 1;
2537 cpu_arch_flags.bitfield.cpuno64 = 0;
40fb9820
L
2538 }
2539 else
2540 {
2541 cpu_arch_flags.bitfield.cpu64 = 0;
2542 cpu_arch_flags.bitfield.cpuno64 = 1;
40fb9820
L
2543 }
2544 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
3e73aa7c 2545 {
78f12dd3
L
2546 if (check)
2547 as_error = as_fatal;
2548 else
2549 as_error = as_bad;
2550 (*as_error) (_("64bit mode not supported on `%s'."),
2551 cpu_arch_name ? cpu_arch_name : default_arch);
3e73aa7c 2552 }
40fb9820 2553 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
3e73aa7c 2554 {
78f12dd3
L
2555 if (check)
2556 as_error = as_fatal;
2557 else
2558 as_error = as_bad;
2559 (*as_error) (_("32bit mode not supported on `%s'."),
2560 cpu_arch_name ? cpu_arch_name : default_arch);
3e73aa7c 2561 }
eecb386c
AM
2562 stackop_size = '\0';
2563}
2564
78f12dd3
L
2565static void
2566set_code_flag (int value)
2567{
2568 update_code_flag (value, 0);
2569}
2570
eecb386c 2571static void
e3bb37b5 2572set_16bit_gcc_code_flag (int new_code_flag)
252b5132 2573{
1e9cc1c2 2574 flag_code = (enum flag_code) new_code_flag;
40fb9820
L
2575 if (flag_code != CODE_16BIT)
2576 abort ();
2577 cpu_arch_flags.bitfield.cpu64 = 0;
2578 cpu_arch_flags.bitfield.cpuno64 = 1;
9306ca4a 2579 stackop_size = LONG_MNEM_SUFFIX;
252b5132
RH
2580}
2581
2582static void
e3bb37b5 2583set_intel_syntax (int syntax_flag)
252b5132
RH
2584{
2585 /* Find out if register prefixing is specified. */
2586 int ask_naked_reg = 0;
2587
2588 SKIP_WHITESPACE ();
29b0f896 2589 if (!is_end_of_line[(unsigned char) *input_line_pointer])
252b5132 2590 {
d02603dc
NC
2591 char *string;
2592 int e = get_symbol_name (&string);
252b5132 2593
47926f60 2594 if (strcmp (string, "prefix") == 0)
252b5132 2595 ask_naked_reg = 1;
47926f60 2596 else if (strcmp (string, "noprefix") == 0)
252b5132
RH
2597 ask_naked_reg = -1;
2598 else
d0b47220 2599 as_bad (_("bad argument to syntax directive."));
d02603dc 2600 (void) restore_line_pointer (e);
252b5132
RH
2601 }
2602 demand_empty_rest_of_line ();
c3332e24 2603
252b5132
RH
2604 intel_syntax = syntax_flag;
2605
2606 if (ask_naked_reg == 0)
f86103b7
AM
2607 allow_naked_reg = (intel_syntax
2608 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
252b5132
RH
2609 else
2610 allow_naked_reg = (ask_naked_reg < 0);
9306ca4a 2611
ee86248c 2612 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
7ab9ffdd 2613
e4a3b5a4 2614 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
9306ca4a 2615 identifier_chars['$'] = intel_syntax ? '$' : 0;
e4a3b5a4 2616 register_prefix = allow_naked_reg ? "" : "%";
252b5132
RH
2617}
2618
1efbbeb4
L
2619static void
2620set_intel_mnemonic (int mnemonic_flag)
2621{
e1d4d893 2622 intel_mnemonic = mnemonic_flag;
1efbbeb4
L
2623}
2624
db51cc60
L
2625static void
2626set_allow_index_reg (int flag)
2627{
2628 allow_index_reg = flag;
2629}
2630
cb19c032 2631static void
7bab8ab5 2632set_check (int what)
cb19c032 2633{
7bab8ab5
JB
2634 enum check_kind *kind;
2635 const char *str;
2636
2637 if (what)
2638 {
2639 kind = &operand_check;
2640 str = "operand";
2641 }
2642 else
2643 {
2644 kind = &sse_check;
2645 str = "sse";
2646 }
2647
cb19c032
L
2648 SKIP_WHITESPACE ();
2649
2650 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2651 {
d02603dc
NC
2652 char *string;
2653 int e = get_symbol_name (&string);
cb19c032
L
2654
2655 if (strcmp (string, "none") == 0)
7bab8ab5 2656 *kind = check_none;
cb19c032 2657 else if (strcmp (string, "warning") == 0)
7bab8ab5 2658 *kind = check_warning;
cb19c032 2659 else if (strcmp (string, "error") == 0)
7bab8ab5 2660 *kind = check_error;
cb19c032 2661 else
7bab8ab5 2662 as_bad (_("bad argument to %s_check directive."), str);
d02603dc 2663 (void) restore_line_pointer (e);
cb19c032
L
2664 }
2665 else
7bab8ab5 2666 as_bad (_("missing argument for %s_check directive"), str);
cb19c032
L
2667
2668 demand_empty_rest_of_line ();
2669}
2670
8a9036a4
L
2671static void
2672check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
1e9cc1c2 2673 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
8a9036a4
L
2674{
2675#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2676 static const char *arch;
2677
c085ab00 2678 /* Intel MCU is only supported on ELF. */
8a9036a4
L
2679 if (!IS_ELF)
2680 return;
2681
2682 if (!arch)
2683 {
2684 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2685 use default_arch. */
2686 arch = cpu_arch_name;
2687 if (!arch)
2688 arch = default_arch;
2689 }
2690
81486035 2691 /* If we are targeting Intel MCU, we must enable it. */
648d04db
JB
2692 if ((get_elf_backend_data (stdoutput)->elf_machine_code == EM_IAMCU)
2693 == new_flag.bitfield.cpuiamcu)
81486035
L
2694 return;
2695
8a9036a4
L
2696 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2697#endif
2698}
2699
8180707f
JB
2700static void
2701extend_cpu_sub_arch_name (const char *name)
2702{
2703 if (cpu_sub_arch_name)
2704 cpu_sub_arch_name = reconcat (cpu_sub_arch_name, cpu_sub_arch_name,
ae89daec 2705 ".", name, (const char *) NULL);
8180707f 2706 else
ae89daec 2707 cpu_sub_arch_name = concat (".", name, (const char *) NULL);
8180707f
JB
2708}
2709
e413e4e9 2710static void
e3bb37b5 2711set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
e413e4e9 2712{
f68697e8
JB
2713 typedef struct arch_stack_entry
2714 {
2715 const struct arch_stack_entry *prev;
2716 const char *name;
2717 char *sub_name;
2718 i386_cpu_flags flags;
2719 i386_cpu_flags isa_flags;
2720 enum processor_type isa;
2721 enum flag_code flag_code;
2722 char stackop_size;
2723 bool no_cond_jump_promotion;
2724 } arch_stack_entry;
2725 static const arch_stack_entry *arch_stack_top;
2726
47926f60 2727 SKIP_WHITESPACE ();
e413e4e9 2728
29b0f896 2729 if (!is_end_of_line[(unsigned char) *input_line_pointer])
e413e4e9 2730 {
3ce2ebcf
JB
2731 char *s;
2732 int e = get_symbol_name (&s);
2733 const char *string = s;
2734 unsigned int j = 0;
40fb9820 2735 i386_cpu_flags flags;
e413e4e9 2736
3ce2ebcf
JB
2737 if (strcmp (string, "default") == 0)
2738 {
2739 if (strcmp (default_arch, "iamcu") == 0)
2740 string = default_arch;
2741 else
2742 {
2743 static const i386_cpu_flags cpu_unknown_flags = CPU_UNKNOWN_FLAGS;
2744
2745 cpu_arch_name = NULL;
2746 free (cpu_sub_arch_name);
2747 cpu_sub_arch_name = NULL;
2748 cpu_arch_flags = cpu_unknown_flags;
2749 if (flag_code == CODE_64BIT)
2750 {
2751 cpu_arch_flags.bitfield.cpu64 = 1;
2752 cpu_arch_flags.bitfield.cpuno64 = 0;
2753 }
2754 else
2755 {
2756 cpu_arch_flags.bitfield.cpu64 = 0;
2757 cpu_arch_flags.bitfield.cpuno64 = 1;
2758 }
2759 cpu_arch_isa = PROCESSOR_UNKNOWN;
ae89daec 2760 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].enable;
3ce2ebcf
JB
2761 if (!cpu_arch_tune_set)
2762 {
2763 cpu_arch_tune = cpu_arch_isa;
2764 cpu_arch_tune_flags = cpu_arch_isa_flags;
2765 }
2766
2767 j = ARRAY_SIZE (cpu_arch) + 1;
2768 }
2769 }
f68697e8
JB
2770 else if (strcmp (string, "push") == 0)
2771 {
2772 arch_stack_entry *top = XNEW (arch_stack_entry);
2773
2774 top->name = cpu_arch_name;
2775 if (cpu_sub_arch_name)
2776 top->sub_name = xstrdup (cpu_sub_arch_name);
2777 else
2778 top->sub_name = NULL;
2779 top->flags = cpu_arch_flags;
2780 top->isa = cpu_arch_isa;
2781 top->isa_flags = cpu_arch_isa_flags;
2782 top->flag_code = flag_code;
2783 top->stackop_size = stackop_size;
2784 top->no_cond_jump_promotion = no_cond_jump_promotion;
2785
2786 top->prev = arch_stack_top;
2787 arch_stack_top = top;
2788
2789 (void) restore_line_pointer (e);
2790 demand_empty_rest_of_line ();
2791 return;
2792 }
2793 else if (strcmp (string, "pop") == 0)
2794 {
2795 const arch_stack_entry *top = arch_stack_top;
2796
2797 if (!top)
2798 as_bad (_(".arch stack is empty"));
2799 else if (top->flag_code != flag_code
2800 || top->stackop_size != stackop_size)
2801 {
2802 static const unsigned int bits[] = {
2803 [CODE_16BIT] = 16,
2804 [CODE_32BIT] = 32,
2805 [CODE_64BIT] = 64,
2806 };
2807
2808 as_bad (_("this `.arch pop' requires `.code%u%s' to be in effect"),
2809 bits[top->flag_code],
2810 top->stackop_size == LONG_MNEM_SUFFIX ? "gcc" : "");
2811 }
2812 else
2813 {
2814 arch_stack_top = top->prev;
2815
2816 cpu_arch_name = top->name;
2817 free (cpu_sub_arch_name);
2818 cpu_sub_arch_name = top->sub_name;
2819 cpu_arch_flags = top->flags;
2820 cpu_arch_isa = top->isa;
2821 cpu_arch_isa_flags = top->isa_flags;
2822 no_cond_jump_promotion = top->no_cond_jump_promotion;
2823
2824 XDELETE (top);
2825 }
2826
2827 (void) restore_line_pointer (e);
2828 demand_empty_rest_of_line ();
2829 return;
2830 }
3ce2ebcf
JB
2831
2832 for (; j < ARRAY_SIZE (cpu_arch); j++)
e413e4e9 2833 {
ae89daec
JB
2834 if (strcmp (string + (*string == '.'), cpu_arch[j].name) == 0
2835 && (*string == '.') == (cpu_arch[j].type == PROCESSOR_NONE))
e413e4e9 2836 {
5c6af06e
JB
2837 if (*string != '.')
2838 {
ae89daec 2839 check_cpu_arch_compatible (string, cpu_arch[j].enable);
648d04db 2840
91d6fa6a 2841 cpu_arch_name = cpu_arch[j].name;
d92c7521 2842 free (cpu_sub_arch_name);
5c6af06e 2843 cpu_sub_arch_name = NULL;
ae89daec 2844 cpu_arch_flags = cpu_arch[j].enable;
40fb9820
L
2845 if (flag_code == CODE_64BIT)
2846 {
2847 cpu_arch_flags.bitfield.cpu64 = 1;
2848 cpu_arch_flags.bitfield.cpuno64 = 0;
2849 }
2850 else
2851 {
2852 cpu_arch_flags.bitfield.cpu64 = 0;
2853 cpu_arch_flags.bitfield.cpuno64 = 1;
2854 }
91d6fa6a 2855 cpu_arch_isa = cpu_arch[j].type;
ae89daec 2856 cpu_arch_isa_flags = cpu_arch[j].enable;
ccc9c027
L
2857 if (!cpu_arch_tune_set)
2858 {
2859 cpu_arch_tune = cpu_arch_isa;
2860 cpu_arch_tune_flags = cpu_arch_isa_flags;
2861 }
d59a54c2 2862 pre_386_16bit_warned = false;
5c6af06e
JB
2863 break;
2864 }
40fb9820 2865
ae89daec
JB
2866 if (cpu_flags_all_zero (&cpu_arch[j].enable))
2867 continue;
2868
293f5f65 2869 flags = cpu_flags_or (cpu_arch_flags,
ae89daec 2870 cpu_arch[j].enable);
81486035 2871
5b64d091 2872 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
5c6af06e 2873 {
ae89daec 2874 extend_cpu_sub_arch_name (string + 1);
40fb9820 2875 cpu_arch_flags = flags;
a586129e 2876 cpu_arch_isa_flags = flags;
5c6af06e 2877 }
0089dace
L
2878 else
2879 cpu_arch_isa_flags
2880 = cpu_flags_or (cpu_arch_isa_flags,
ae89daec 2881 cpu_arch[j].enable);
d02603dc 2882 (void) restore_line_pointer (e);
5c6af06e
JB
2883 demand_empty_rest_of_line ();
2884 return;
e413e4e9
AM
2885 }
2886 }
293f5f65 2887
ae89daec 2888 if (startswith (string, ".no") && j >= ARRAY_SIZE (cpu_arch))
293f5f65 2889 {
33eaf5de 2890 /* Disable an ISA extension. */
ae89daec
JB
2891 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2892 if (cpu_arch[j].type == PROCESSOR_NONE
2893 && strcmp (string + 3, cpu_arch[j].name) == 0)
293f5f65
L
2894 {
2895 flags = cpu_flags_and_not (cpu_arch_flags,
ae89daec 2896 cpu_arch[j].disable);
293f5f65
L
2897 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2898 {
ae89daec 2899 extend_cpu_sub_arch_name (string + 1);
293f5f65
L
2900 cpu_arch_flags = flags;
2901 cpu_arch_isa_flags = flags;
2902 }
2903 (void) restore_line_pointer (e);
2904 demand_empty_rest_of_line ();
2905 return;
2906 }
293f5f65
L
2907 }
2908
3ce2ebcf 2909 if (j == ARRAY_SIZE (cpu_arch))
e413e4e9
AM
2910 as_bad (_("no such architecture: `%s'"), string);
2911
2912 *input_line_pointer = e;
2913 }
2914 else
2915 as_bad (_("missing cpu architecture"));
2916
fddf5b5b
AM
2917 no_cond_jump_promotion = 0;
2918 if (*input_line_pointer == ','
29b0f896 2919 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
fddf5b5b 2920 {
d02603dc
NC
2921 char *string;
2922 char e;
2923
2924 ++input_line_pointer;
2925 e = get_symbol_name (&string);
fddf5b5b
AM
2926
2927 if (strcmp (string, "nojumps") == 0)
2928 no_cond_jump_promotion = 1;
2929 else if (strcmp (string, "jumps") == 0)
2930 ;
2931 else
2932 as_bad (_("no such architecture modifier: `%s'"), string);
2933
d02603dc 2934 (void) restore_line_pointer (e);
fddf5b5b
AM
2935 }
2936
e413e4e9
AM
2937 demand_empty_rest_of_line ();
2938}
2939
8a9036a4
L
2940enum bfd_architecture
2941i386_arch (void)
2942{
c085ab00 2943 if (cpu_arch_isa == PROCESSOR_IAMCU)
81486035
L
2944 {
2945 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2946 || flag_code == CODE_64BIT)
2947 as_fatal (_("Intel MCU is 32bit ELF only"));
2948 return bfd_arch_iamcu;
2949 }
8a9036a4
L
2950 else
2951 return bfd_arch_i386;
2952}
2953
b9d79e03 2954unsigned long
7016a5d5 2955i386_mach (void)
b9d79e03 2956{
d34049e8 2957 if (startswith (default_arch, "x86_64"))
8a9036a4 2958 {
c085ab00 2959 if (default_arch[6] == '\0')
8a9036a4 2960 return bfd_mach_x86_64;
351f65ca
L
2961 else
2962 return bfd_mach_x64_32;
8a9036a4 2963 }
5197d474
L
2964 else if (!strcmp (default_arch, "i386")
2965 || !strcmp (default_arch, "iamcu"))
81486035
L
2966 {
2967 if (cpu_arch_isa == PROCESSOR_IAMCU)
2968 {
2969 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
2970 as_fatal (_("Intel MCU is 32bit ELF only"));
2971 return bfd_mach_i386_iamcu;
2972 }
2973 else
2974 return bfd_mach_i386_i386;
2975 }
b9d79e03 2976 else
2b5d6a91 2977 as_fatal (_("unknown architecture"));
b9d79e03 2978}
b9d79e03 2979\f
99f0fb12
JB
2980#include "opcodes/i386-tbl.h"
2981
252b5132 2982void
7016a5d5 2983md_begin (void)
252b5132 2984{
86fa6981
L
2985 /* Support pseudo prefixes like {disp32}. */
2986 lex_type ['{'] = LEX_BEGIN_NAME;
2987
47926f60 2988 /* Initialize op_hash hash table. */
629310ab 2989 op_hash = str_htab_create ();
252b5132
RH
2990
2991 {
65f440c8
JB
2992 const insn_template *const *sets = i386_op_sets;
2993 const insn_template *const *end = sets + ARRAY_SIZE (i386_op_sets) - 1;
2994
2995 /* Type checks to compensate for the conversion through void * which
2996 occurs during hash table insertion / lookup. */
eb993861
JB
2997 (void) sizeof (sets == &current_templates->start);
2998 (void) sizeof (end == &current_templates->end);
65f440c8 2999 for (; sets < end; ++sets)
76d3f746
JB
3000 if (str_hash_insert (op_hash, insn_name (*sets), sets, 0))
3001 as_fatal (_("duplicate %s"), insn_name (*sets));
252b5132
RH
3002 }
3003
47926f60 3004 /* Initialize reg_hash hash table. */
629310ab 3005 reg_hash = str_htab_create ();
252b5132 3006 {
29b0f896 3007 const reg_entry *regtab;
c3fe08fa 3008 unsigned int regtab_size = i386_regtab_size;
252b5132 3009
c3fe08fa 3010 for (regtab = i386_regtab; regtab_size--; regtab++)
6225c532 3011 {
6288d05f
JB
3012 switch (regtab->reg_type.bitfield.class)
3013 {
3014 case Reg:
34684862
JB
3015 if (regtab->reg_type.bitfield.dword)
3016 {
3017 if (regtab->reg_type.bitfield.instance == Accum)
3018 reg_eax = regtab;
3019 }
3020 else if (regtab->reg_type.bitfield.tbyte)
6288d05f
JB
3021 {
3022 /* There's no point inserting st(<N>) in the hash table, as
3023 parentheses aren't included in register_chars[] anyway. */
3024 if (regtab->reg_type.bitfield.instance != Accum)
3025 continue;
3026 reg_st0 = regtab;
3027 }
3028 break;
3029
5e042380
JB
3030 case SReg:
3031 switch (regtab->reg_num)
3032 {
3033 case 0: reg_es = regtab; break;
3034 case 2: reg_ss = regtab; break;
3035 case 3: reg_ds = regtab; break;
3036 }
3037 break;
3038
6288d05f
JB
3039 case RegMask:
3040 if (!regtab->reg_num)
3041 reg_k0 = regtab;
3042 break;
3043 }
3044
6225c532
JB
3045 if (str_hash_insert (reg_hash, regtab->reg_name, regtab, 0) != NULL)
3046 as_fatal (_("duplicate %s"), regtab->reg_name);
6225c532 3047 }
252b5132
RH
3048 }
3049
47926f60 3050 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
252b5132 3051 {
29b0f896
AM
3052 int c;
3053 char *p;
252b5132
RH
3054
3055 for (c = 0; c < 256; c++)
3056 {
014fbcda 3057 if (ISDIGIT (c) || ISLOWER (c))
252b5132
RH
3058 {
3059 mnemonic_chars[c] = c;
3060 register_chars[c] = c;
3061 operand_chars[c] = c;
3062 }
3882b010 3063 else if (ISUPPER (c))
252b5132 3064 {
3882b010 3065 mnemonic_chars[c] = TOLOWER (c);
252b5132
RH
3066 register_chars[c] = mnemonic_chars[c];
3067 operand_chars[c] = c;
3068 }
43234a1e 3069 else if (c == '{' || c == '}')
86fa6981
L
3070 {
3071 mnemonic_chars[c] = c;
3072 operand_chars[c] = c;
3073 }
b3983e5f
JB
3074#ifdef SVR4_COMMENT_CHARS
3075 else if (c == '\\' && strchr (i386_comment_chars, '/'))
3076 operand_chars[c] = c;
3077#endif
252b5132 3078
3882b010 3079 if (ISALPHA (c) || ISDIGIT (c))
252b5132
RH
3080 identifier_chars[c] = c;
3081 else if (c >= 128)
3082 {
3083 identifier_chars[c] = c;
3084 operand_chars[c] = c;
3085 }
3086 }
3087
3088#ifdef LEX_AT
3089 identifier_chars['@'] = '@';
32137342
NC
3090#endif
3091#ifdef LEX_QM
3092 identifier_chars['?'] = '?';
3093 operand_chars['?'] = '?';
252b5132 3094#endif
c0f3af97 3095 mnemonic_chars['_'] = '_';
791fe849 3096 mnemonic_chars['-'] = '-';
0003779b 3097 mnemonic_chars['.'] = '.';
252b5132
RH
3098 identifier_chars['_'] = '_';
3099 identifier_chars['.'] = '.';
3100
3101 for (p = operand_special_chars; *p != '\0'; p++)
3102 operand_chars[(unsigned char) *p] = *p;
3103 }
3104
a4447b93
RH
3105 if (flag_code == CODE_64BIT)
3106 {
ca19b261
KT
3107#if defined (OBJ_COFF) && defined (TE_PE)
3108 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3109 ? 32 : 16);
3110#else
a4447b93 3111 x86_dwarf2_return_column = 16;
ca19b261 3112#endif
61ff971f 3113 x86_cie_data_alignment = -8;
b52c4ee4
IB
3114#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3115 x86_sframe_cfa_sp_reg = 7;
3116 x86_sframe_cfa_fp_reg = 6;
3117#endif
a4447b93
RH
3118 }
3119 else
3120 {
3121 x86_dwarf2_return_column = 8;
3122 x86_cie_data_alignment = -4;
3123 }
e379e5f3
L
3124
3125 /* NB: FUSED_JCC_PADDING frag must have sufficient room so that it
3126 can be turned into BRANCH_PREFIX frag. */
3127 if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3128 abort ();
252b5132
RH
3129}
3130
3131void
e3bb37b5 3132i386_print_statistics (FILE *file)
252b5132 3133{
629310ab
ML
3134 htab_print_statistics (file, "i386 opcode", op_hash);
3135 htab_print_statistics (file, "i386 register", reg_hash);
252b5132 3136}
654d6f31
AM
3137
3138void
3139i386_md_end (void)
3140{
3141 htab_delete (op_hash);
3142 htab_delete (reg_hash);
3143}
252b5132 3144\f
252b5132
RH
3145#ifdef DEBUG386
3146
ce8a8b2f 3147/* Debugging routines for md_assemble. */
d3ce72d0 3148static void pte (insn_template *);
40fb9820 3149static void pt (i386_operand_type);
e3bb37b5
L
3150static void pe (expressionS *);
3151static void ps (symbolS *);
252b5132
RH
3152
3153static void
2c703856 3154pi (const char *line, i386_insn *x)
252b5132 3155{
09137c09 3156 unsigned int j;
252b5132
RH
3157
3158 fprintf (stdout, "%s: template ", line);
3159 pte (&x->tm);
09f131f2
JH
3160 fprintf (stdout, " address: base %s index %s scale %x\n",
3161 x->base_reg ? x->base_reg->reg_name : "none",
3162 x->index_reg ? x->index_reg->reg_name : "none",
3163 x->log2_scale_factor);
3164 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
252b5132 3165 x->rm.mode, x->rm.reg, x->rm.regmem);
09f131f2
JH
3166 fprintf (stdout, " sib: base %x index %x scale %x\n",
3167 x->sib.base, x->sib.index, x->sib.scale);
3168 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
161a04f6
L
3169 (x->rex & REX_W) != 0,
3170 (x->rex & REX_R) != 0,
3171 (x->rex & REX_X) != 0,
3172 (x->rex & REX_B) != 0);
09137c09 3173 for (j = 0; j < x->operands; j++)
252b5132 3174 {
09137c09
SP
3175 fprintf (stdout, " #%d: ", j + 1);
3176 pt (x->types[j]);
252b5132 3177 fprintf (stdout, "\n");
bab6aec1 3178 if (x->types[j].bitfield.class == Reg
3528c362
JB
3179 || x->types[j].bitfield.class == RegMMX
3180 || x->types[j].bitfield.class == RegSIMD
dd6b8a0b 3181 || x->types[j].bitfield.class == RegMask
00cee14f 3182 || x->types[j].bitfield.class == SReg
4a5c67ed
JB
3183 || x->types[j].bitfield.class == RegCR
3184 || x->types[j].bitfield.class == RegDR
dd6b8a0b
JB
3185 || x->types[j].bitfield.class == RegTR
3186 || x->types[j].bitfield.class == RegBND)
09137c09
SP
3187 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3188 if (operand_type_check (x->types[j], imm))
3189 pe (x->op[j].imms);
3190 if (operand_type_check (x->types[j], disp))
3191 pe (x->op[j].disps);
252b5132
RH
3192 }
3193}
3194
3195static void
d3ce72d0 3196pte (insn_template *t)
252b5132 3197{
b933fa4b 3198 static const unsigned char opc_pfx[] = { 0, 0x66, 0xf3, 0xf2 };
441f6aca 3199 static const char *const opc_spc[] = {
0cc78721 3200 NULL, "0f", "0f38", "0f3a", NULL, "evexmap5", "evexmap6", NULL,
441f6aca
JB
3201 "XOP08", "XOP09", "XOP0A",
3202 };
09137c09 3203 unsigned int j;
441f6aca 3204
252b5132 3205 fprintf (stdout, " %d operands ", t->operands);
441f6aca
JB
3206 if (opc_pfx[t->opcode_modifier.opcodeprefix])
3207 fprintf (stdout, "pfx %x ", opc_pfx[t->opcode_modifier.opcodeprefix]);
ddb62495
JB
3208 if (opc_spc[t->opcode_space])
3209 fprintf (stdout, "space %s ", opc_spc[t->opcode_space]);
47926f60 3210 fprintf (stdout, "opcode %x ", t->base_opcode);
252b5132
RH
3211 if (t->extension_opcode != None)
3212 fprintf (stdout, "ext %x ", t->extension_opcode);
40fb9820 3213 if (t->opcode_modifier.d)
252b5132 3214 fprintf (stdout, "D");
40fb9820 3215 if (t->opcode_modifier.w)
252b5132
RH
3216 fprintf (stdout, "W");
3217 fprintf (stdout, "\n");
09137c09 3218 for (j = 0; j < t->operands; j++)
252b5132 3219 {
09137c09
SP
3220 fprintf (stdout, " #%d type ", j + 1);
3221 pt (t->operand_types[j]);
252b5132
RH
3222 fprintf (stdout, "\n");
3223 }
3224}
3225
3226static void
e3bb37b5 3227pe (expressionS *e)
252b5132 3228{
24eab124 3229 fprintf (stdout, " operation %d\n", e->X_op);
b8281767
AM
3230 fprintf (stdout, " add_number %" PRId64 " (%" PRIx64 ")\n",
3231 (int64_t) e->X_add_number, (uint64_t) (valueT) e->X_add_number);
252b5132
RH
3232 if (e->X_add_symbol)
3233 {
3234 fprintf (stdout, " add_symbol ");
3235 ps (e->X_add_symbol);
3236 fprintf (stdout, "\n");
3237 }
3238 if (e->X_op_symbol)
3239 {
3240 fprintf (stdout, " op_symbol ");
3241 ps (e->X_op_symbol);
3242 fprintf (stdout, "\n");
3243 }
3244}
3245
3246static void
e3bb37b5 3247ps (symbolS *s)
252b5132
RH
3248{
3249 fprintf (stdout, "%s type %s%s",
3250 S_GET_NAME (s),
3251 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3252 segment_name (S_GET_SEGMENT (s)));
3253}
3254
7b81dfbb 3255static struct type_name
252b5132 3256 {
40fb9820
L
3257 i386_operand_type mask;
3258 const char *name;
252b5132 3259 }
7b81dfbb 3260const type_names[] =
252b5132 3261{
05909f23
JB
3262 { { .bitfield = { .class = Reg, .byte = 1 } }, "r8" },
3263 { { .bitfield = { .class = Reg, .word = 1 } }, "r16" },
3264 { { .bitfield = { .class = Reg, .dword = 1 } }, "r32" },
3265 { { .bitfield = { .class = Reg, .qword = 1 } }, "r64" },
3266 { { .bitfield = { .instance = Accum, .byte = 1 } }, "acc8" },
3267 { { .bitfield = { .instance = Accum, .word = 1 } }, "acc16" },
3268 { { .bitfield = { .instance = Accum, .dword = 1 } }, "acc32" },
3269 { { .bitfield = { .instance = Accum, .qword = 1 } }, "acc64" },
3270 { { .bitfield = { .imm8 = 1 } }, "i8" },
3271 { { .bitfield = { .imm8s = 1 } }, "i8s" },
3272 { { .bitfield = { .imm16 = 1 } }, "i16" },
3273 { { .bitfield = { .imm32 = 1 } }, "i32" },
3274 { { .bitfield = { .imm32s = 1 } }, "i32s" },
3275 { { .bitfield = { .imm64 = 1 } }, "i64" },
3276 { { .bitfield = { .imm1 = 1 } }, "i1" },
3277 { { .bitfield = { .baseindex = 1 } }, "BaseIndex" },
3278 { { .bitfield = { .disp8 = 1 } }, "d8" },
3279 { { .bitfield = { .disp16 = 1 } }, "d16" },
3280 { { .bitfield = { .disp32 = 1 } }, "d32" },
3281 { { .bitfield = { .disp64 = 1 } }, "d64" },
3282 { { .bitfield = { .instance = RegD, .word = 1 } }, "InOutPortReg" },
3283 { { .bitfield = { .instance = RegC, .byte = 1 } }, "ShiftCount" },
3284 { { .bitfield = { .class = RegCR } }, "control reg" },
3285 { { .bitfield = { .class = RegTR } }, "test reg" },
3286 { { .bitfield = { .class = RegDR } }, "debug reg" },
3287 { { .bitfield = { .class = Reg, .tbyte = 1 } }, "FReg" },
3288 { { .bitfield = { .instance = Accum, .tbyte = 1 } }, "FAcc" },
3289 { { .bitfield = { .class = SReg } }, "SReg" },
3290 { { .bitfield = { .class = RegMMX } }, "rMMX" },
3291 { { .bitfield = { .class = RegSIMD, .xmmword = 1 } }, "rXMM" },
3292 { { .bitfield = { .class = RegSIMD, .ymmword = 1 } }, "rYMM" },
3293 { { .bitfield = { .class = RegSIMD, .zmmword = 1 } }, "rZMM" },
3294 { { .bitfield = { .class = RegSIMD, .tmmword = 1 } }, "rTMM" },
3295 { { .bitfield = { .class = RegMask } }, "Mask reg" },
252b5132
RH
3296};
3297
3298static void
40fb9820 3299pt (i386_operand_type t)
252b5132 3300{
40fb9820 3301 unsigned int j;
c6fb90c8 3302 i386_operand_type a;
252b5132 3303
40fb9820 3304 for (j = 0; j < ARRAY_SIZE (type_names); j++)
c6fb90c8
L
3305 {
3306 a = operand_type_and (t, type_names[j].mask);
2c703856 3307 if (operand_type_equal (&a, &type_names[j].mask))
c6fb90c8
L
3308 fprintf (stdout, "%s, ", type_names[j].name);
3309 }
252b5132
RH
3310 fflush (stdout);
3311}
3312
3313#endif /* DEBUG386 */
3314\f
252b5132 3315static bfd_reloc_code_real_type
3956db08 3316reloc (unsigned int size,
64e74474
AM
3317 int pcrel,
3318 int sign,
3319 bfd_reloc_code_real_type other)
252b5132 3320{
47926f60 3321 if (other != NO_RELOC)
3956db08 3322 {
91d6fa6a 3323 reloc_howto_type *rel;
3956db08
JB
3324
3325 if (size == 8)
3326 switch (other)
3327 {
64e74474
AM
3328 case BFD_RELOC_X86_64_GOT32:
3329 return BFD_RELOC_X86_64_GOT64;
3330 break;
553d1284
L
3331 case BFD_RELOC_X86_64_GOTPLT64:
3332 return BFD_RELOC_X86_64_GOTPLT64;
3333 break;
64e74474
AM
3334 case BFD_RELOC_X86_64_PLTOFF64:
3335 return BFD_RELOC_X86_64_PLTOFF64;
3336 break;
3337 case BFD_RELOC_X86_64_GOTPC32:
3338 other = BFD_RELOC_X86_64_GOTPC64;
3339 break;
3340 case BFD_RELOC_X86_64_GOTPCREL:
3341 other = BFD_RELOC_X86_64_GOTPCREL64;
3342 break;
3343 case BFD_RELOC_X86_64_TPOFF32:
3344 other = BFD_RELOC_X86_64_TPOFF64;
3345 break;
3346 case BFD_RELOC_X86_64_DTPOFF32:
3347 other = BFD_RELOC_X86_64_DTPOFF64;
3348 break;
3349 default:
3350 break;
3956db08 3351 }
e05278af 3352
8ce3d284 3353#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8fd4256d
L
3354 if (other == BFD_RELOC_SIZE32)
3355 {
3356 if (size == 8)
1ab668bf 3357 other = BFD_RELOC_SIZE64;
8fd4256d 3358 if (pcrel)
1ab668bf
AM
3359 {
3360 as_bad (_("there are no pc-relative size relocations"));
3361 return NO_RELOC;
3362 }
8fd4256d 3363 }
8ce3d284 3364#endif
8fd4256d 3365
e05278af 3366 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
f2d8a97c 3367 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
e05278af
JB
3368 sign = -1;
3369
91d6fa6a
NC
3370 rel = bfd_reloc_type_lookup (stdoutput, other);
3371 if (!rel)
3956db08 3372 as_bad (_("unknown relocation (%u)"), other);
91d6fa6a 3373 else if (size != bfd_get_reloc_size (rel))
3956db08 3374 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
91d6fa6a 3375 bfd_get_reloc_size (rel),
3956db08 3376 size);
91d6fa6a 3377 else if (pcrel && !rel->pc_relative)
3956db08 3378 as_bad (_("non-pc-relative relocation for pc-relative field"));
91d6fa6a 3379 else if ((rel->complain_on_overflow == complain_overflow_signed
3956db08 3380 && !sign)
91d6fa6a 3381 || (rel->complain_on_overflow == complain_overflow_unsigned
64e74474 3382 && sign > 0))
3956db08
JB
3383 as_bad (_("relocated field and relocation type differ in signedness"));
3384 else
3385 return other;
3386 return NO_RELOC;
3387 }
252b5132
RH
3388
3389 if (pcrel)
3390 {
3e73aa7c 3391 if (!sign)
3956db08 3392 as_bad (_("there are no unsigned pc-relative relocations"));
252b5132
RH
3393 switch (size)
3394 {
3395 case 1: return BFD_RELOC_8_PCREL;
3396 case 2: return BFD_RELOC_16_PCREL;
d258b828 3397 case 4: return BFD_RELOC_32_PCREL;
d6ab8113 3398 case 8: return BFD_RELOC_64_PCREL;
252b5132 3399 }
3956db08 3400 as_bad (_("cannot do %u byte pc-relative relocation"), size);
252b5132
RH
3401 }
3402 else
3403 {
3956db08 3404 if (sign > 0)
e5cb08ac 3405 switch (size)
3e73aa7c
JH
3406 {
3407 case 4: return BFD_RELOC_X86_64_32S;
3408 }
3409 else
3410 switch (size)
3411 {
3412 case 1: return BFD_RELOC_8;
3413 case 2: return BFD_RELOC_16;
3414 case 4: return BFD_RELOC_32;
3415 case 8: return BFD_RELOC_64;
3416 }
3956db08
JB
3417 as_bad (_("cannot do %s %u byte relocation"),
3418 sign > 0 ? "signed" : "unsigned", size);
252b5132
RH
3419 }
3420
0cc9e1d3 3421 return NO_RELOC;
252b5132
RH
3422}
3423
47926f60
KH
3424/* Here we decide which fixups can be adjusted to make them relative to
3425 the beginning of the section instead of the symbol. Basically we need
3426 to make sure that the dynamic relocations are done correctly, so in
3427 some cases we force the original symbol to be used. */
3428
252b5132 3429int
e3bb37b5 3430tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
252b5132 3431{
6d249963 3432#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
718ddfc0 3433 if (!IS_ELF)
31312f95
AM
3434 return 1;
3435
a161fe53
AM
3436 /* Don't adjust pc-relative references to merge sections in 64-bit
3437 mode. */
3438 if (use_rela_relocations
3439 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3440 && fixP->fx_pcrel)
252b5132 3441 return 0;
31312f95 3442
8d01d9a9
AJ
3443 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3444 and changed later by validate_fix. */
3445 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3446 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3447 return 0;
3448
8fd4256d
L
3449 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
3450 for size relocations. */
3451 if (fixP->fx_r_type == BFD_RELOC_SIZE32
3452 || fixP->fx_r_type == BFD_RELOC_SIZE64
3453 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
252b5132 3454 || fixP->fx_r_type == BFD_RELOC_386_GOT32
02a86693 3455 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
13ae64f3
JJ
3456 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3457 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3458 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3459 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
37e55690
JJ
3460 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3461 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
13ae64f3
JJ
3462 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3463 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
67a4f2b7
AO
3464 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3465 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3e73aa7c 3466 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
80b3ee89 3467 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
56ceb5b5
L
3468 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3469 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
bffbf940
JJ
3470 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3471 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3472 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
d6ab8113 3473 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
bffbf940
JJ
3474 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3475 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
d6ab8113
JB
3476 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3477 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
67a4f2b7
AO
3478 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3479 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
252b5132
RH
3480 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3481 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3482 return 0;
31312f95 3483#endif
252b5132
RH
3484 return 1;
3485}
252b5132 3486
a9aabc23
JB
3487static INLINE bool
3488want_disp32 (const insn_template *t)
3489{
3490 return flag_code != CODE_64BIT
3491 || i.prefix[ADDR_PREFIX]
7fc69528 3492 || (t->mnem_off == MN_lea
fe134c65
JB
3493 && (!i.types[1].bitfield.qword
3494 || t->opcode_modifier.size == SIZE32));
a9aabc23
JB
3495}
3496
b4cac588 3497static int
e3bb37b5 3498intel_float_operand (const char *mnemonic)
252b5132 3499{
9306ca4a
JB
3500 /* Note that the value returned is meaningful only for opcodes with (memory)
3501 operands, hence the code here is free to improperly handle opcodes that
3502 have no operands (for better performance and smaller code). */
3503
3504 if (mnemonic[0] != 'f')
3505 return 0; /* non-math */
3506
3507 switch (mnemonic[1])
3508 {
3509 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3510 the fs segment override prefix not currently handled because no
3511 call path can make opcodes without operands get here */
3512 case 'i':
3513 return 2 /* integer op */;
3514 case 'l':
3515 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3516 return 3; /* fldcw/fldenv */
3517 break;
3518 case 'n':
3519 if (mnemonic[2] != 'o' /* fnop */)
3520 return 3; /* non-waiting control op */
3521 break;
3522 case 'r':
3523 if (mnemonic[2] == 's')
3524 return 3; /* frstor/frstpm */
3525 break;
3526 case 's':
3527 if (mnemonic[2] == 'a')
3528 return 3; /* fsave */
3529 if (mnemonic[2] == 't')
3530 {
3531 switch (mnemonic[3])
3532 {
3533 case 'c': /* fstcw */
3534 case 'd': /* fstdw */
3535 case 'e': /* fstenv */
3536 case 's': /* fsts[gw] */
3537 return 3;
3538 }
3539 }
3540 break;
3541 case 'x':
3542 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3543 return 0; /* fxsave/fxrstor are not really math ops */
3544 break;
3545 }
252b5132 3546
9306ca4a 3547 return 1;
252b5132
RH
3548}
3549
9a182d04
JB
3550static INLINE void
3551install_template (const insn_template *t)
3552{
3553 unsigned int l;
3554
3555 i.tm = *t;
3556
3557 /* Note that for pseudo prefixes this produces a length of 1. But for them
3558 the length isn't interesting at all. */
3559 for (l = 1; l < 4; ++l)
3560 if (!(t->base_opcode >> (8 * l)))
3561 break;
3562
3563 i.opcode_length = l;
3564}
3565
c0f3af97
L
3566/* Build the VEX prefix. */
3567
3568static void
d3ce72d0 3569build_vex_prefix (const insn_template *t)
c0f3af97
L
3570{
3571 unsigned int register_specifier;
c0f3af97 3572 unsigned int vector_length;
03751133 3573 unsigned int w;
c0f3af97
L
3574
3575 /* Check register specifier. */
3576 if (i.vex.register_specifier)
43234a1e
L
3577 {
3578 register_specifier =
3579 ~register_number (i.vex.register_specifier) & 0xf;
3580 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3581 }
c0f3af97
L
3582 else
3583 register_specifier = 0xf;
3584
79f0fa25
L
3585 /* Use 2-byte VEX prefix by swapping destination and source operand
3586 if there are more than 1 register operand. */
3587 if (i.reg_operands > 1
3588 && i.vec_encoding != vex_encoding_vex3
86fa6981 3589 && i.dir_encoding == dir_encoding_default
fa99fab2 3590 && i.operands == i.reg_operands
dbbc8b7e 3591 && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
ddb62495 3592 && i.tm.opcode_space == SPACE_0F
dbbc8b7e 3593 && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
fa99fab2
L
3594 && i.rex == REX_B)
3595 {
67748abf 3596 unsigned int xchg;
fa99fab2 3597
67748abf 3598 swap_2_operands (0, i.operands - 1);
fa99fab2 3599
9c2799c2 3600 gas_assert (i.rm.mode == 3);
fa99fab2
L
3601
3602 i.rex = REX_R;
3603 xchg = i.rm.regmem;
3604 i.rm.regmem = i.rm.reg;
3605 i.rm.reg = xchg;
3606
dbbc8b7e
JB
3607 if (i.tm.opcode_modifier.d)
3608 i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
2c735193 3609 ? Opcode_ExtD : Opcode_SIMD_IntD;
dbbc8b7e 3610 else /* Use the next insn. */
9a182d04 3611 install_template (&t[1]);
fa99fab2
L
3612 }
3613
79dec6b7
JB
3614 /* Use 2-byte VEX prefix by swapping commutative source operands if there
3615 are no memory operands and at least 3 register ones. */
3616 if (i.reg_operands >= 3
3617 && i.vec_encoding != vex_encoding_vex3
3618 && i.reg_operands == i.operands - i.imm_operands
3619 && i.tm.opcode_modifier.vex
3620 && i.tm.opcode_modifier.commutative
33740f21
JB
3621 && (i.tm.opcode_modifier.sse2avx
3622 || (optimize > 1 && !i.no_optimize))
79dec6b7
JB
3623 && i.rex == REX_B
3624 && i.vex.register_specifier
3625 && !(i.vex.register_specifier->reg_flags & RegRex))
3626 {
3627 unsigned int xchg = i.operands - i.reg_operands;
79dec6b7 3628
ddb62495 3629 gas_assert (i.tm.opcode_space == SPACE_0F);
79dec6b7
JB
3630 gas_assert (!i.tm.opcode_modifier.sae);
3631 gas_assert (operand_type_equal (&i.types[i.operands - 2],
3632 &i.types[i.operands - 3]));
3633 gas_assert (i.rm.mode == 3);
3634
67748abf 3635 swap_2_operands (xchg, xchg + 1);
79dec6b7
JB
3636
3637 i.rex = 0;
3638 xchg = i.rm.regmem | 8;
3639 i.rm.regmem = ~register_specifier & 0xf;
3640 gas_assert (!(i.rm.regmem & 8));
3641 i.vex.register_specifier += xchg - i.rm.regmem;
3642 register_specifier = ~xchg & 0xf;
3643 }
3644
539f890d
L
3645 if (i.tm.opcode_modifier.vex == VEXScalar)
3646 vector_length = avxscalar;
10c17abd
JB
3647 else if (i.tm.opcode_modifier.vex == VEX256)
3648 vector_length = 1;
539f890d 3649 else
10c17abd 3650 {
56522fc5 3651 unsigned int op;
10c17abd 3652
c7213af9
L
3653 /* Determine vector length from the last multi-length vector
3654 operand. */
10c17abd 3655 vector_length = 0;
56522fc5 3656 for (op = t->operands; op--;)
10c17abd
JB
3657 if (t->operand_types[op].bitfield.xmmword
3658 && t->operand_types[op].bitfield.ymmword
3659 && i.types[op].bitfield.ymmword)
3660 {
3661 vector_length = 1;
3662 break;
3663 }
3664 }
c0f3af97 3665
03751133
L
3666 /* Check the REX.W bit and VEXW. */
3667 if (i.tm.opcode_modifier.vexw == VEXWIG)
3668 w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3669 else if (i.tm.opcode_modifier.vexw)
3670 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3671 else
931d03b7 3672 w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
03751133 3673
c0f3af97 3674 /* Use 2-byte VEX prefix if possible. */
03751133
L
3675 if (w == 0
3676 && i.vec_encoding != vex_encoding_vex3
ddb62495 3677 && i.tm.opcode_space == SPACE_0F
c0f3af97
L
3678 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3679 {
3680 /* 2-byte VEX prefix. */
3681 unsigned int r;
3682
3683 i.vex.length = 2;
3684 i.vex.bytes[0] = 0xc5;
3685
3686 /* Check the REX.R bit. */
3687 r = (i.rex & REX_R) ? 0 : 1;
3688 i.vex.bytes[1] = (r << 7
3689 | register_specifier << 3
3690 | vector_length << 2
35648716 3691 | i.tm.opcode_modifier.opcodeprefix);
c0f3af97
L
3692 }
3693 else
3694 {
3695 /* 3-byte VEX prefix. */
f88c9eb0 3696 i.vex.length = 3;
f88c9eb0 3697
ddb62495 3698 switch (i.tm.opcode_space)
5dd85c99 3699 {
441f6aca
JB
3700 case SPACE_0F:
3701 case SPACE_0F38:
3702 case SPACE_0F3A:
80de6e00 3703 i.vex.bytes[0] = 0xc4;
7f399153 3704 break;
441f6aca
JB
3705 case SPACE_XOP08:
3706 case SPACE_XOP09:
3707 case SPACE_XOP0A:
f88c9eb0 3708 i.vex.bytes[0] = 0x8f;
7f399153
L
3709 break;
3710 default:
3711 abort ();
f88c9eb0 3712 }
c0f3af97 3713
c0f3af97
L
3714 /* The high 3 bits of the second VEX byte are 1's compliment
3715 of RXB bits from REX. */
ddb62495 3716 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | i.tm.opcode_space;
c0f3af97 3717
c0f3af97
L
3718 i.vex.bytes[2] = (w << 7
3719 | register_specifier << 3
3720 | vector_length << 2
35648716 3721 | i.tm.opcode_modifier.opcodeprefix);
c0f3af97
L
3722 }
3723}
3724
5b7c81bd 3725static INLINE bool
e771e7c9
JB
3726is_evex_encoding (const insn_template *t)
3727{
7091c612 3728 return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
e771e7c9 3729 || t->opcode_modifier.broadcast || t->opcode_modifier.masking
a80195f1 3730 || t->opcode_modifier.sae;
e771e7c9
JB
3731}
3732
5b7c81bd 3733static INLINE bool
7a8655d2
JB
3734is_any_vex_encoding (const insn_template *t)
3735{
7b47a312 3736 return t->opcode_modifier.vex || is_evex_encoding (t);
7a8655d2
JB
3737}
3738
a5748e0d
JB
3739static unsigned int
3740get_broadcast_bytes (const insn_template *t, bool diag)
3741{
3742 unsigned int op, bytes;
3743 const i386_operand_type *types;
3744
3745 if (i.broadcast.type)
9b345ce8 3746 return (1 << (t->opcode_modifier.broadcast - 1)) * i.broadcast.type;
a5748e0d
JB
3747
3748 gas_assert (intel_syntax);
3749
3750 for (op = 0; op < t->operands; ++op)
3751 if (t->operand_types[op].bitfield.baseindex)
3752 break;
3753
3754 gas_assert (op < t->operands);
3755
3756 if (t->opcode_modifier.evex
3757 && t->opcode_modifier.evex != EVEXDYN)
3758 switch (i.broadcast.bytes)
3759 {
3760 case 1:
3761 if (t->operand_types[op].bitfield.word)
3762 return 2;
3763 /* Fall through. */
3764 case 2:
3765 if (t->operand_types[op].bitfield.dword)
3766 return 4;
3767 /* Fall through. */
3768 case 4:
3769 if (t->operand_types[op].bitfield.qword)
3770 return 8;
3771 /* Fall through. */
3772 case 8:
3773 if (t->operand_types[op].bitfield.xmmword)
3774 return 16;
3775 if (t->operand_types[op].bitfield.ymmword)
3776 return 32;
3777 if (t->operand_types[op].bitfield.zmmword)
3778 return 64;
3779 /* Fall through. */
3780 default:
3781 abort ();
3782 }
3783
3784 gas_assert (op + 1 < t->operands);
3785
3786 if (t->operand_types[op + 1].bitfield.xmmword
3787 + t->operand_types[op + 1].bitfield.ymmword
3788 + t->operand_types[op + 1].bitfield.zmmword > 1)
3789 {
3790 types = &i.types[op + 1];
3791 diag = false;
3792 }
3793 else /* Ambiguous - guess with a preference to non-AVX512VL forms. */
3794 types = &t->operand_types[op];
3795
3796 if (types->bitfield.zmmword)
3797 bytes = 64;
3798 else if (types->bitfield.ymmword)
3799 bytes = 32;
3800 else
3801 bytes = 16;
3802
3803 if (diag)
3804 as_warn (_("ambiguous broadcast for `%s', using %u-bit form"),
76d3f746 3805 insn_name (t), bytes * 8);
a5748e0d
JB
3806
3807 return bytes;
3808}
3809
43234a1e
L
3810/* Build the EVEX prefix. */
3811
3812static void
3813build_evex_prefix (void)
3814{
35648716 3815 unsigned int register_specifier, w;
43234a1e
L
3816 rex_byte vrex_used = 0;
3817
3818 /* Check register specifier. */
3819 if (i.vex.register_specifier)
3820 {
3821 gas_assert ((i.vrex & REX_X) == 0);
3822
3823 register_specifier = i.vex.register_specifier->reg_num;
3824 if ((i.vex.register_specifier->reg_flags & RegRex))
3825 register_specifier += 8;
3826 /* The upper 16 registers are encoded in the fourth byte of the
3827 EVEX prefix. */
3828 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3829 i.vex.bytes[3] = 0x8;
3830 register_specifier = ~register_specifier & 0xf;
3831 }
3832 else
3833 {
3834 register_specifier = 0xf;
3835
3836 /* Encode upper 16 vector index register in the fourth byte of
3837 the EVEX prefix. */
3838 if (!(i.vrex & REX_X))
3839 i.vex.bytes[3] = 0x8;
3840 else
3841 vrex_used |= REX_X;
3842 }
3843
43234a1e
L
3844 /* 4 byte EVEX prefix. */
3845 i.vex.length = 4;
3846 i.vex.bytes[0] = 0x62;
3847
43234a1e
L
3848 /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3849 bits from REX. */
ddb62495
JB
3850 gas_assert (i.tm.opcode_space >= SPACE_0F);
3851 gas_assert (i.tm.opcode_space <= SPACE_EVEXMAP6);
3852 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | i.tm.opcode_space;
43234a1e
L
3853
3854 /* The fifth bit of the second EVEX byte is 1's compliment of the
3855 REX_R bit in VREX. */
3856 if (!(i.vrex & REX_R))
3857 i.vex.bytes[1] |= 0x10;
3858 else
3859 vrex_used |= REX_R;
3860
3861 if ((i.reg_operands + i.imm_operands) == i.operands)
3862 {
3863 /* When all operands are registers, the REX_X bit in REX is not
3864 used. We reuse it to encode the upper 16 registers, which is
3865 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3866 as 1's compliment. */
3867 if ((i.vrex & REX_B))
3868 {
3869 vrex_used |= REX_B;
3870 i.vex.bytes[1] &= ~0x40;
3871 }
3872 }
3873
3874 /* EVEX instructions shouldn't need the REX prefix. */
3875 i.vrex &= ~vrex_used;
3876 gas_assert (i.vrex == 0);
3877
6865c043
L
3878 /* Check the REX.W bit and VEXW. */
3879 if (i.tm.opcode_modifier.vexw == VEXWIG)
3880 w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3881 else if (i.tm.opcode_modifier.vexw)
3882 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3883 else
931d03b7 3884 w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
43234a1e 3885
43234a1e 3886 /* The third byte of the EVEX prefix. */
35648716
JB
3887 i.vex.bytes[2] = ((w << 7)
3888 | (register_specifier << 3)
3889 | 4 /* Encode the U bit. */
3890 | i.tm.opcode_modifier.opcodeprefix);
43234a1e
L
3891
3892 /* The fourth byte of the EVEX prefix. */
3893 /* The zeroing-masking bit. */
6225c532 3894 if (i.mask.reg && i.mask.zeroing)
43234a1e
L
3895 i.vex.bytes[3] |= 0x80;
3896
3897 /* Don't always set the broadcast bit if there is no RC. */
ca5312a2 3898 if (i.rounding.type == rc_none)
43234a1e
L
3899 {
3900 /* Encode the vector length. */
3901 unsigned int vec_length;
3902
e771e7c9
JB
3903 if (!i.tm.opcode_modifier.evex
3904 || i.tm.opcode_modifier.evex == EVEXDYN)
3905 {
56522fc5 3906 unsigned int op;
e771e7c9 3907
c7213af9
L
3908 /* Determine vector length from the last multi-length vector
3909 operand. */
56522fc5 3910 for (op = i.operands; op--;)
e771e7c9
JB
3911 if (i.tm.operand_types[op].bitfield.xmmword
3912 + i.tm.operand_types[op].bitfield.ymmword
3913 + i.tm.operand_types[op].bitfield.zmmword > 1)
3914 {
3915 if (i.types[op].bitfield.zmmword)
c7213af9
L
3916 {
3917 i.tm.opcode_modifier.evex = EVEX512;
3918 break;
3919 }
e771e7c9 3920 else if (i.types[op].bitfield.ymmword)
c7213af9
L
3921 {
3922 i.tm.opcode_modifier.evex = EVEX256;
3923 break;
3924 }
e771e7c9 3925 else if (i.types[op].bitfield.xmmword)
c7213af9
L
3926 {
3927 i.tm.opcode_modifier.evex = EVEX128;
3928 break;
3929 }
9b345ce8
JB
3930 else if ((i.broadcast.type || i.broadcast.bytes)
3931 && op == i.broadcast.operand)
625cbd7a 3932 {
a5748e0d 3933 switch (get_broadcast_bytes (&i.tm, true))
625cbd7a
JB
3934 {
3935 case 64:
3936 i.tm.opcode_modifier.evex = EVEX512;
3937 break;
3938 case 32:
3939 i.tm.opcode_modifier.evex = EVEX256;
3940 break;
3941 case 16:
3942 i.tm.opcode_modifier.evex = EVEX128;
3943 break;
3944 default:
c7213af9 3945 abort ();
625cbd7a 3946 }
c7213af9 3947 break;
625cbd7a 3948 }
e771e7c9 3949 }
c7213af9 3950
56522fc5 3951 if (op >= MAX_OPERANDS)
c7213af9 3952 abort ();
e771e7c9
JB
3953 }
3954
43234a1e
L
3955 switch (i.tm.opcode_modifier.evex)
3956 {
3957 case EVEXLIG: /* LL' is ignored */
3958 vec_length = evexlig << 5;
3959 break;
3960 case EVEX128:
3961 vec_length = 0 << 5;
3962 break;
3963 case EVEX256:
3964 vec_length = 1 << 5;
3965 break;
3966 case EVEX512:
3967 vec_length = 2 << 5;
3968 break;
3969 default:
3970 abort ();
3971 break;
3972 }
3973 i.vex.bytes[3] |= vec_length;
3974 /* Encode the broadcast bit. */
9b345ce8 3975 if (i.broadcast.type || i.broadcast.bytes)
43234a1e
L
3976 i.vex.bytes[3] |= 0x10;
3977 }
ca5312a2
JB
3978 else if (i.rounding.type != saeonly)
3979 i.vex.bytes[3] |= 0x10 | (i.rounding.type << 5);
43234a1e 3980 else
ca5312a2 3981 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
43234a1e 3982
6225c532
JB
3983 if (i.mask.reg)
3984 i.vex.bytes[3] |= i.mask.reg->reg_num;
43234a1e
L
3985}
3986
65da13b5
L
3987static void
3988process_immext (void)
3989{
3990 expressionS *exp;
3991
c0f3af97 3992 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
65da13b5
L
3993 which is coded in the same place as an 8-bit immediate field
3994 would be. Here we fake an 8-bit immediate operand from the
3995 opcode suffix stored in tm.extension_opcode.
3996
c1e679ec 3997 AVX instructions also use this encoding, for some of
c0f3af97 3998 3 argument instructions. */
65da13b5 3999
43234a1e 4000 gas_assert (i.imm_operands <= 1
7ab9ffdd 4001 && (i.operands <= 2
7a8655d2 4002 || (is_any_vex_encoding (&i.tm)
7ab9ffdd 4003 && i.operands <= 4)));
65da13b5
L
4004
4005 exp = &im_expressions[i.imm_operands++];
4006 i.op[i.operands].imms = exp;
be1643ff 4007 i.types[i.operands].bitfield.imm8 = 1;
65da13b5
L
4008 i.operands++;
4009 exp->X_op = O_constant;
4010 exp->X_add_number = i.tm.extension_opcode;
4011 i.tm.extension_opcode = None;
4012}
4013
42164a71
L
4014
4015static int
4016check_hle (void)
4017{
742732c7 4018 switch (i.tm.opcode_modifier.prefixok)
42164a71
L
4019 {
4020 default:
4021 abort ();
742732c7
JB
4022 case PrefixLock:
4023 case PrefixNone:
4024 case PrefixNoTrack:
4025 case PrefixRep:
165de32a 4026 as_bad (_("invalid instruction `%s' after `%s'"),
76d3f746 4027 insn_name (&i.tm), i.hle_prefix);
42164a71 4028 return 0;
742732c7 4029 case PrefixHLELock:
42164a71
L
4030 if (i.prefix[LOCK_PREFIX])
4031 return 1;
165de32a 4032 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
42164a71 4033 return 0;
742732c7 4034 case PrefixHLEAny:
42164a71 4035 return 1;
742732c7 4036 case PrefixHLERelease:
42164a71
L
4037 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
4038 {
4039 as_bad (_("instruction `%s' after `xacquire' not allowed"),
76d3f746 4040 insn_name (&i.tm));
42164a71
L
4041 return 0;
4042 }
8dc0818e 4043 if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
42164a71
L
4044 {
4045 as_bad (_("memory destination needed for instruction `%s'"
76d3f746 4046 " after `xrelease'"), insn_name (&i.tm));
42164a71
L
4047 return 0;
4048 }
4049 return 1;
4050 }
4051}
4052
c8480b58
L
4053/* Encode aligned vector move as unaligned vector move. */
4054
4055static void
4056encode_with_unaligned_vector_move (void)
4057{
4058 switch (i.tm.base_opcode)
4059 {
b3a9fe6f
L
4060 case 0x28: /* Load instructions. */
4061 case 0x29: /* Store instructions. */
c8480b58 4062 /* movaps/movapd/vmovaps/vmovapd. */
ddb62495 4063 if (i.tm.opcode_space == SPACE_0F
c8480b58 4064 && i.tm.opcode_modifier.opcodeprefix <= PREFIX_0X66)
b3a9fe6f 4065 i.tm.base_opcode = 0x10 | (i.tm.base_opcode & 1);
c8480b58 4066 break;
b3a9fe6f
L
4067 case 0x6f: /* Load instructions. */
4068 case 0x7f: /* Store instructions. */
c8480b58 4069 /* movdqa/vmovdqa/vmovdqa64/vmovdqa32. */
ddb62495 4070 if (i.tm.opcode_space == SPACE_0F
c8480b58
L
4071 && i.tm.opcode_modifier.opcodeprefix == PREFIX_0X66)
4072 i.tm.opcode_modifier.opcodeprefix = PREFIX_0XF3;
4073 break;
4074 default:
4075 break;
4076 }
4077}
4078
b6f8c7c4
L
4079/* Try the shortest encoding by shortening operand size. */
4080
4081static void
4082optimize_encoding (void)
4083{
a0a1771e 4084 unsigned int j;
b6f8c7c4 4085
7fc69528 4086 if (i.tm.mnem_off == MN_lea)
fe134c65
JB
4087 {
4088 /* Optimize: -O:
4089 lea symbol, %rN -> mov $symbol, %rN
4090 lea (%rM), %rN -> mov %rM, %rN
4091 lea (,%rM,1), %rN -> mov %rM, %rN
4092
4093 and in 32-bit mode for 16-bit addressing
4094
4095 lea (%rM), %rN -> movzx %rM, %rN
4096
4097 and in 64-bit mode zap 32-bit addressing in favor of using a
4098 32-bit (or less) destination.
4099 */
4100 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4101 {
4102 if (!i.op[1].regs->reg_type.bitfield.word)
4103 i.tm.opcode_modifier.size = SIZE32;
4104 i.prefix[ADDR_PREFIX] = 0;
4105 }
4106
4107 if (!i.index_reg && !i.base_reg)
4108 {
4109 /* Handle:
4110 lea symbol, %rN -> mov $symbol, %rN
4111 */
4112 if (flag_code == CODE_64BIT)
4113 {
4114 /* Don't transform a relocation to a 16-bit one. */
4115 if (i.op[0].disps
4116 && i.op[0].disps->X_op != O_constant
4117 && i.op[1].regs->reg_type.bitfield.word)
4118 return;
4119
4120 if (!i.op[1].regs->reg_type.bitfield.qword
4121 || i.tm.opcode_modifier.size == SIZE32)
4122 {
4123 i.tm.base_opcode = 0xb8;
4124 i.tm.opcode_modifier.modrm = 0;
4125 if (!i.op[1].regs->reg_type.bitfield.word)
4126 i.types[0].bitfield.imm32 = 1;
4127 else
4128 {
4129 i.tm.opcode_modifier.size = SIZE16;
4130 i.types[0].bitfield.imm16 = 1;
4131 }
4132 }
4133 else
4134 {
4135 /* Subject to further optimization below. */
4136 i.tm.base_opcode = 0xc7;
4137 i.tm.extension_opcode = 0;
4138 i.types[0].bitfield.imm32s = 1;
4139 i.types[0].bitfield.baseindex = 0;
4140 }
4141 }
4142 /* Outside of 64-bit mode address and operand sizes have to match if
4143 a relocation is involved, as otherwise we wouldn't (currently) or
4144 even couldn't express the relocation correctly. */
4145 else if (i.op[0].disps
4146 && i.op[0].disps->X_op != O_constant
4147 && ((!i.prefix[ADDR_PREFIX])
4148 != (flag_code == CODE_32BIT
4149 ? i.op[1].regs->reg_type.bitfield.dword
4150 : i.op[1].regs->reg_type.bitfield.word)))
4151 return;
7772f168
JB
4152 /* In 16-bit mode converting LEA with 16-bit addressing and a 32-bit
4153 destination is going to grow encoding size. */
4154 else if (flag_code == CODE_16BIT
4155 && (optimize <= 1 || optimize_for_space)
4156 && !i.prefix[ADDR_PREFIX]
4157 && i.op[1].regs->reg_type.bitfield.dword)
4158 return;
fe134c65
JB
4159 else
4160 {
4161 i.tm.base_opcode = 0xb8;
4162 i.tm.opcode_modifier.modrm = 0;
4163 if (i.op[1].regs->reg_type.bitfield.dword)
4164 i.types[0].bitfield.imm32 = 1;
4165 else
4166 i.types[0].bitfield.imm16 = 1;
4167
4168 if (i.op[0].disps
4169 && i.op[0].disps->X_op == O_constant
4170 && i.op[1].regs->reg_type.bitfield.dword
60cfa10c
L
4171 /* NB: Add () to !i.prefix[ADDR_PREFIX] to silence
4172 GCC 5. */
4173 && (!i.prefix[ADDR_PREFIX]) != (flag_code == CODE_32BIT))
fe134c65
JB
4174 i.op[0].disps->X_add_number &= 0xffff;
4175 }
4176
4177 i.tm.operand_types[0] = i.types[0];
4178 i.imm_operands = 1;
4179 if (!i.op[0].imms)
4180 {
4181 i.op[0].imms = &im_expressions[0];
4182 i.op[0].imms->X_op = O_absent;
4183 }
4184 }
4185 else if (i.op[0].disps
4186 && (i.op[0].disps->X_op != O_constant
4187 || i.op[0].disps->X_add_number))
4188 return;
4189 else
4190 {
4191 /* Handle:
4192 lea (%rM), %rN -> mov %rM, %rN
4193 lea (,%rM,1), %rN -> mov %rM, %rN
4194 lea (%rM), %rN -> movzx %rM, %rN
4195 */
4196 const reg_entry *addr_reg;
4197
4198 if (!i.index_reg && i.base_reg->reg_num != RegIP)
4199 addr_reg = i.base_reg;
4200 else if (!i.base_reg
4201 && i.index_reg->reg_num != RegIZ
4202 && !i.log2_scale_factor)
4203 addr_reg = i.index_reg;
4204 else
4205 return;
4206
4207 if (addr_reg->reg_type.bitfield.word
4208 && i.op[1].regs->reg_type.bitfield.dword)
4209 {
4210 if (flag_code != CODE_32BIT)
4211 return;
ddb62495 4212 i.tm.opcode_space = SPACE_0F;
fe134c65
JB
4213 i.tm.base_opcode = 0xb7;
4214 }
4215 else
4216 i.tm.base_opcode = 0x8b;
4217
4218 if (addr_reg->reg_type.bitfield.dword
4219 && i.op[1].regs->reg_type.bitfield.qword)
4220 i.tm.opcode_modifier.size = SIZE32;
4221
4222 i.op[0].regs = addr_reg;
4223 i.reg_operands = 2;
4224 }
4225
4226 i.mem_operands = 0;
4227 i.disp_operands = 0;
4228 i.prefix[ADDR_PREFIX] = 0;
4229 i.prefix[SEG_PREFIX] = 0;
4230 i.seg[0] = NULL;
4231 }
4232
b6f8c7c4 4233 if (optimize_for_space
7fc69528 4234 && i.tm.mnem_off == MN_test
b6f8c7c4
L
4235 && i.reg_operands == 1
4236 && i.imm_operands == 1
4237 && !i.types[1].bitfield.byte
4238 && i.op[0].imms->X_op == O_constant
7fc69528 4239 && fits_in_imm7 (i.op[0].imms->X_add_number))
b6f8c7c4
L
4240 {
4241 /* Optimize: -Os:
4242 test $imm7, %r64/%r32/%r16 -> test $imm7, %r8
4243 */
4244 unsigned int base_regnum = i.op[1].regs->reg_num;
4245 if (flag_code == CODE_64BIT || base_regnum < 4)
4246 {
4247 i.types[1].bitfield.byte = 1;
4248 /* Ignore the suffix. */
4249 i.suffix = 0;
7697afb6
JB
4250 /* Convert to byte registers. */
4251 if (i.types[1].bitfield.word)
4252 j = 16;
4253 else if (i.types[1].bitfield.dword)
4254 j = 32;
4255 else
4256 j = 48;
4257 if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4258 j += 8;
4259 i.op[1].regs -= j;
b6f8c7c4
L
4260 }
4261 }
4262 else if (flag_code == CODE_64BIT
ddb62495 4263 && i.tm.opcode_space == SPACE_BASE
d3d50934
L
4264 && ((i.types[1].bitfield.qword
4265 && i.reg_operands == 1
b6f8c7c4
L
4266 && i.imm_operands == 1
4267 && i.op[0].imms->X_op == O_constant
507916b8 4268 && ((i.tm.base_opcode == 0xb8
b6f8c7c4
L
4269 && i.tm.extension_opcode == None
4270 && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4271 || (fits_in_imm31 (i.op[0].imms->X_add_number)
7fc69528 4272 && (i.tm.base_opcode == 0x24
b6f8c7c4
L
4273 || (i.tm.base_opcode == 0x80
4274 && i.tm.extension_opcode == 0x4)
7fc69528
JB
4275 || i.tm.mnem_off == MN_test
4276 || ((i.tm.base_opcode | 1) == 0xc7
b8364fa7
JB
4277 && i.tm.extension_opcode == 0x0)))
4278 || (fits_in_imm7 (i.op[0].imms->X_add_number)
4279 && i.tm.base_opcode == 0x83
4280 && i.tm.extension_opcode == 0x4)))
d3d50934
L
4281 || (i.types[0].bitfield.qword
4282 && ((i.reg_operands == 2
4283 && i.op[0].regs == i.op[1].regs
7fc69528
JB
4284 && (i.tm.mnem_off == MN_xor
4285 || i.tm.mnem_off == MN_sub))
4286 || i.tm.mnem_off == MN_clr))))
b6f8c7c4
L
4287 {
4288 /* Optimize: -O:
4289 andq $imm31, %r64 -> andl $imm31, %r32
b8364fa7 4290 andq $imm7, %r64 -> andl $imm7, %r32
b6f8c7c4
L
4291 testq $imm31, %r64 -> testl $imm31, %r32
4292 xorq %r64, %r64 -> xorl %r32, %r32
4293 subq %r64, %r64 -> subl %r32, %r32
4294 movq $imm31, %r64 -> movl $imm31, %r32
4295 movq $imm32, %r64 -> movl $imm32, %r32
4296 */
04784e33
JB
4297 i.tm.opcode_modifier.size = SIZE32;
4298 if (i.imm_operands)
4299 {
4300 i.types[0].bitfield.imm32 = 1;
4301 i.types[0].bitfield.imm32s = 0;
4302 i.types[0].bitfield.imm64 = 0;
4303 }
4304 else
4305 {
4306 i.types[0].bitfield.dword = 1;
4307 i.types[0].bitfield.qword = 0;
4308 }
4309 i.types[1].bitfield.dword = 1;
4310 i.types[1].bitfield.qword = 0;
7fc69528 4311 if (i.tm.mnem_off == MN_mov || i.tm.mnem_off == MN_lea)
b6f8c7c4
L
4312 {
4313 /* Handle
4314 movq $imm31, %r64 -> movl $imm31, %r32
4315 movq $imm32, %r64 -> movl $imm32, %r32
4316 */
4317 i.tm.operand_types[0].bitfield.imm32 = 1;
4318 i.tm.operand_types[0].bitfield.imm32s = 0;
4319 i.tm.operand_types[0].bitfield.imm64 = 0;
507916b8 4320 if ((i.tm.base_opcode | 1) == 0xc7)
b6f8c7c4
L
4321 {
4322 /* Handle
4323 movq $imm31, %r64 -> movl $imm31, %r32
4324 */
507916b8 4325 i.tm.base_opcode = 0xb8;
b6f8c7c4 4326 i.tm.extension_opcode = None;
507916b8 4327 i.tm.opcode_modifier.w = 0;
b6f8c7c4
L
4328 i.tm.opcode_modifier.modrm = 0;
4329 }
4330 }
4331 }
5641ec01
JB
4332 else if (optimize > 1
4333 && !optimize_for_space
4334 && i.reg_operands == 2
4335 && i.op[0].regs == i.op[1].regs
7fc69528 4336 && (i.tm.mnem_off == MN_and || i.tm.mnem_off == MN_or)
5641ec01
JB
4337 && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4338 {
4339 /* Optimize: -O2:
4340 andb %rN, %rN -> testb %rN, %rN
4341 andw %rN, %rN -> testw %rN, %rN
4342 andq %rN, %rN -> testq %rN, %rN
4343 orb %rN, %rN -> testb %rN, %rN
4344 orw %rN, %rN -> testw %rN, %rN
4345 orq %rN, %rN -> testq %rN, %rN
4346
4347 and outside of 64-bit mode
4348
4349 andl %rN, %rN -> testl %rN, %rN
4350 orl %rN, %rN -> testl %rN, %rN
4351 */
4352 i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4353 }
ad2f4436
JB
4354 else if (i.tm.base_opcode == 0xba
4355 && i.tm.opcode_space == SPACE_0F
4356 && i.reg_operands == 1
4357 && i.op[0].imms->X_op == O_constant
4358 && i.op[0].imms->X_add_number >= 0)
4359 {
4360 /* Optimize: -O:
4361 btw $n, %rN -> btl $n, %rN (outside of 16-bit mode, n < 16)
4362 btq $n, %rN -> btl $n, %rN (in 64-bit mode, n < 32, N < 8)
4363 btl $n, %rN -> btw $n, %rN (in 16-bit mode, n < 16)
4364
4365 With <BT> one of bts, btr, and bts also:
4366 <BT>w $n, %rN -> btl $n, %rN (in 32-bit mode, n < 16)
4367 <BT>l $n, %rN -> btw $n, %rN (in 16-bit mode, n < 16)
4368 */
4369 switch (flag_code)
4370 {
4371 case CODE_64BIT:
4372 if (i.tm.extension_opcode != 4)
4373 break;
4374 if (i.types[1].bitfield.qword
4375 && i.op[0].imms->X_add_number < 32
4376 && !(i.op[1].regs->reg_flags & RegRex))
4377 i.tm.opcode_modifier.size = SIZE32;
4378 /* Fall through. */
4379 case CODE_32BIT:
4380 if (i.types[1].bitfield.word
4381 && i.op[0].imms->X_add_number < 16)
4382 i.tm.opcode_modifier.size = SIZE32;
4383 break;
4384 case CODE_16BIT:
4385 if (i.op[0].imms->X_add_number < 16)
4386 i.tm.opcode_modifier.size = SIZE16;
4387 break;
4388 }
4389 }
99112332 4390 else if (i.reg_operands == 3
b6f8c7c4
L
4391 && i.op[0].regs == i.op[1].regs
4392 && !i.types[2].bitfield.xmmword
4393 && (i.tm.opcode_modifier.vex
6225c532 4394 || ((!i.mask.reg || i.mask.zeroing)
e771e7c9 4395 && is_evex_encoding (&i.tm)
80c34c38 4396 && (i.vec_encoding != vex_encoding_evex
dd22218c 4397 || cpu_arch_isa_flags.bitfield.cpuavx512vl
80c34c38 4398 || i.tm.cpu_flags.bitfield.cpuavx512vl
7091c612 4399 || (i.tm.operand_types[2].bitfield.zmmword
dd22218c 4400 && i.types[2].bitfield.ymmword))))
ddb62495 4401 && i.tm.opcode_space == SPACE_0F
5844ccaa
JB
4402 && ((i.tm.base_opcode | 2) == 0x57
4403 || i.tm.base_opcode == 0xdf
4404 || i.tm.base_opcode == 0xef
4405 || (i.tm.base_opcode | 3) == 0xfb
4406 || i.tm.base_opcode == 0x42
4407 || i.tm.base_opcode == 0x47))
b6f8c7c4 4408 {
99112332 4409 /* Optimize: -O1:
8305403a
L
4410 VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4411 vpsubq and vpsubw:
b6f8c7c4
L
4412 EVEX VOP %zmmM, %zmmM, %zmmN
4413 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
99112332 4414 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
b6f8c7c4
L
4415 EVEX VOP %ymmM, %ymmM, %ymmN
4416 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
99112332 4417 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
b6f8c7c4
L
4418 VEX VOP %ymmM, %ymmM, %ymmN
4419 -> VEX VOP %xmmM, %xmmM, %xmmN
4420 VOP, one of vpandn and vpxor:
4421 VEX VOP %ymmM, %ymmM, %ymmN
4422 -> VEX VOP %xmmM, %xmmM, %xmmN
4423 VOP, one of vpandnd and vpandnq:
4424 EVEX VOP %zmmM, %zmmM, %zmmN
4425 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
99112332 4426 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
b6f8c7c4
L
4427 EVEX VOP %ymmM, %ymmM, %ymmN
4428 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
99112332 4429 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
b6f8c7c4
L
4430 VOP, one of vpxord and vpxorq:
4431 EVEX VOP %zmmM, %zmmM, %zmmN
4432 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
99112332 4433 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
b6f8c7c4
L
4434 EVEX VOP %ymmM, %ymmM, %ymmN
4435 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
99112332 4436 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
1424ad86
JB
4437 VOP, one of kxord and kxorq:
4438 VEX VOP %kM, %kM, %kN
4439 -> VEX kxorw %kM, %kM, %kN
4440 VOP, one of kandnd and kandnq:
4441 VEX VOP %kM, %kM, %kN
4442 -> VEX kandnw %kM, %kM, %kN
b6f8c7c4 4443 */
e771e7c9 4444 if (is_evex_encoding (&i.tm))
b6f8c7c4 4445 {
7b1d7ca1 4446 if (i.vec_encoding != vex_encoding_evex)
b6f8c7c4
L
4447 {
4448 i.tm.opcode_modifier.vex = VEX128;
4449 i.tm.opcode_modifier.vexw = VEXW0;
4450 i.tm.opcode_modifier.evex = 0;
4451 }
7b1d7ca1 4452 else if (optimize > 1)
dd22218c
L
4453 i.tm.opcode_modifier.evex = EVEX128;
4454 else
4455 return;
b6f8c7c4 4456 }
f74a6307 4457 else if (i.tm.operand_types[0].bitfield.class == RegMask)
1424ad86 4458 {
35648716 4459 i.tm.opcode_modifier.opcodeprefix = PREFIX_NONE;
1424ad86
JB
4460 i.tm.opcode_modifier.vexw = VEXW0;
4461 }
b6f8c7c4
L
4462 else
4463 i.tm.opcode_modifier.vex = VEX128;
4464
4465 if (i.tm.opcode_modifier.vex)
4466 for (j = 0; j < 3; j++)
4467 {
4468 i.types[j].bitfield.xmmword = 1;
4469 i.types[j].bitfield.ymmword = 0;
4470 }
4471 }
392a5972 4472 else if (i.vec_encoding != vex_encoding_evex
97ed31ae 4473 && !i.types[0].bitfield.zmmword
392a5972 4474 && !i.types[1].bitfield.zmmword
6225c532 4475 && !i.mask.reg
9b345ce8 4476 && !i.broadcast.type
a5748e0d 4477 && !i.broadcast.bytes
97ed31ae 4478 && is_evex_encoding (&i.tm)
35648716
JB
4479 && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x6f
4480 || (i.tm.base_opcode & ~4) == 0xdb
4481 || (i.tm.base_opcode & ~4) == 0xeb)
97ed31ae
L
4482 && i.tm.extension_opcode == None)
4483 {
4484 /* Optimize: -O1:
4485 VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4486 vmovdqu32 and vmovdqu64:
4487 EVEX VOP %xmmM, %xmmN
4488 -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4489 EVEX VOP %ymmM, %ymmN
4490 -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4491 EVEX VOP %xmmM, mem
4492 -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4493 EVEX VOP %ymmM, mem
4494 -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4495 EVEX VOP mem, %xmmN
4496 -> VEX mvmovdqa|vmovdquem, %xmmN (N < 16)
4497 EVEX VOP mem, %ymmN
4498 -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
a0a1771e
JB
4499 VOP, one of vpand, vpandn, vpor, vpxor:
4500 EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4501 -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4502 EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4503 -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4504 EVEX VOP{d,q} mem, %xmmM, %xmmN
4505 -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4506 EVEX VOP{d,q} mem, %ymmM, %ymmN
4507 -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
97ed31ae 4508 */
a0a1771e 4509 for (j = 0; j < i.operands; j++)
392a5972
L
4510 if (operand_type_check (i.types[j], disp)
4511 && i.op[j].disps->X_op == O_constant)
4512 {
4513 /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4514 has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4515 bytes, we choose EVEX Disp8 over VEX Disp32. */
4516 int evex_disp8, vex_disp8;
4517 unsigned int memshift = i.memshift;
4518 offsetT n = i.op[j].disps->X_add_number;
4519
4520 evex_disp8 = fits_in_disp8 (n);
4521 i.memshift = 0;
4522 vex_disp8 = fits_in_disp8 (n);
4523 if (evex_disp8 != vex_disp8)
4524 {
4525 i.memshift = memshift;
4526 return;
4527 }
4528
4529 i.types[j].bitfield.disp8 = vex_disp8;
4530 break;
4531 }
35648716
JB
4532 if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x6f
4533 && i.tm.opcode_modifier.opcodeprefix == PREFIX_0XF2)
4534 i.tm.opcode_modifier.opcodeprefix = PREFIX_0XF3;
97ed31ae
L
4535 i.tm.opcode_modifier.vex
4536 = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4537 i.tm.opcode_modifier.vexw = VEXW0;
79dec6b7 4538 /* VPAND, VPOR, and VPXOR are commutative. */
35648716 4539 if (i.reg_operands == 3 && i.tm.base_opcode != 0xdf)
79dec6b7 4540 i.tm.opcode_modifier.commutative = 1;
97ed31ae
L
4541 i.tm.opcode_modifier.evex = 0;
4542 i.tm.opcode_modifier.masking = 0;
a0a1771e 4543 i.tm.opcode_modifier.broadcast = 0;
97ed31ae
L
4544 i.tm.opcode_modifier.disp8memshift = 0;
4545 i.memshift = 0;
a0a1771e
JB
4546 if (j < i.operands)
4547 i.types[j].bitfield.disp8
4548 = fits_in_disp8 (i.op[j].disps->X_add_number);
97ed31ae 4549 }
b6f8c7c4
L
4550}
4551
ae531041
L
4552/* Return non-zero for load instruction. */
4553
4554static int
4555load_insn_p (void)
4556{
4557 unsigned int dest;
4558 int any_vex_p = is_any_vex_encoding (&i.tm);
4559 unsigned int base_opcode = i.tm.base_opcode | 1;
4560
4561 if (!any_vex_p)
4562 {
ef07be45
CL
4563 /* Anysize insns: lea, invlpg, clflush, prefetch*, bndmk, bndcl, bndcu,
4564 bndcn, bndstx, bndldx, clflushopt, clwb, cldemote. */
255571cd 4565 if (i.tm.opcode_modifier.operandconstraint == ANY_SIZE)
ae531041
L
4566 return 0;
4567
389d00a5 4568 /* pop. */
6d86a545 4569 if (i.tm.mnem_off == MN_pop)
389d00a5
JB
4570 return 1;
4571 }
4572
ddb62495 4573 if (i.tm.opcode_space == SPACE_BASE)
389d00a5
JB
4574 {
4575 /* popf, popa. */
4576 if (i.tm.base_opcode == 0x9d
a09f656b 4577 || i.tm.base_opcode == 0x61)
ae531041
L
4578 return 1;
4579
4580 /* movs, cmps, lods, scas. */
4581 if ((i.tm.base_opcode | 0xb) == 0xaf)
4582 return 1;
4583
a09f656b 4584 /* outs, xlatb. */
4585 if (base_opcode == 0x6f
4586 || i.tm.base_opcode == 0xd7)
ae531041 4587 return 1;
a09f656b 4588 /* NB: For AMD-specific insns with implicit memory operands,
4589 they're intentionally not covered. */
ae531041
L
4590 }
4591
4592 /* No memory operand. */
4593 if (!i.mem_operands)
4594 return 0;
4595
4596 if (any_vex_p)
4597 {
7fc69528 4598 if (i.tm.mnem_off == MN_vldmxcsr)
ae531041
L
4599 return 1;
4600 }
ddb62495 4601 else if (i.tm.opcode_space == SPACE_BASE)
ae531041
L
4602 {
4603 /* test, not, neg, mul, imul, div, idiv. */
aa4c197d 4604 if (base_opcode == 0xf7 && i.tm.extension_opcode != 1)
ae531041
L
4605 return 1;
4606
4607 /* inc, dec. */
4608 if (base_opcode == 0xff && i.tm.extension_opcode <= 1)
4609 return 1;
4610
4611 /* add, or, adc, sbb, and, sub, xor, cmp. */
4612 if (i.tm.base_opcode >= 0x80 && i.tm.base_opcode <= 0x83)
4613 return 1;
4614
ae531041 4615 /* rol, ror, rcl, rcr, shl/sal, shr, sar. */
aa4c197d 4616 if ((base_opcode == 0xc1 || (base_opcode | 2) == 0xd3)
ae531041
L
4617 && i.tm.extension_opcode != 6)
4618 return 1;
4619
ae531041 4620 /* Check for x87 instructions. */
aa4c197d 4621 if ((base_opcode | 6) == 0xdf)
ae531041
L
4622 {
4623 /* Skip fst, fstp, fstenv, fstcw. */
4624 if (i.tm.base_opcode == 0xd9
4625 && (i.tm.extension_opcode == 2
4626 || i.tm.extension_opcode == 3
4627 || i.tm.extension_opcode == 6
4628 || i.tm.extension_opcode == 7))
4629 return 0;
4630
4631 /* Skip fisttp, fist, fistp, fstp. */
4632 if (i.tm.base_opcode == 0xdb
4633 && (i.tm.extension_opcode == 1
4634 || i.tm.extension_opcode == 2
4635 || i.tm.extension_opcode == 3
4636 || i.tm.extension_opcode == 7))
4637 return 0;
4638
4639 /* Skip fisttp, fst, fstp, fsave, fstsw. */
4640 if (i.tm.base_opcode == 0xdd
4641 && (i.tm.extension_opcode == 1
4642 || i.tm.extension_opcode == 2
4643 || i.tm.extension_opcode == 3
4644 || i.tm.extension_opcode == 6
4645 || i.tm.extension_opcode == 7))
4646 return 0;
4647
4648 /* Skip fisttp, fist, fistp, fbstp, fistp. */
4649 if (i.tm.base_opcode == 0xdf
4650 && (i.tm.extension_opcode == 1
4651 || i.tm.extension_opcode == 2
4652 || i.tm.extension_opcode == 3
4653 || i.tm.extension_opcode == 6
4654 || i.tm.extension_opcode == 7))
4655 return 0;
4656
4657 return 1;
4658 }
4659 }
ddb62495 4660 else if (i.tm.opcode_space == SPACE_0F)
389d00a5
JB
4661 {
4662 /* bt, bts, btr, btc. */
4663 if (i.tm.base_opcode == 0xba
aa4c197d 4664 && (i.tm.extension_opcode | 3) == 7)
389d00a5
JB
4665 return 1;
4666
4667 /* cmpxchg8b, cmpxchg16b, xrstors, vmptrld. */
4668 if (i.tm.base_opcode == 0xc7
4669 && i.tm.opcode_modifier.opcodeprefix == PREFIX_NONE
4670 && (i.tm.extension_opcode == 1 || i.tm.extension_opcode == 3
4671 || i.tm.extension_opcode == 6))
4672 return 1;
4673
4674 /* fxrstor, ldmxcsr, xrstor. */
4675 if (i.tm.base_opcode == 0xae
4676 && (i.tm.extension_opcode == 1
4677 || i.tm.extension_opcode == 2
4678 || i.tm.extension_opcode == 5))
4679 return 1;
4680
4681 /* lgdt, lidt, lmsw. */
4682 if (i.tm.base_opcode == 0x01
4683 && (i.tm.extension_opcode == 2
4684 || i.tm.extension_opcode == 3
4685 || i.tm.extension_opcode == 6))
4686 return 1;
4687 }
ae531041
L
4688
4689 dest = i.operands - 1;
4690
4691 /* Check fake imm8 operand and 3 source operands. */
4692 if ((i.tm.opcode_modifier.immext
aa180741 4693 || i.reg_operands + i.mem_operands == 4)
ae531041
L
4694 && i.types[dest].bitfield.imm8)
4695 dest--;
4696
389d00a5 4697 /* add, or, adc, sbb, and, sub, xor, cmp, test, xchg. */
ddb62495 4698 if (i.tm.opcode_space == SPACE_BASE
aa4c197d 4699 && ((base_opcode | 0x38) == 0x39
389d00a5
JB
4700 || (base_opcode | 2) == 0x87))
4701 return 1;
4702
7fc69528 4703 if (i.tm.mnem_off == MN_xadd)
ae531041
L
4704 return 1;
4705
4706 /* Check for load instruction. */
4707 return (i.types[dest].bitfield.class != ClassNone
4708 || i.types[dest].bitfield.instance == Accum);
4709}
4710
4711/* Output lfence, 0xfaee8, after instruction. */
4712
4713static void
4714insert_lfence_after (void)
4715{
4716 if (lfence_after_load && load_insn_p ())
4717 {
a09f656b 4718 /* There are also two REP string instructions that require
4719 special treatment. Specifically, the compare string (CMPS)
4720 and scan string (SCAS) instructions set EFLAGS in a manner
4721 that depends on the data being compared/scanned. When used
4722 with a REP prefix, the number of iterations may therefore
4723 vary depending on this data. If the data is a program secret
4724 chosen by the adversary using an LVI method,
4725 then this data-dependent behavior may leak some aspect
4726 of the secret. */
aa4c197d 4727 if (((i.tm.base_opcode | 0x9) == 0xaf)
a09f656b 4728 && i.prefix[REP_PREFIX])
4729 {
4730 as_warn (_("`%s` changes flags which would affect control flow behavior"),
76d3f746 4731 insn_name (&i.tm));
a09f656b 4732 }
ae531041
L
4733 char *p = frag_more (3);
4734 *p++ = 0xf;
4735 *p++ = 0xae;
4736 *p = 0xe8;
4737 }
4738}
4739
4740/* Output lfence, 0xfaee8, before instruction. */
4741
4742static void
4743insert_lfence_before (void)
4744{
4745 char *p;
4746
ddb62495 4747 if (i.tm.opcode_space != SPACE_BASE)
ae531041
L
4748 return;
4749
4750 if (i.tm.base_opcode == 0xff
4751 && (i.tm.extension_opcode == 2 || i.tm.extension_opcode == 4))
4752 {
4753 /* Insert lfence before indirect branch if needed. */
4754
4755 if (lfence_before_indirect_branch == lfence_branch_none)
4756 return;
4757
4758 if (i.operands != 1)
4759 abort ();
4760
4761 if (i.reg_operands == 1)
4762 {
4763 /* Indirect branch via register. Don't insert lfence with
4764 -mlfence-after-load=yes. */
4765 if (lfence_after_load
4766 || lfence_before_indirect_branch == lfence_branch_memory)
4767 return;
4768 }
4769 else if (i.mem_operands == 1
4770 && lfence_before_indirect_branch != lfence_branch_register)
4771 {
4772 as_warn (_("indirect `%s` with memory operand should be avoided"),
76d3f746 4773 insn_name (&i.tm));
ae531041
L
4774 return;
4775 }
4776 else
4777 return;
4778
4779 if (last_insn.kind != last_insn_other
4780 && last_insn.seg == now_seg)
4781 {
4782 as_warn_where (last_insn.file, last_insn.line,
4783 _("`%s` skips -mlfence-before-indirect-branch on `%s`"),
76d3f746 4784 last_insn.name, insn_name (&i.tm));
ae531041
L
4785 return;
4786 }
4787
4788 p = frag_more (3);
4789 *p++ = 0xf;
4790 *p++ = 0xae;
4791 *p = 0xe8;
4792 return;
4793 }
4794
503648e4 4795 /* Output or/not/shl and lfence before near ret. */
ae531041 4796 if (lfence_before_ret != lfence_before_ret_none
aa4c197d 4797 && (i.tm.base_opcode | 1) == 0xc3)
ae531041
L
4798 {
4799 if (last_insn.kind != last_insn_other
4800 && last_insn.seg == now_seg)
4801 {
4802 as_warn_where (last_insn.file, last_insn.line,
4803 _("`%s` skips -mlfence-before-ret on `%s`"),
76d3f746 4804 last_insn.name, insn_name (&i.tm));
ae531041
L
4805 return;
4806 }
a09f656b 4807
a09f656b 4808 /* Near ret ingore operand size override under CPU64. */
503648e4 4809 char prefix = flag_code == CODE_64BIT
4810 ? 0x48
4811 : i.prefix[DATA_PREFIX] ? 0x66 : 0x0;
a09f656b 4812
4813 if (lfence_before_ret == lfence_before_ret_not)
4814 {
4815 /* not: 0xf71424, may add prefix
4816 for operand size override or 64-bit code. */
4817 p = frag_more ((prefix ? 2 : 0) + 6 + 3);
4818 if (prefix)
4819 *p++ = prefix;
ae531041
L
4820 *p++ = 0xf7;
4821 *p++ = 0x14;
4822 *p++ = 0x24;
a09f656b 4823 if (prefix)
4824 *p++ = prefix;
ae531041
L
4825 *p++ = 0xf7;
4826 *p++ = 0x14;
4827 *p++ = 0x24;
4828 }
a09f656b 4829 else
4830 {
4831 p = frag_more ((prefix ? 1 : 0) + 4 + 3);
4832 if (prefix)
4833 *p++ = prefix;
4834 if (lfence_before_ret == lfence_before_ret_or)
4835 {
4836 /* or: 0x830c2400, may add prefix
4837 for operand size override or 64-bit code. */
4838 *p++ = 0x83;
4839 *p++ = 0x0c;
4840 }
4841 else
4842 {
4843 /* shl: 0xc1242400, may add prefix
4844 for operand size override or 64-bit code. */
4845 *p++ = 0xc1;
4846 *p++ = 0x24;
4847 }
4848
4849 *p++ = 0x24;
4850 *p++ = 0x0;
4851 }
4852
ae531041
L
4853 *p++ = 0xf;
4854 *p++ = 0xae;
4855 *p = 0xe8;
4856 }
4857}
4858
04784e33
JB
4859/* Helper for md_assemble() to decide whether to prepare for a possible 2nd
4860 parsing pass. Instead of introducing a rarely use new insn attribute this
4861 utilizes a common pattern between affected templates. It is deemed
4862 acceptable that this will lead to unnecessary pass 2 preparations in a
4863 limited set of cases. */
4864static INLINE bool may_need_pass2 (const insn_template *t)
4865{
4866 return t->opcode_modifier.sse2avx
4867 /* Note that all SSE2AVX templates have at least one operand. */
a28fedbc 4868 ? t->operand_types[t->operands - 1].bitfield.class == RegSIMD
ddb62495 4869 : (t->opcode_space == SPACE_0F
a28fedbc 4870 && (t->base_opcode | 1) == 0xbf)
ddb62495 4871 || (t->opcode_space == SPACE_BASE
a28fedbc 4872 && t->base_opcode == 0x63);
04784e33
JB
4873}
4874
252b5132
RH
4875/* This is the guts of the machine-dependent assembler. LINE points to a
4876 machine dependent instruction. This function is supposed to emit
4877 the frags/bytes it assembles to. */
4878
4879void
65da13b5 4880md_assemble (char *line)
252b5132 4881{
40fb9820 4882 unsigned int j;
9db83a32 4883 char mnemonic[MAX_MNEM_SIZE], mnem_suffix = 0, *copy = NULL;
04784e33
JB
4884 const char *end, *pass1_mnem = NULL;
4885 enum i386_error pass1_err = 0;
d3ce72d0 4886 const insn_template *t;
252b5132 4887
47926f60 4888 /* Initialize globals. */
04784e33
JB
4889 current_templates = NULL;
4890 retry:
252b5132 4891 memset (&i, '\0', sizeof (i));
ca5312a2 4892 i.rounding.type = rc_none;
252b5132 4893 for (j = 0; j < MAX_OPERANDS; j++)
1ae12ab7 4894 i.reloc[j] = NO_RELOC;
252b5132
RH
4895 memset (disp_expressions, '\0', sizeof (disp_expressions));
4896 memset (im_expressions, '\0', sizeof (im_expressions));
ce8a8b2f 4897 save_stack_p = save_stack;
252b5132
RH
4898
4899 /* First parse an instruction mnemonic & call i386_operand for the operands.
4900 We assume that the scrubber has arranged it so that line[0] is the valid
47926f60 4901 start of a (possibly prefixed) mnemonic. */
252b5132 4902
5317ad2c
JB
4903 end = parse_insn (line, mnemonic);
4904 if (end == NULL)
04784e33
JB
4905 {
4906 if (pass1_mnem != NULL)
4907 goto match_error;
9db83a32
JB
4908 if (i.error != no_error)
4909 {
4910 gas_assert (current_templates != NULL);
4911 if (may_need_pass2 (current_templates->start) && !i.suffix)
4912 goto no_match;
4913 /* No point in trying a 2nd pass - it'll only find the same suffix
4914 again. */
4915 mnem_suffix = i.suffix;
4916 goto match_error;
4917 }
04784e33
JB
4918 return;
4919 }
6d86a545
JB
4920 t = current_templates->start;
4921 if (may_need_pass2 (t))
04784e33
JB
4922 {
4923 /* Make a copy of the full line in case we need to retry. */
4924 copy = xstrdup (line);
4925 }
5317ad2c 4926 line += end - line;
83b16ac6 4927 mnem_suffix = i.suffix;
252b5132 4928
29b0f896 4929 line = parse_operands (line, mnemonic);
ee86248c 4930 this_operand = -1;
29b0f896 4931 if (line == NULL)
04784e33
JB
4932 {
4933 free (copy);
4934 return;
4935 }
252b5132 4936
29b0f896
AM
4937 /* Now we've parsed the mnemonic into a set of templates, and have the
4938 operands at hand. */
4939
b630c145 4940 /* All Intel opcodes have reversed operands except for "bound", "enter",
c0e54661 4941 "invlpg*", "monitor*", "mwait*", "tpause", "umwait", "pvalidate",
b0e8fa7f
TJ
4942 "rmpadjust", "rmpupdate", and "rmpquery". We also don't reverse
4943 intersegment "jmp" and "call" instructions with 2 immediate operands so
4944 that the immediate segment precedes the offset consistently in Intel and
4945 AT&T modes. */
4d456e3d
L
4946 if (intel_syntax
4947 && i.operands > 1
6d86a545
JB
4948 && (t->mnem_off != MN_bound)
4949 && !startswith (mnemonic, "invlpg")
d34049e8
ML
4950 && !startswith (mnemonic, "monitor")
4951 && !startswith (mnemonic, "mwait")
6d86a545 4952 && (t->mnem_off != MN_pvalidate)
d34049e8 4953 && !startswith (mnemonic, "rmp")
6d86a545
JB
4954 && (t->mnem_off != MN_tpause)
4955 && (t->mnem_off != MN_umwait)
47c0279b
JB
4956 && !(i.operands == 2
4957 && operand_type_check (i.types[0], imm)
40fb9820 4958 && operand_type_check (i.types[1], imm)))
29b0f896
AM
4959 swap_operands ();
4960
ec56d5c0
JB
4961 /* The order of the immediates should be reversed
4962 for 2 immediates extrq and insertq instructions */
4963 if (i.imm_operands == 2
6d86a545 4964 && (t->mnem_off == MN_extrq || t->mnem_off == MN_insertq))
ec56d5c0
JB
4965 swap_2_operands (0, 1);
4966
29b0f896
AM
4967 if (i.imm_operands)
4968 optimize_imm ();
4969
0de704b9
JB
4970 if (i.disp_operands && !optimize_disp (t))
4971 return;
29b0f896
AM
4972
4973 /* Next, we find a template that matches the given insn,
4974 making sure the overlap of the given operands types is consistent
4975 with the template operand types. */
252b5132 4976
83b16ac6 4977 if (!(t = match_template (mnem_suffix)))
04784e33
JB
4978 {
4979 const char *err_msg;
4980
4981 if (copy && !mnem_suffix)
4982 {
4983 line = copy;
4984 copy = NULL;
9db83a32 4985 no_match:
04784e33 4986 pass1_err = i.error;
76d3f746 4987 pass1_mnem = insn_name (current_templates->start);
04784e33
JB
4988 goto retry;
4989 }
9db83a32
JB
4990
4991 /* If a non-/only-64bit template (group) was found in pass 1, and if
4992 _some_ template (group) was found in pass 2, squash pass 1's
4993 error. */
4994 if (pass1_err == unsupported_64bit)
4995 pass1_mnem = NULL;
4996
04784e33 4997 match_error:
9db83a32
JB
4998 free (copy);
4999
04784e33
JB
5000 switch (pass1_mnem ? pass1_err : i.error)
5001 {
5002 default:
5003 abort ();
5004 case operand_size_mismatch:
5005 err_msg = _("operand size mismatch");
5006 break;
5007 case operand_type_mismatch:
5008 err_msg = _("operand type mismatch");
5009 break;
5010 case register_type_mismatch:
5011 err_msg = _("register type mismatch");
5012 break;
5013 case number_of_operands_mismatch:
5014 err_msg = _("number of operands mismatch");
5015 break;
5016 case invalid_instruction_suffix:
5017 err_msg = _("invalid instruction suffix");
5018 break;
5019 case bad_imm4:
5020 err_msg = _("constant doesn't fit in 4 bits");
5021 break;
5022 case unsupported_with_intel_mnemonic:
5023 err_msg = _("unsupported with Intel mnemonic");
5024 break;
5025 case unsupported_syntax:
5026 err_msg = _("unsupported syntax");
5027 break;
5028 case unsupported:
5029 as_bad (_("unsupported instruction `%s'"),
76d3f746 5030 pass1_mnem ? pass1_mnem : insn_name (current_templates->start));
04784e33 5031 return;
9db83a32
JB
5032 case unsupported_on_arch:
5033 as_bad (_("`%s' is not supported on `%s%s'"),
76d3f746 5034 pass1_mnem ? pass1_mnem : insn_name (current_templates->start),
9db83a32
JB
5035 cpu_arch_name ? cpu_arch_name : default_arch,
5036 cpu_sub_arch_name ? cpu_sub_arch_name : "");
5037 return;
5038 case unsupported_64bit:
5039 if (ISLOWER (mnem_suffix))
e8b4b7b2
NC
5040 {
5041 if (flag_code == CODE_64BIT)
5042 as_bad (_("`%s%c' is not supported in 64-bit mode"),
76d3f746 5043 pass1_mnem ? pass1_mnem : insn_name (current_templates->start),
e8b4b7b2
NC
5044 mnem_suffix);
5045 else
5046 as_bad (_("`%s%c' is only supported in 64-bit mode"),
76d3f746 5047 pass1_mnem ? pass1_mnem : insn_name (current_templates->start),
e8b4b7b2
NC
5048 mnem_suffix);
5049 }
9db83a32 5050 else
e8b4b7b2
NC
5051 {
5052 if (flag_code == CODE_64BIT)
5053 as_bad (_("`%s' is not supported in 64-bit mode"),
76d3f746 5054 pass1_mnem ? pass1_mnem : insn_name (current_templates->start));
e8b4b7b2
NC
5055 else
5056 as_bad (_("`%s' is only supported in 64-bit mode"),
76d3f746 5057 pass1_mnem ? pass1_mnem : insn_name (current_templates->start));
e8b4b7b2 5058 }
9db83a32 5059 return;
04784e33
JB
5060 case invalid_sib_address:
5061 err_msg = _("invalid SIB address");
5062 break;
5063 case invalid_vsib_address:
5064 err_msg = _("invalid VSIB address");
5065 break;
5066 case invalid_vector_register_set:
5067 err_msg = _("mask, index, and destination registers must be distinct");
5068 break;
5069 case invalid_tmm_register_set:
5070 err_msg = _("all tmm registers must be distinct");
5071 break;
5072 case invalid_dest_and_src_register_set:
5073 err_msg = _("destination and source registers must be distinct");
5074 break;
5075 case unsupported_vector_index_register:
5076 err_msg = _("unsupported vector index register");
5077 break;
5078 case unsupported_broadcast:
5079 err_msg = _("unsupported broadcast");
5080 break;
5081 case broadcast_needed:
5082 err_msg = _("broadcast is needed for operand of such type");
5083 break;
5084 case unsupported_masking:
5085 err_msg = _("unsupported masking");
5086 break;
5087 case mask_not_on_destination:
5088 err_msg = _("mask not on destination operand");
5089 break;
5090 case no_default_mask:
5091 err_msg = _("default mask isn't allowed");
5092 break;
5093 case unsupported_rc_sae:
5094 err_msg = _("unsupported static rounding/sae");
5095 break;
5096 case invalid_register_operand:
5097 err_msg = _("invalid register operand");
5098 break;
5099 }
5100 as_bad (_("%s for `%s'"), err_msg,
76d3f746 5101 pass1_mnem ? pass1_mnem : insn_name (current_templates->start));
04784e33
JB
5102 return;
5103 }
5104
5105 free (copy);
252b5132 5106
7bab8ab5 5107 if (sse_check != check_none
ffb86450
JB
5108 /* The opcode space check isn't strictly needed; it's there only to
5109 bypass the logic below when easily possible. */
ddb62495
JB
5110 && t->opcode_space >= SPACE_0F
5111 && t->opcode_space <= SPACE_0F3A
ffb86450
JB
5112 && !i.tm.cpu_flags.bitfield.cpusse4a
5113 && !is_any_vex_encoding (t))
daf50ae7 5114 {
ffb86450
JB
5115 bool simd = false;
5116
5117 for (j = 0; j < t->operands; ++j)
5118 {
5119 if (t->operand_types[j].bitfield.class == RegMMX)
5120 break;
5121 if (t->operand_types[j].bitfield.class == RegSIMD)
5122 simd = true;
5123 }
5124
5125 if (j >= t->operands && simd)
5126 (sse_check == check_warning
5127 ? as_warn
76d3f746 5128 : as_bad) (_("SSE instruction `%s' is used"), insn_name (&i.tm));
daf50ae7
L
5129 }
5130
40fb9820 5131 if (i.tm.opcode_modifier.fwait)
29b0f896
AM
5132 if (!add_prefix (FWAIT_OPCODE))
5133 return;
252b5132 5134
d5de92cf 5135 /* Check if REP prefix is OK. */
742732c7 5136 if (i.rep_prefix && i.tm.opcode_modifier.prefixok != PrefixRep)
d5de92cf
L
5137 {
5138 as_bad (_("invalid instruction `%s' after `%s'"),
76d3f746 5139 insn_name (&i.tm), i.rep_prefix);
d5de92cf
L
5140 return;
5141 }
5142
c1ba0266
L
5143 /* Check for lock without a lockable instruction. Destination operand
5144 must be memory unless it is xchg (0x86). */
9a4a4499
JB
5145 if (i.prefix[LOCK_PREFIX])
5146 {
5147 if (i.tm.opcode_modifier.prefixok < PrefixLock
c1ba0266
L
5148 || i.mem_operands == 0
5149 || (i.tm.base_opcode != 0x86
9a4a4499
JB
5150 && !(i.flags[i.operands - 1] & Operand_Mem)))
5151 {
5152 as_bad (_("expecting lockable instruction after `lock'"));
5153 return;
5154 }
5155
5156 /* Zap the redundant prefix from XCHG when optimizing. */
5157 if (i.tm.base_opcode == 0x86 && optimize && !i.no_optimize)
5158 i.prefix[LOCK_PREFIX] = 0;
c32fa91d
L
5159 }
5160
e3669c7f
JB
5161 if (is_any_vex_encoding (&i.tm)
5162 || i.tm.operand_types[i.imm_operands].bitfield.class >= RegMMX
5163 || i.tm.operand_types[i.imm_operands + 1].bitfield.class >= RegMMX)
7a8655d2 5164 {
e3669c7f
JB
5165 /* Check for data size prefix on VEX/XOP/EVEX encoded and SIMD insns. */
5166 if (i.prefix[DATA_PREFIX])
5167 {
76d3f746 5168 as_bad (_("data size prefix invalid with `%s'"), insn_name (&i.tm));
e3669c7f
JB
5169 return;
5170 }
5171
5172 /* Don't allow e.g. KMOV in TLS code sequences. */
5173 for (j = i.imm_operands; j < i.operands; ++j)
5174 switch (i.reloc[j])
5175 {
5176 case BFD_RELOC_386_TLS_GOTIE:
5177 case BFD_RELOC_386_TLS_LE_32:
5178 case BFD_RELOC_X86_64_GOTTPOFF:
5179 case BFD_RELOC_X86_64_TLSLD:
76d3f746 5180 as_bad (_("TLS relocation cannot be used with `%s'"), insn_name (&i.tm));
e3669c7f
JB
5181 return;
5182 default:
5183 break;
5184 }
7a8655d2
JB
5185 }
5186
42164a71 5187 /* Check if HLE prefix is OK. */
165de32a 5188 if (i.hle_prefix && !check_hle ())
42164a71
L
5189 return;
5190
7e8b059b
L
5191 /* Check BND prefix. */
5192 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
5193 as_bad (_("expecting valid branch instruction after `bnd'"));
5194
04ef582a 5195 /* Check NOTRACK prefix. */
742732c7 5196 if (i.notrack_prefix && i.tm.opcode_modifier.prefixok != PrefixNoTrack)
9fef80d6 5197 as_bad (_("expecting indirect branch instruction after `notrack'"));
04ef582a 5198
327e8c42
JB
5199 if (i.tm.cpu_flags.bitfield.cpumpx)
5200 {
5201 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
5202 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
5203 else if (flag_code != CODE_16BIT
5204 ? i.prefix[ADDR_PREFIX]
5205 : i.mem_operands && !i.prefix[ADDR_PREFIX])
5206 as_bad (_("16-bit address isn't allowed in MPX instructions"));
5207 }
7e8b059b
L
5208
5209 /* Insert BND prefix. */
76d3a78a
JB
5210 if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
5211 {
5212 if (!i.prefix[BND_PREFIX])
5213 add_prefix (BND_PREFIX_OPCODE);
5214 else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
5215 {
5216 as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
5217 i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
5218 }
5219 }
7e8b059b 5220
29b0f896 5221 /* Check string instruction segment overrides. */
51c8edf6 5222 if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
29b0f896 5223 {
51c8edf6 5224 gas_assert (i.mem_operands);
29b0f896 5225 if (!check_string ())
5dd0794d 5226 return;
fc0763e6 5227 i.disp_operands = 0;
29b0f896 5228 }
5dd0794d 5229
9373f275
L
5230 /* The memory operand of (%dx) should be only used with input/output
5231 instructions (base opcodes: 0x6c, 0x6e, 0xec, 0xee). */
5232 if (i.input_output_operand
5233 && ((i.tm.base_opcode | 0x82) != 0xee
ddb62495 5234 || i.tm.opcode_space != SPACE_BASE))
9373f275
L
5235 {
5236 as_bad (_("input/output port address isn't allowed with `%s'"),
76d3f746 5237 insn_name (&i.tm));
9373f275
L
5238 return;
5239 }
5240
b6f8c7c4
L
5241 if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
5242 optimize_encoding ();
5243
c8480b58
L
5244 if (use_unaligned_vector_move)
5245 encode_with_unaligned_vector_move ();
5246
29b0f896
AM
5247 if (!process_suffix ())
5248 return;
e413e4e9 5249
ef07be45
CL
5250 /* Check if IP-relative addressing requirements can be satisfied. */
5251 if (i.tm.cpu_flags.bitfield.cpuprefetchi
5252 && !(i.base_reg && i.base_reg->reg_num == RegIP))
76d3f746 5253 as_warn (_("'%s' only supports RIP-relative address"), insn_name (&i.tm));
ef07be45 5254
921eafea 5255 /* Update operand types and check extended states. */
bc0844ae 5256 for (j = 0; j < i.operands; j++)
921eafea
L
5257 {
5258 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
3d70986f 5259 switch (i.tm.operand_types[j].bitfield.class)
921eafea
L
5260 {
5261 default:
5262 break;
5263 case RegMMX:
5264 i.xstate |= xstate_mmx;
5265 break;
5266 case RegMask:
32930e4e 5267 i.xstate |= xstate_mask;
921eafea
L
5268 break;
5269 case RegSIMD:
3d70986f 5270 if (i.tm.operand_types[j].bitfield.tmmword)
921eafea 5271 i.xstate |= xstate_tmm;
3d70986f 5272 else if (i.tm.operand_types[j].bitfield.zmmword)
921eafea 5273 i.xstate |= xstate_zmm;
3d70986f 5274 else if (i.tm.operand_types[j].bitfield.ymmword)
921eafea 5275 i.xstate |= xstate_ymm;
3d70986f 5276 else if (i.tm.operand_types[j].bitfield.xmmword)
921eafea
L
5277 i.xstate |= xstate_xmm;
5278 break;
5279 }
5280 }
bc0844ae 5281
29b0f896
AM
5282 /* Make still unresolved immediate matches conform to size of immediate
5283 given in i.suffix. */
5284 if (!finalize_imm ())
5285 return;
252b5132 5286
40fb9820 5287 if (i.types[0].bitfield.imm1)
29b0f896 5288 i.imm_operands = 0; /* kludge for shift insns. */
252b5132 5289
29b0f896
AM
5290 /* For insns with operands there are more diddles to do to the opcode. */
5291 if (i.operands)
5292 {
5293 if (!process_operands ())
5294 return;
5295 }
255571cd 5296 else if (!quiet_warnings && i.tm.opcode_modifier.operandconstraint == UGH)
29b0f896
AM
5297 {
5298 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
76d3f746 5299 as_warn (_("translating to `%sp'"), insn_name (&i.tm));
29b0f896 5300 }
252b5132 5301
7a8655d2 5302 if (is_any_vex_encoding (&i.tm))
9e5e5283 5303 {
c1dc7af5 5304 if (!cpu_arch_flags.bitfield.cpui286)
9e5e5283 5305 {
c1dc7af5 5306 as_bad (_("instruction `%s' isn't supported outside of protected mode."),
76d3f746 5307 insn_name (&i.tm));
9e5e5283
L
5308 return;
5309 }
c0f3af97 5310
0b9404fd
JB
5311 /* Check for explicit REX prefix. */
5312 if (i.prefix[REX_PREFIX] || i.rex_encoding)
5313 {
76d3f746 5314 as_bad (_("REX prefix invalid with `%s'"), insn_name (&i.tm));
0b9404fd
JB
5315 return;
5316 }
5317
9e5e5283
L
5318 if (i.tm.opcode_modifier.vex)
5319 build_vex_prefix (t);
5320 else
5321 build_evex_prefix ();
0b9404fd
JB
5322
5323 /* The individual REX.RXBW bits got consumed. */
5324 i.rex &= REX_OPCODE;
9e5e5283 5325 }
43234a1e 5326
7fc69528
JB
5327 /* Handle conversion of 'int $3' --> special int3 insn. */
5328 if (i.tm.mnem_off == MN_int
a6461c02 5329 && i.op[0].imms->X_add_number == 3)
29b0f896
AM
5330 {
5331 i.tm.base_opcode = INT3_OPCODE;
5332 i.imm_operands = 0;
5333 }
252b5132 5334
0cfa3eb3
JB
5335 if ((i.tm.opcode_modifier.jump == JUMP
5336 || i.tm.opcode_modifier.jump == JUMP_BYTE
5337 || i.tm.opcode_modifier.jump == JUMP_DWORD)
29b0f896
AM
5338 && i.op[0].disps->X_op == O_constant)
5339 {
5340 /* Convert "jmp constant" (and "call constant") to a jump (call) to
5341 the absolute address given by the constant. Since ix86 jumps and
5342 calls are pc relative, we need to generate a reloc. */
5343 i.op[0].disps->X_add_symbol = &abs_symbol;
5344 i.op[0].disps->X_op = O_symbol;
5345 }
252b5132 5346
29b0f896
AM
5347 /* For 8 bit registers we need an empty rex prefix. Also if the
5348 instruction already has a prefix, we need to convert old
5349 registers to new ones. */
773f551c 5350
bab6aec1 5351 if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
29b0f896 5352 && (i.op[0].regs->reg_flags & RegRex64) != 0)
bab6aec1 5353 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
29b0f896 5354 && (i.op[1].regs->reg_flags & RegRex64) != 0)
bab6aec1
JB
5355 || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
5356 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
29b0f896
AM
5357 && i.rex != 0))
5358 {
5359 int x;
726c5dcd 5360
29b0f896
AM
5361 i.rex |= REX_OPCODE;
5362 for (x = 0; x < 2; x++)
5363 {
5364 /* Look for 8 bit operand that uses old registers. */
bab6aec1 5365 if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
29b0f896 5366 && (i.op[x].regs->reg_flags & RegRex64) == 0)
773f551c 5367 {
3f93af61 5368 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
29b0f896
AM
5369 /* In case it is "hi" register, give up. */
5370 if (i.op[x].regs->reg_num > 3)
a540244d 5371 as_bad (_("can't encode register '%s%s' in an "
4eed87de 5372 "instruction requiring REX prefix."),
a540244d 5373 register_prefix, i.op[x].regs->reg_name);
773f551c 5374
29b0f896
AM
5375 /* Otherwise it is equivalent to the extended register.
5376 Since the encoding doesn't change this is merely
5377 cosmetic cleanup for debug output. */
5378
5379 i.op[x].regs = i.op[x].regs + 8;
773f551c 5380 }
29b0f896
AM
5381 }
5382 }
773f551c 5383
6b6b6807
L
5384 if (i.rex == 0 && i.rex_encoding)
5385 {
5386 /* Check if we can add a REX_OPCODE byte. Look for 8 bit operand
3f93af61 5387 that uses legacy register. If it is "hi" register, don't add
6b6b6807
L
5388 the REX_OPCODE byte. */
5389 int x;
5390 for (x = 0; x < 2; x++)
bab6aec1 5391 if (i.types[x].bitfield.class == Reg
6b6b6807
L
5392 && i.types[x].bitfield.byte
5393 && (i.op[x].regs->reg_flags & RegRex64) == 0
5394 && i.op[x].regs->reg_num > 3)
5395 {
3f93af61 5396 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
5b7c81bd 5397 i.rex_encoding = false;
6b6b6807
L
5398 break;
5399 }
5400
5401 if (i.rex_encoding)
5402 i.rex = REX_OPCODE;
5403 }
5404
7ab9ffdd 5405 if (i.rex != 0)
29b0f896
AM
5406 add_prefix (REX_OPCODE | i.rex);
5407
ae531041
L
5408 insert_lfence_before ();
5409
29b0f896
AM
5410 /* We are ready to output the insn. */
5411 output_insn ();
e379e5f3 5412
ae531041
L
5413 insert_lfence_after ();
5414
e379e5f3
L
5415 last_insn.seg = now_seg;
5416
5417 if (i.tm.opcode_modifier.isprefix)
5418 {
5419 last_insn.kind = last_insn_prefix;
76d3f746 5420 last_insn.name = insn_name (&i.tm);
e379e5f3
L
5421 last_insn.file = as_where (&last_insn.line);
5422 }
5423 else
5424 last_insn.kind = last_insn_other;
29b0f896
AM
5425}
5426
9db83a32
JB
5427/* The Q suffix is generally valid only in 64-bit mode, with very few
5428 exceptions: fild, fistp, fisttp, and cmpxchg8b. Note that for fild
5429 and fisttp only one of their two templates is matched below: That's
5430 sufficient since other relevant attributes are the same between both
5431 respective templates. */
5432static INLINE bool q_suffix_allowed(const insn_template *t)
5433{
5434 return flag_code == CODE_64BIT
ddb62495 5435 || (t->opcode_space == SPACE_BASE
9db83a32
JB
5436 && t->base_opcode == 0xdf
5437 && (t->extension_opcode & 1)) /* fild / fistp / fisttp */
7fc69528 5438 || t->mnem_off == MN_cmpxchg8b;
9db83a32
JB
5439}
5440
5317ad2c
JB
5441static const char *
5442parse_insn (const char *line, char *mnemonic)
29b0f896 5443{
5317ad2c 5444 const char *l = line, *token_start = l;
29b0f896 5445 char *mnem_p;
04784e33 5446 bool pass1 = !current_templates;
5c6af06e 5447 int supported;
d3ce72d0 5448 const insn_template *t;
b6169b20 5449 char *dot_p = NULL;
29b0f896 5450
29b0f896
AM
5451 while (1)
5452 {
5453 mnem_p = mnemonic;
5454 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
5455 {
b6169b20
L
5456 if (*mnem_p == '.')
5457 dot_p = mnem_p;
29b0f896
AM
5458 mnem_p++;
5459 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
45288df1 5460 {
29b0f896
AM
5461 as_bad (_("no such instruction: `%s'"), token_start);
5462 return NULL;
5463 }
5464 l++;
5465 }
5466 if (!is_space_char (*l)
5467 && *l != END_OF_INSN
e44823cf
JB
5468 && (intel_syntax
5469 || (*l != PREFIX_SEPARATOR
5470 && *l != ',')))
29b0f896
AM
5471 {
5472 as_bad (_("invalid character %s in mnemonic"),
5473 output_invalid (*l));
5474 return NULL;
5475 }
5476 if (token_start == l)
5477 {
e44823cf 5478 if (!intel_syntax && *l == PREFIX_SEPARATOR)
29b0f896
AM
5479 as_bad (_("expecting prefix; got nothing"));
5480 else
5481 as_bad (_("expecting mnemonic; got nothing"));
5482 return NULL;
5483 }
45288df1 5484
29b0f896 5485 /* Look up instruction (or prefix) via hash table. */
629310ab 5486 current_templates = (const templates *) str_hash_find (op_hash, mnemonic);
47926f60 5487
29b0f896
AM
5488 if (*l != END_OF_INSN
5489 && (!is_space_char (*l) || l[1] != END_OF_INSN)
5490 && current_templates
40fb9820 5491 && current_templates->start->opcode_modifier.isprefix)
29b0f896 5492 {
c6fb90c8 5493 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
2dd88dca
JB
5494 {
5495 as_bad ((flag_code != CODE_64BIT
5496 ? _("`%s' is only supported in 64-bit mode")
5497 : _("`%s' is not supported in 64-bit mode")),
76d3f746 5498 insn_name (current_templates->start));
2dd88dca
JB
5499 return NULL;
5500 }
29b0f896
AM
5501 /* If we are in 16-bit mode, do not allow addr16 or data16.
5502 Similarly, in 32-bit mode, do not allow addr32 or data32. */
673fe0f0
JB
5503 if ((current_templates->start->opcode_modifier.size == SIZE16
5504 || current_templates->start->opcode_modifier.size == SIZE32)
29b0f896 5505 && flag_code != CODE_64BIT
673fe0f0 5506 && ((current_templates->start->opcode_modifier.size == SIZE32)
29b0f896
AM
5507 ^ (flag_code == CODE_16BIT)))
5508 {
5509 as_bad (_("redundant %s prefix"),
76d3f746 5510 insn_name (current_templates->start));
29b0f896 5511 return NULL;
45288df1 5512 }
31184569
JB
5513
5514 if (current_templates->start->base_opcode == PSEUDO_PREFIX)
29b0f896 5515 {
86fa6981 5516 /* Handle pseudo prefixes. */
31184569 5517 switch (current_templates->start->extension_opcode)
86fa6981 5518 {
41eb8e88 5519 case Prefix_Disp8:
86fa6981
L
5520 /* {disp8} */
5521 i.disp_encoding = disp_encoding_8bit;
5522 break;
41eb8e88
L
5523 case Prefix_Disp16:
5524 /* {disp16} */
5525 i.disp_encoding = disp_encoding_16bit;
5526 break;
5527 case Prefix_Disp32:
86fa6981
L
5528 /* {disp32} */
5529 i.disp_encoding = disp_encoding_32bit;
5530 break;
41eb8e88 5531 case Prefix_Load:
86fa6981
L
5532 /* {load} */
5533 i.dir_encoding = dir_encoding_load;
5534 break;
41eb8e88 5535 case Prefix_Store:
86fa6981
L
5536 /* {store} */
5537 i.dir_encoding = dir_encoding_store;
5538 break;
41eb8e88 5539 case Prefix_VEX:
42e04b36
L
5540 /* {vex} */
5541 i.vec_encoding = vex_encoding_vex;
86fa6981 5542 break;
41eb8e88 5543 case Prefix_VEX3:
86fa6981
L
5544 /* {vex3} */
5545 i.vec_encoding = vex_encoding_vex3;
5546 break;
41eb8e88 5547 case Prefix_EVEX:
86fa6981
L
5548 /* {evex} */
5549 i.vec_encoding = vex_encoding_evex;
5550 break;
41eb8e88 5551 case Prefix_REX:
6b6b6807 5552 /* {rex} */
5b7c81bd 5553 i.rex_encoding = true;
6b6b6807 5554 break;
41eb8e88 5555 case Prefix_NoOptimize:
b6f8c7c4 5556 /* {nooptimize} */
5b7c81bd 5557 i.no_optimize = true;
b6f8c7c4 5558 break;
86fa6981
L
5559 default:
5560 abort ();
5561 }
5562 }
5563 else
5564 {
5565 /* Add prefix, checking for repeated prefixes. */
4e9ac44a 5566 switch (add_prefix (current_templates->start->base_opcode))
86fa6981 5567 {
4e9ac44a
L
5568 case PREFIX_EXIST:
5569 return NULL;
5570 case PREFIX_DS:
d777820b 5571 if (current_templates->start->cpu_flags.bitfield.cpuibt)
76d3f746 5572 i.notrack_prefix = insn_name (current_templates->start);
4e9ac44a
L
5573 break;
5574 case PREFIX_REP:
5575 if (current_templates->start->cpu_flags.bitfield.cpuhle)
76d3f746 5576 i.hle_prefix = insn_name (current_templates->start);
4e9ac44a 5577 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
76d3f746 5578 i.bnd_prefix = insn_name (current_templates->start);
4e9ac44a 5579 else
76d3f746 5580 i.rep_prefix = insn_name (current_templates->start);
4e9ac44a
L
5581 break;
5582 default:
5583 break;
86fa6981 5584 }
29b0f896
AM
5585 }
5586 /* Skip past PREFIX_SEPARATOR and reset token_start. */
5587 token_start = ++l;
5588 }
5589 else
5590 break;
5591 }
45288df1 5592
30a55f88 5593 if (!current_templates)
b6169b20 5594 {
07d5e953
JB
5595 /* Deprecated functionality (new code should use pseudo-prefixes instead):
5596 Check if we should swap operand or force 32bit displacement in
f8a5c266 5597 encoding. */
30a55f88 5598 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
64c49ab3 5599 i.dir_encoding = dir_encoding_swap;
8d63c93e 5600 else if (mnem_p - 3 == dot_p
a501d77e
L
5601 && dot_p[1] == 'd'
5602 && dot_p[2] == '8')
5603 i.disp_encoding = disp_encoding_8bit;
8d63c93e 5604 else if (mnem_p - 4 == dot_p
f8a5c266
L
5605 && dot_p[1] == 'd'
5606 && dot_p[2] == '3'
5607 && dot_p[3] == '2')
a501d77e 5608 i.disp_encoding = disp_encoding_32bit;
30a55f88
L
5609 else
5610 goto check_suffix;
5611 mnem_p = dot_p;
5612 *dot_p = '\0';
629310ab 5613 current_templates = (const templates *) str_hash_find (op_hash, mnemonic);
b6169b20
L
5614 }
5615
04784e33 5616 if (!current_templates || !pass1)
29b0f896 5617 {
04784e33
JB
5618 current_templates = NULL;
5619
dc1e8a47 5620 check_suffix:
1c529385 5621 if (mnem_p > mnemonic)
29b0f896 5622 {
1c529385
LH
5623 /* See if we can get a match by trimming off a suffix. */
5624 switch (mnem_p[-1])
29b0f896 5625 {
1c529385
LH
5626 case WORD_MNEM_SUFFIX:
5627 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
29b0f896
AM
5628 i.suffix = SHORT_MNEM_SUFFIX;
5629 else
1c529385
LH
5630 /* Fall through. */
5631 case BYTE_MNEM_SUFFIX:
5632 case QWORD_MNEM_SUFFIX:
5633 i.suffix = mnem_p[-1];
29b0f896 5634 mnem_p[-1] = '\0';
fe0e921f
AM
5635 current_templates
5636 = (const templates *) str_hash_find (op_hash, mnemonic);
1c529385
LH
5637 break;
5638 case SHORT_MNEM_SUFFIX:
5639 case LONG_MNEM_SUFFIX:
5640 if (!intel_syntax)
5641 {
5642 i.suffix = mnem_p[-1];
5643 mnem_p[-1] = '\0';
fe0e921f
AM
5644 current_templates
5645 = (const templates *) str_hash_find (op_hash, mnemonic);
1c529385
LH
5646 }
5647 break;
5648
5649 /* Intel Syntax. */
5650 case 'd':
5651 if (intel_syntax)
5652 {
5653 if (intel_float_operand (mnemonic) == 1)
5654 i.suffix = SHORT_MNEM_SUFFIX;
5655 else
5656 i.suffix = LONG_MNEM_SUFFIX;
5657 mnem_p[-1] = '\0';
fe0e921f
AM
5658 current_templates
5659 = (const templates *) str_hash_find (op_hash, mnemonic);
1c529385 5660 }
04784e33
JB
5661 /* For compatibility reasons accept MOVSD and CMPSD without
5662 operands even in AT&T mode. */
5663 else if (*l == END_OF_INSN
5664 || (is_space_char (*l) && l[1] == END_OF_INSN))
5665 {
5666 mnem_p[-1] = '\0';
5667 current_templates
5668 = (const templates *) str_hash_find (op_hash, mnemonic);
5669 if (current_templates != NULL
5670 /* MOVS or CMPS */
5671 && (current_templates->start->base_opcode | 2) == 0xa6
ddb62495 5672 && current_templates->start->opcode_space
04784e33
JB
5673 == SPACE_BASE
5674 && mnem_p[-2] == 's')
5675 {
5676 as_warn (_("found `%sd'; assuming `%sl' was meant"),
5677 mnemonic, mnemonic);
5678 i.suffix = LONG_MNEM_SUFFIX;
5679 }
5680 else
5681 {
5682 current_templates = NULL;
5683 mnem_p[-1] = 'd';
5684 }
5685 }
1c529385 5686 break;
29b0f896 5687 }
29b0f896 5688 }
1c529385 5689
29b0f896
AM
5690 if (!current_templates)
5691 {
04784e33
JB
5692 if (pass1)
5693 as_bad (_("no such instruction: `%s'"), token_start);
29b0f896
AM
5694 return NULL;
5695 }
5696 }
252b5132 5697
0cfa3eb3
JB
5698 if (current_templates->start->opcode_modifier.jump == JUMP
5699 || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
29b0f896
AM
5700 {
5701 /* Check for a branch hint. We allow ",pt" and ",pn" for
5702 predict taken and predict not taken respectively.
5703 I'm not sure that branch hints actually do anything on loop
5704 and jcxz insns (JumpByte) for current Pentium4 chips. They
5705 may work in the future and it doesn't hurt to accept them
5706 now. */
5707 if (l[0] == ',' && l[1] == 'p')
5708 {
5709 if (l[2] == 't')
5710 {
5711 if (!add_prefix (DS_PREFIX_OPCODE))
5712 return NULL;
5713 l += 3;
5714 }
5715 else if (l[2] == 'n')
5716 {
5717 if (!add_prefix (CS_PREFIX_OPCODE))
5718 return NULL;
5719 l += 3;
5720 }
5721 }
5722 }
5723 /* Any other comma loses. */
5724 if (*l == ',')
5725 {
5726 as_bad (_("invalid character %s in mnemonic"),
5727 output_invalid (*l));
5728 return NULL;
5729 }
252b5132 5730
29b0f896 5731 /* Check if instruction is supported on specified architecture. */
5c6af06e
JB
5732 supported = 0;
5733 for (t = current_templates->start; t < current_templates->end; ++t)
5734 {
c0f3af97 5735 supported |= cpu_flags_match (t);
9db83a32
JB
5736
5737 if (i.suffix == QWORD_MNEM_SUFFIX && !q_suffix_allowed (t))
5738 supported &= ~CPU_FLAGS_64BIT_MATCH;
5739
c0f3af97 5740 if (supported == CPU_FLAGS_PERFECT_MATCH)
d59a54c2 5741 return l;
29b0f896 5742 }
3629bb00 5743
9db83a32
JB
5744 if (pass1)
5745 {
5746 if (supported & CPU_FLAGS_64BIT_MATCH)
5747 i.error = unsupported_on_arch;
5748 else
5749 i.error = unsupported_64bit;
5750 }
252b5132 5751
548d0ee6 5752 return NULL;
29b0f896 5753}
252b5132 5754
29b0f896 5755static char *
e3bb37b5 5756parse_operands (char *l, const char *mnemonic)
29b0f896
AM
5757{
5758 char *token_start;
3138f287 5759
29b0f896
AM
5760 /* 1 if operand is pending after ','. */
5761 unsigned int expecting_operand = 0;
252b5132 5762
29b0f896
AM
5763 while (*l != END_OF_INSN)
5764 {
e68c3d59
JB
5765 /* Non-zero if operand parens not balanced. */
5766 unsigned int paren_not_balanced = 0;
5767 /* True if inside double quotes. */
5768 bool in_quotes = false;
5769
29b0f896
AM
5770 /* Skip optional white space before operand. */
5771 if (is_space_char (*l))
5772 ++l;
d02603dc 5773 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
29b0f896
AM
5774 {
5775 as_bad (_("invalid character %s before operand %d"),
5776 output_invalid (*l),
5777 i.operands + 1);
5778 return NULL;
5779 }
d02603dc 5780 token_start = l; /* After white space. */
e68c3d59 5781 while (in_quotes || paren_not_balanced || *l != ',')
29b0f896
AM
5782 {
5783 if (*l == END_OF_INSN)
5784 {
e68c3d59
JB
5785 if (in_quotes)
5786 {
5787 as_bad (_("unbalanced double quotes in operand %d."),
5788 i.operands + 1);
5789 return NULL;
5790 }
29b0f896
AM
5791 if (paren_not_balanced)
5792 {
98ff9f1c
JB
5793 know (!intel_syntax);
5794 as_bad (_("unbalanced parenthesis in operand %d."),
5795 i.operands + 1);
29b0f896
AM
5796 return NULL;
5797 }
5798 else
5799 break; /* we are done */
5800 }
e68c3d59
JB
5801 else if (*l == '\\' && l[1] == '"')
5802 ++l;
5803 else if (*l == '"')
5804 in_quotes = !in_quotes;
5805 else if (!in_quotes && !is_operand_char (*l) && !is_space_char (*l))
29b0f896
AM
5806 {
5807 as_bad (_("invalid character %s in operand %d"),
5808 output_invalid (*l),
5809 i.operands + 1);
5810 return NULL;
5811 }
e68c3d59 5812 if (!intel_syntax && !in_quotes)
29b0f896
AM
5813 {
5814 if (*l == '(')
5815 ++paren_not_balanced;
5816 if (*l == ')')
5817 --paren_not_balanced;
5818 }
29b0f896
AM
5819 l++;
5820 }
5821 if (l != token_start)
5822 { /* Yes, we've read in another operand. */
5823 unsigned int operand_ok;
5824 this_operand = i.operands++;
5825 if (i.operands > MAX_OPERANDS)
5826 {
5827 as_bad (_("spurious operands; (%d operands/instruction max)"),
5828 MAX_OPERANDS);
5829 return NULL;
5830 }
9d46ce34 5831 i.types[this_operand].bitfield.unspecified = 1;
29b0f896
AM
5832 /* Now parse operand adding info to 'i' as we go along. */
5833 END_STRING_AND_SAVE (l);
5834
1286ab78
L
5835 if (i.mem_operands > 1)
5836 {
5837 as_bad (_("too many memory references for `%s'"),
5838 mnemonic);
5839 return 0;
5840 }
5841
29b0f896
AM
5842 if (intel_syntax)
5843 operand_ok =
5844 i386_intel_operand (token_start,
5845 intel_float_operand (mnemonic));
5846 else
a7619375 5847 operand_ok = i386_att_operand (token_start);
29b0f896
AM
5848
5849 RESTORE_END_STRING (l);
5850 if (!operand_ok)
5851 return NULL;
5852 }
5853 else
5854 {
5855 if (expecting_operand)
5856 {
5857 expecting_operand_after_comma:
5858 as_bad (_("expecting operand after ','; got nothing"));
5859 return NULL;
5860 }
5861 if (*l == ',')
5862 {
5863 as_bad (_("expecting operand before ','; got nothing"));
5864 return NULL;
5865 }
5866 }
7f3f1ea2 5867
29b0f896
AM
5868 /* Now *l must be either ',' or END_OF_INSN. */
5869 if (*l == ',')
5870 {
5871 if (*++l == END_OF_INSN)
5872 {
5873 /* Just skip it, if it's \n complain. */
5874 goto expecting_operand_after_comma;
5875 }
5876 expecting_operand = 1;
5877 }
5878 }
5879 return l;
5880}
7f3f1ea2 5881
050dfa73 5882static void
783c187b 5883swap_2_operands (unsigned int xchg1, unsigned int xchg2)
050dfa73
MM
5884{
5885 union i386_op temp_op;
40fb9820 5886 i386_operand_type temp_type;
c48dadc9 5887 unsigned int temp_flags;
050dfa73 5888 enum bfd_reloc_code_real temp_reloc;
4eed87de 5889
050dfa73
MM
5890 temp_type = i.types[xchg2];
5891 i.types[xchg2] = i.types[xchg1];
5892 i.types[xchg1] = temp_type;
c48dadc9
JB
5893
5894 temp_flags = i.flags[xchg2];
5895 i.flags[xchg2] = i.flags[xchg1];
5896 i.flags[xchg1] = temp_flags;
5897
050dfa73
MM
5898 temp_op = i.op[xchg2];
5899 i.op[xchg2] = i.op[xchg1];
5900 i.op[xchg1] = temp_op;
c48dadc9 5901
050dfa73
MM
5902 temp_reloc = i.reloc[xchg2];
5903 i.reloc[xchg2] = i.reloc[xchg1];
5904 i.reloc[xchg1] = temp_reloc;
43234a1e 5905
6225c532 5906 if (i.mask.reg)
43234a1e 5907 {
6225c532
JB
5908 if (i.mask.operand == xchg1)
5909 i.mask.operand = xchg2;
5910 else if (i.mask.operand == xchg2)
5911 i.mask.operand = xchg1;
43234a1e 5912 }
a5748e0d 5913 if (i.broadcast.type || i.broadcast.bytes)
43234a1e 5914 {
5273a3cd
JB
5915 if (i.broadcast.operand == xchg1)
5916 i.broadcast.operand = xchg2;
5917 else if (i.broadcast.operand == xchg2)
5918 i.broadcast.operand = xchg1;
43234a1e 5919 }
050dfa73
MM
5920}
5921
29b0f896 5922static void
e3bb37b5 5923swap_operands (void)
29b0f896 5924{
b7c61d9a 5925 switch (i.operands)
050dfa73 5926 {
c0f3af97 5927 case 5:
b7c61d9a 5928 case 4:
4d456e3d 5929 swap_2_operands (1, i.operands - 2);
1a0670f3 5930 /* Fall through. */
b7c61d9a
L
5931 case 3:
5932 case 2:
4d456e3d 5933 swap_2_operands (0, i.operands - 1);
b7c61d9a
L
5934 break;
5935 default:
5936 abort ();
29b0f896 5937 }
29b0f896
AM
5938
5939 if (i.mem_operands == 2)
5940 {
5e042380 5941 const reg_entry *temp_seg;
29b0f896
AM
5942 temp_seg = i.seg[0];
5943 i.seg[0] = i.seg[1];
5944 i.seg[1] = temp_seg;
5945 }
5946}
252b5132 5947
29b0f896
AM
5948/* Try to ensure constant immediates are represented in the smallest
5949 opcode possible. */
5950static void
e3bb37b5 5951optimize_imm (void)
29b0f896
AM
5952{
5953 char guess_suffix = 0;
5954 int op;
252b5132 5955
29b0f896
AM
5956 if (i.suffix)
5957 guess_suffix = i.suffix;
5958 else if (i.reg_operands)
5959 {
5960 /* Figure out a suffix from the last register operand specified.
75e5731b
JB
5961 We can't do this properly yet, i.e. excluding special register
5962 instances, but the following works for instructions with
5963 immediates. In any case, we can't set i.suffix yet. */
29b0f896 5964 for (op = i.operands; --op >= 0;)
bab6aec1
JB
5965 if (i.types[op].bitfield.class != Reg)
5966 continue;
5967 else if (i.types[op].bitfield.byte)
7ab9ffdd 5968 {
40fb9820
L
5969 guess_suffix = BYTE_MNEM_SUFFIX;
5970 break;
5971 }
bab6aec1 5972 else if (i.types[op].bitfield.word)
252b5132 5973 {
40fb9820
L
5974 guess_suffix = WORD_MNEM_SUFFIX;
5975 break;
5976 }
bab6aec1 5977 else if (i.types[op].bitfield.dword)
40fb9820
L
5978 {
5979 guess_suffix = LONG_MNEM_SUFFIX;
5980 break;
5981 }
bab6aec1 5982 else if (i.types[op].bitfield.qword)
40fb9820
L
5983 {
5984 guess_suffix = QWORD_MNEM_SUFFIX;
29b0f896 5985 break;
252b5132 5986 }
29b0f896
AM
5987 }
5988 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5989 guess_suffix = WORD_MNEM_SUFFIX;
5990
5991 for (op = i.operands; --op >= 0;)
40fb9820 5992 if (operand_type_check (i.types[op], imm))
29b0f896
AM
5993 {
5994 switch (i.op[op].imms->X_op)
252b5132 5995 {
29b0f896
AM
5996 case O_constant:
5997 /* If a suffix is given, this operand may be shortened. */
5998 switch (guess_suffix)
252b5132 5999 {
29b0f896 6000 case LONG_MNEM_SUFFIX:
40fb9820
L
6001 i.types[op].bitfield.imm32 = 1;
6002 i.types[op].bitfield.imm64 = 1;
29b0f896
AM
6003 break;
6004 case WORD_MNEM_SUFFIX:
40fb9820
L
6005 i.types[op].bitfield.imm16 = 1;
6006 i.types[op].bitfield.imm32 = 1;
6007 i.types[op].bitfield.imm32s = 1;
6008 i.types[op].bitfield.imm64 = 1;
29b0f896
AM
6009 break;
6010 case BYTE_MNEM_SUFFIX:
40fb9820
L
6011 i.types[op].bitfield.imm8 = 1;
6012 i.types[op].bitfield.imm8s = 1;
6013 i.types[op].bitfield.imm16 = 1;
6014 i.types[op].bitfield.imm32 = 1;
6015 i.types[op].bitfield.imm32s = 1;
6016 i.types[op].bitfield.imm64 = 1;
29b0f896 6017 break;
252b5132 6018 }
252b5132 6019
29b0f896
AM
6020 /* If this operand is at most 16 bits, convert it
6021 to a signed 16 bit number before trying to see
6022 whether it will fit in an even smaller size.
6023 This allows a 16-bit operand such as $0xffe0 to
6024 be recognised as within Imm8S range. */
40fb9820 6025 if ((i.types[op].bitfield.imm16)
7e96fb68 6026 && fits_in_unsigned_word (i.op[op].imms->X_add_number))
252b5132 6027 {
87ed972d
JB
6028 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
6029 ^ 0x8000) - 0x8000);
29b0f896 6030 }
a28def75
L
6031#ifdef BFD64
6032 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
40fb9820 6033 if ((i.types[op].bitfield.imm32)
7e96fb68 6034 && fits_in_unsigned_long (i.op[op].imms->X_add_number))
29b0f896
AM
6035 {
6036 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
6037 ^ ((offsetT) 1 << 31))
6038 - ((offsetT) 1 << 31));
6039 }
a28def75 6040#endif
40fb9820 6041 i.types[op]
c6fb90c8
L
6042 = operand_type_or (i.types[op],
6043 smallest_imm_type (i.op[op].imms->X_add_number));
252b5132 6044
29b0f896
AM
6045 /* We must avoid matching of Imm32 templates when 64bit
6046 only immediate is available. */
6047 if (guess_suffix == QWORD_MNEM_SUFFIX)
40fb9820 6048 i.types[op].bitfield.imm32 = 0;
29b0f896 6049 break;
252b5132 6050
29b0f896
AM
6051 case O_absent:
6052 case O_register:
6053 abort ();
6054
6055 /* Symbols and expressions. */
6056 default:
9cd96992
JB
6057 /* Convert symbolic operand to proper sizes for matching, but don't
6058 prevent matching a set of insns that only supports sizes other
6059 than those matching the insn suffix. */
6060 {
40fb9820 6061 i386_operand_type mask, allowed;
87ed972d 6062 const insn_template *t = current_templates->start;
9cd96992 6063
0dfbf9d7 6064 operand_type_set (&mask, 0);
9cd96992
JB
6065 switch (guess_suffix)
6066 {
6067 case QWORD_MNEM_SUFFIX:
40fb9820
L
6068 mask.bitfield.imm64 = 1;
6069 mask.bitfield.imm32s = 1;
9cd96992
JB
6070 break;
6071 case LONG_MNEM_SUFFIX:
40fb9820 6072 mask.bitfield.imm32 = 1;
9cd96992
JB
6073 break;
6074 case WORD_MNEM_SUFFIX:
40fb9820 6075 mask.bitfield.imm16 = 1;
9cd96992
JB
6076 break;
6077 case BYTE_MNEM_SUFFIX:
40fb9820 6078 mask.bitfield.imm8 = 1;
9cd96992
JB
6079 break;
6080 default:
9cd96992
JB
6081 break;
6082 }
8f0212ac
JB
6083
6084 allowed = operand_type_and (t->operand_types[op], mask);
6085 while (++t < current_templates->end)
6086 {
6087 allowed = operand_type_or (allowed, t->operand_types[op]);
6088 allowed = operand_type_and (allowed, mask);
6089 }
6090
0dfbf9d7 6091 if (!operand_type_all_zero (&allowed))
c6fb90c8 6092 i.types[op] = operand_type_and (i.types[op], mask);
9cd96992 6093 }
29b0f896 6094 break;
252b5132 6095 }
29b0f896
AM
6096 }
6097}
47926f60 6098
29b0f896 6099/* Try to use the smallest displacement type too. */
0de704b9
JB
6100static bool
6101optimize_disp (const insn_template *t)
29b0f896 6102{
0de704b9 6103 unsigned int op;
3e73aa7c 6104
0de704b9
JB
6105 if (!want_disp32 (t)
6106 && (!t->opcode_modifier.jump
6107 || i.jumpabsolute || i.types[0].bitfield.baseindex))
6108 {
6109 for (op = 0; op < i.operands; ++op)
6110 {
6111 const expressionS *exp = i.op[op].disps;
6112
6113 if (!operand_type_check (i.types[op], disp))
6114 continue;
6115
6116 if (exp->X_op != O_constant)
6117 continue;
6118
6119 /* Since displacement is signed extended to 64bit, don't allow
6120 disp32 if it is out of range. */
6121 if (fits_in_signed_long (exp->X_add_number))
6122 continue;
6123
6124 i.types[op].bitfield.disp32 = 0;
6125 if (i.types[op].bitfield.baseindex)
6126 {
6127 as_bad (_("0x%" PRIx64 " out of range of signed 32bit displacement"),
6128 (uint64_t) exp->X_add_number);
6129 return false;
6130 }
6131 }
6132 }
6133
6134 /* Don't optimize displacement for movabs since it only takes 64bit
6135 displacement. */
6136 if (i.disp_encoding > disp_encoding_8bit
6137 || (flag_code == CODE_64BIT && t->mnem_off == MN_movabs))
6138 return true;
6139
6140 for (op = i.operands; op-- > 0;)
40fb9820 6141 if (operand_type_check (i.types[op], disp))
252b5132 6142 {
b300c311 6143 if (i.op[op].disps->X_op == O_constant)
252b5132 6144 {
91d6fa6a 6145 offsetT op_disp = i.op[op].disps->X_add_number;
29b0f896 6146
91d6fa6a 6147 if (!op_disp && i.types[op].bitfield.baseindex)
b300c311 6148 {
2f2be86b
JB
6149 i.types[op] = operand_type_and_not (i.types[op], anydisp);
6150 i.op[op].disps = NULL;
b300c311 6151 i.disp_operands--;
f185acdd
JB
6152 continue;
6153 }
6154
6155 if (i.types[op].bitfield.disp16
cd613c1f 6156 && fits_in_unsigned_word (op_disp))
f185acdd
JB
6157 {
6158 /* If this operand is at most 16 bits, convert
6159 to a signed 16 bit number and don't use 64bit
6160 displacement. */
6161 op_disp = ((op_disp ^ 0x8000) - 0x8000);
6162 i.types[op].bitfield.disp64 = 0;
b300c311 6163 }
f185acdd 6164
28a167a4 6165#ifdef BFD64
a50187b2 6166 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
a775efc8
JB
6167 if ((flag_code != CODE_64BIT
6168 ? i.types[op].bitfield.disp32
0de704b9
JB
6169 : want_disp32 (t)
6170 && (!t->opcode_modifier.jump
a775efc8 6171 || i.jumpabsolute || i.types[op].bitfield.baseindex))
a50187b2 6172 && fits_in_unsigned_long (op_disp))
b300c311 6173 {
a50187b2
JB
6174 /* If this operand is at most 32 bits, convert
6175 to a signed 32 bit number and don't use 64bit
6176 displacement. */
6177 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
6178 i.types[op].bitfield.disp64 = 0;
6179 i.types[op].bitfield.disp32 = 1;
6180 }
28a167a4 6181
a50187b2
JB
6182 if (flag_code == CODE_64BIT && fits_in_signed_long (op_disp))
6183 {
6184 i.types[op].bitfield.disp64 = 0;
a775efc8 6185 i.types[op].bitfield.disp32 = 1;
b300c311 6186 }
28a167a4 6187#endif
40fb9820 6188 if ((i.types[op].bitfield.disp32
40fb9820 6189 || i.types[op].bitfield.disp16)
b5014f7a 6190 && fits_in_disp8 (op_disp))
40fb9820 6191 i.types[op].bitfield.disp8 = 1;
77c59789
JB
6192
6193 i.op[op].disps->X_add_number = op_disp;
252b5132 6194 }
67a4f2b7
AO
6195 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
6196 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
6197 {
6198 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
6199 i.op[op].disps, 0, i.reloc[op]);
2f2be86b 6200 i.types[op] = operand_type_and_not (i.types[op], anydisp);
67a4f2b7
AO
6201 }
6202 else
b300c311 6203 /* We only support 64bit displacement on constants. */
40fb9820 6204 i.types[op].bitfield.disp64 = 0;
252b5132 6205 }
0de704b9
JB
6206
6207 return true;
29b0f896
AM
6208}
6209
4a1b91ea
L
6210/* Return 1 if there is a match in broadcast bytes between operand
6211 GIVEN and instruction template T. */
6212
6213static INLINE int
6214match_broadcast_size (const insn_template *t, unsigned int given)
6215{
6216 return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
6217 && i.types[given].bitfield.byte)
6218 || (t->opcode_modifier.broadcast == WORD_BROADCAST
6219 && i.types[given].bitfield.word)
6220 || (t->opcode_modifier.broadcast == DWORD_BROADCAST
6221 && i.types[given].bitfield.dword)
6222 || (t->opcode_modifier.broadcast == QWORD_BROADCAST
6223 && i.types[given].bitfield.qword));
6224}
6225
6c30d220
L
6226/* Check if operands are valid for the instruction. */
6227
6228static int
6229check_VecOperands (const insn_template *t)
6230{
43234a1e 6231 unsigned int op;
e2195274 6232 i386_cpu_flags cpu;
e2195274
JB
6233
6234 /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
6235 any one operand are implicity requiring AVX512VL support if the actual
6236 operand size is YMMword or XMMword. Since this function runs after
6237 template matching, there's no need to check for YMMword/XMMword in
6238 the template. */
6239 cpu = cpu_flags_and (t->cpu_flags, avx512);
6240 if (!cpu_flags_all_zero (&cpu)
6241 && !t->cpu_flags.bitfield.cpuavx512vl
6242 && !cpu_arch_flags.bitfield.cpuavx512vl)
6243 {
6244 for (op = 0; op < t->operands; ++op)
6245 {
6246 if (t->operand_types[op].bitfield.zmmword
6247 && (i.types[op].bitfield.ymmword
6248 || i.types[op].bitfield.xmmword))
6249 {
6250 i.error = unsupported;
6251 return 1;
6252 }
6253 }
6254 }
43234a1e 6255
22c36940
JB
6256 /* Somewhat similarly, templates specifying both AVX and AVX2 are
6257 requiring AVX2 support if the actual operand size is YMMword. */
6258 if (t->cpu_flags.bitfield.cpuavx
6259 && t->cpu_flags.bitfield.cpuavx2
6260 && !cpu_arch_flags.bitfield.cpuavx2)
6261 {
6262 for (op = 0; op < t->operands; ++op)
6263 {
6264 if (t->operand_types[op].bitfield.xmmword
6265 && i.types[op].bitfield.ymmword)
6266 {
6267 i.error = unsupported;
6268 return 1;
6269 }
6270 }
6271 }
6272
6c30d220 6273 /* Without VSIB byte, we can't have a vector register for index. */
63112cd6 6274 if (!t->opcode_modifier.sib
6c30d220 6275 && i.index_reg
1b54b8d7
JB
6276 && (i.index_reg->reg_type.bitfield.xmmword
6277 || i.index_reg->reg_type.bitfield.ymmword
6278 || i.index_reg->reg_type.bitfield.zmmword))
6c30d220
L
6279 {
6280 i.error = unsupported_vector_index_register;
6281 return 1;
6282 }
6283
ad8ecc81 6284 /* Check if default mask is allowed. */
255571cd 6285 if (t->opcode_modifier.operandconstraint == NO_DEFAULT_MASK
6225c532 6286 && (!i.mask.reg || i.mask.reg->reg_num == 0))
ad8ecc81
MZ
6287 {
6288 i.error = no_default_mask;
6289 return 1;
6290 }
6291
7bab8ab5
JB
6292 /* For VSIB byte, we need a vector register for index, and all vector
6293 registers must be distinct. */
260cd341 6294 if (t->opcode_modifier.sib && t->opcode_modifier.sib != SIBMEM)
7bab8ab5
JB
6295 {
6296 if (!i.index_reg
63112cd6 6297 || !((t->opcode_modifier.sib == VECSIB128
1b54b8d7 6298 && i.index_reg->reg_type.bitfield.xmmword)
63112cd6 6299 || (t->opcode_modifier.sib == VECSIB256
1b54b8d7 6300 && i.index_reg->reg_type.bitfield.ymmword)
63112cd6 6301 || (t->opcode_modifier.sib == VECSIB512
1b54b8d7 6302 && i.index_reg->reg_type.bitfield.zmmword)))
7bab8ab5
JB
6303 {
6304 i.error = invalid_vsib_address;
6305 return 1;
6306 }
6307
6225c532
JB
6308 gas_assert (i.reg_operands == 2 || i.mask.reg);
6309 if (i.reg_operands == 2 && !i.mask.reg)
43234a1e 6310 {
3528c362 6311 gas_assert (i.types[0].bitfield.class == RegSIMD);
1b54b8d7
JB
6312 gas_assert (i.types[0].bitfield.xmmword
6313 || i.types[0].bitfield.ymmword);
3528c362 6314 gas_assert (i.types[2].bitfield.class == RegSIMD);
1b54b8d7
JB
6315 gas_assert (i.types[2].bitfield.xmmword
6316 || i.types[2].bitfield.ymmword);
43234a1e
L
6317 if (operand_check == check_none)
6318 return 0;
6319 if (register_number (i.op[0].regs)
6320 != register_number (i.index_reg)
6321 && register_number (i.op[2].regs)
6322 != register_number (i.index_reg)
6323 && register_number (i.op[0].regs)
6324 != register_number (i.op[2].regs))
6325 return 0;
6326 if (operand_check == check_error)
6327 {
6328 i.error = invalid_vector_register_set;
6329 return 1;
6330 }
6331 as_warn (_("mask, index, and destination registers should be distinct"));
6332 }
6225c532 6333 else if (i.reg_operands == 1 && i.mask.reg)
8444f82a 6334 {
3528c362 6335 if (i.types[1].bitfield.class == RegSIMD
1b54b8d7
JB
6336 && (i.types[1].bitfield.xmmword
6337 || i.types[1].bitfield.ymmword
6338 || i.types[1].bitfield.zmmword)
8444f82a
MZ
6339 && (register_number (i.op[1].regs)
6340 == register_number (i.index_reg)))
6341 {
6342 if (operand_check == check_error)
6343 {
6344 i.error = invalid_vector_register_set;
6345 return 1;
6346 }
6347 if (operand_check != check_none)
6348 as_warn (_("index and destination registers should be distinct"));
6349 }
6350 }
43234a1e 6351 }
7bab8ab5 6352
fc141319
L
6353 /* For AMX instructions with 3 TMM register operands, all operands
6354 must be distinct. */
6355 if (i.reg_operands == 3
6356 && t->operand_types[0].bitfield.tmmword
6357 && (i.op[0].regs == i.op[1].regs
6358 || i.op[0].regs == i.op[2].regs
6359 || i.op[1].regs == i.op[2].regs))
6360 {
6361 i.error = invalid_tmm_register_set;
6362 return 1;
260cd341
LC
6363 }
6364
0cc78721
CL
6365 /* For some special instructions require that destination must be distinct
6366 from source registers. */
255571cd 6367 if (t->opcode_modifier.operandconstraint == DISTINCT_DEST)
0cc78721
CL
6368 {
6369 unsigned int dest_reg = i.operands - 1;
6370
6371 know (i.operands >= 3);
6372
6373 /* #UD if dest_reg == src1_reg or dest_reg == src2_reg. */
6374 if (i.op[dest_reg - 1].regs == i.op[dest_reg].regs
6375 || (i.reg_operands > 2
6376 && i.op[dest_reg - 2].regs == i.op[dest_reg].regs))
6377 {
6378 i.error = invalid_dest_and_src_register_set;
6379 return 1;
6380 }
6381 }
6382
43234a1e
L
6383 /* Check if broadcast is supported by the instruction and is applied
6384 to the memory operand. */
a5748e0d 6385 if (i.broadcast.type || i.broadcast.bytes)
43234a1e 6386 {
8e6e0792 6387 i386_operand_type type, overlap;
43234a1e
L
6388
6389 /* Check if specified broadcast is supported in this instruction,
4a1b91ea 6390 and its broadcast bytes match the memory operand. */
5273a3cd 6391 op = i.broadcast.operand;
8e6e0792 6392 if (!t->opcode_modifier.broadcast
c48dadc9 6393 || !(i.flags[op] & Operand_Mem)
c39e5b26 6394 || (!i.types[op].bitfield.unspecified
4a1b91ea 6395 && !match_broadcast_size (t, op)))
43234a1e
L
6396 {
6397 bad_broadcast:
6398 i.error = unsupported_broadcast;
6399 return 1;
6400 }
8e6e0792
JB
6401
6402 operand_type_set (&type, 0);
a5748e0d 6403 switch (get_broadcast_bytes (t, false))
8e6e0792 6404 {
4a1b91ea
L
6405 case 2:
6406 type.bitfield.word = 1;
6407 break;
6408 case 4:
6409 type.bitfield.dword = 1;
6410 break;
8e6e0792
JB
6411 case 8:
6412 type.bitfield.qword = 1;
6413 break;
6414 case 16:
6415 type.bitfield.xmmword = 1;
6416 break;
6417 case 32:
6418 type.bitfield.ymmword = 1;
6419 break;
6420 case 64:
6421 type.bitfield.zmmword = 1;
6422 break;
6423 default:
6424 goto bad_broadcast;
6425 }
6426
6427 overlap = operand_type_and (type, t->operand_types[op]);
bc49bfd8
JB
6428 if (t->operand_types[op].bitfield.class == RegSIMD
6429 && t->operand_types[op].bitfield.byte
6430 + t->operand_types[op].bitfield.word
6431 + t->operand_types[op].bitfield.dword
6432 + t->operand_types[op].bitfield.qword > 1)
6433 {
6434 overlap.bitfield.xmmword = 0;
6435 overlap.bitfield.ymmword = 0;
6436 overlap.bitfield.zmmword = 0;
6437 }
8e6e0792
JB
6438 if (operand_type_all_zero (&overlap))
6439 goto bad_broadcast;
6440
9c19e9ec 6441 if (t->opcode_modifier.checkoperandsize)
8e6e0792
JB
6442 {
6443 unsigned int j;
6444
e2195274 6445 type.bitfield.baseindex = 1;
8e6e0792
JB
6446 for (j = 0; j < i.operands; ++j)
6447 {
6448 if (j != op
6449 && !operand_type_register_match(i.types[j],
6450 t->operand_types[j],
6451 type,
6452 t->operand_types[op]))
6453 goto bad_broadcast;
6454 }
6455 }
43234a1e
L
6456 }
6457 /* If broadcast is supported in this instruction, we need to check if
6458 operand of one-element size isn't specified without broadcast. */
6459 else if (t->opcode_modifier.broadcast && i.mem_operands)
6460 {
6461 /* Find memory operand. */
6462 for (op = 0; op < i.operands; op++)
8dc0818e 6463 if (i.flags[op] & Operand_Mem)
43234a1e
L
6464 break;
6465 gas_assert (op < i.operands);
6466 /* Check size of the memory operand. */
4a1b91ea 6467 if (match_broadcast_size (t, op))
43234a1e
L
6468 {
6469 i.error = broadcast_needed;
6470 return 1;
6471 }
6472 }
c39e5b26
JB
6473 else
6474 op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning. */
43234a1e
L
6475
6476 /* Check if requested masking is supported. */
6225c532 6477 if (i.mask.reg)
43234a1e 6478 {
ae2387fe
JB
6479 switch (t->opcode_modifier.masking)
6480 {
6481 case BOTH_MASKING:
6482 break;
6483 case MERGING_MASKING:
6225c532 6484 if (i.mask.zeroing)
ae2387fe
JB
6485 {
6486 case 0:
6487 i.error = unsupported_masking;
6488 return 1;
6489 }
6490 break;
6491 case DYNAMIC_MASKING:
6492 /* Memory destinations allow only merging masking. */
6225c532 6493 if (i.mask.zeroing && i.mem_operands)
ae2387fe
JB
6494 {
6495 /* Find memory operand. */
6496 for (op = 0; op < i.operands; op++)
c48dadc9 6497 if (i.flags[op] & Operand_Mem)
ae2387fe
JB
6498 break;
6499 gas_assert (op < i.operands);
6500 if (op == i.operands - 1)
6501 {
6502 i.error = unsupported_masking;
6503 return 1;
6504 }
6505 }
6506 break;
6507 default:
6508 abort ();
6509 }
43234a1e
L
6510 }
6511
6512 /* Check if masking is applied to dest operand. */
6225c532 6513 if (i.mask.reg && (i.mask.operand != i.operands - 1))
43234a1e
L
6514 {
6515 i.error = mask_not_on_destination;
6516 return 1;
6517 }
6518
43234a1e 6519 /* Check RC/SAE. */
ca5312a2 6520 if (i.rounding.type != rc_none)
43234a1e 6521 {
a80195f1 6522 if (!t->opcode_modifier.sae
cf665fee
JB
6523 || ((i.rounding.type != saeonly) != t->opcode_modifier.staticrounding)
6524 || i.mem_operands)
43234a1e
L
6525 {
6526 i.error = unsupported_rc_sae;
6527 return 1;
6528 }
cf665fee
JB
6529
6530 /* Non-EVEX.LIG forms need to have a ZMM register as at least one
6531 operand. */
6532 if (t->opcode_modifier.evex != EVEXLIG)
7bab8ab5 6533 {
cf665fee
JB
6534 for (op = 0; op < t->operands; ++op)
6535 if (i.types[op].bitfield.zmmword)
6536 break;
6537 if (op >= t->operands)
6538 {
6539 i.error = operand_size_mismatch;
6540 return 1;
6541 }
7bab8ab5 6542 }
6c30d220
L
6543 }
6544
da4977e0
JB
6545 /* Check the special Imm4 cases; must be the first operand. */
6546 if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
6547 {
6548 if (i.op[0].imms->X_op != O_constant
6549 || !fits_in_imm4 (i.op[0].imms->X_add_number))
6550 {
6551 i.error = bad_imm4;
6552 return 1;
6553 }
6554
6555 /* Turn off Imm<N> so that update_imm won't complain. */
6556 operand_type_set (&i.types[0], 0);
6557 }
6558
43234a1e 6559 /* Check vector Disp8 operand. */
b5014f7a 6560 if (t->opcode_modifier.disp8memshift
1a42a9fe 6561 && i.disp_encoding <= disp_encoding_8bit)
43234a1e 6562 {
9b345ce8 6563 if (i.broadcast.type || i.broadcast.bytes)
4a1b91ea 6564 i.memshift = t->opcode_modifier.broadcast - 1;
7091c612 6565 else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
43234a1e 6566 i.memshift = t->opcode_modifier.disp8memshift;
7091c612
JB
6567 else
6568 {
125ff819 6569 const i386_operand_type *type = NULL, *fallback = NULL;
7091c612
JB
6570
6571 i.memshift = 0;
6572 for (op = 0; op < i.operands; op++)
8dc0818e 6573 if (i.flags[op] & Operand_Mem)
7091c612 6574 {
4174bfff
JB
6575 if (t->opcode_modifier.evex == EVEXLIG)
6576 i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
6577 else if (t->operand_types[op].bitfield.xmmword
6578 + t->operand_types[op].bitfield.ymmword
6579 + t->operand_types[op].bitfield.zmmword <= 1)
7091c612
JB
6580 type = &t->operand_types[op];
6581 else if (!i.types[op].bitfield.unspecified)
6582 type = &i.types[op];
125ff819
JB
6583 else /* Ambiguities get resolved elsewhere. */
6584 fallback = &t->operand_types[op];
7091c612 6585 }
3528c362 6586 else if (i.types[op].bitfield.class == RegSIMD
4174bfff 6587 && t->opcode_modifier.evex != EVEXLIG)
7091c612
JB
6588 {
6589 if (i.types[op].bitfield.zmmword)
6590 i.memshift = 6;
6591 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
6592 i.memshift = 5;
6593 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
6594 i.memshift = 4;
6595 }
6596
125ff819
JB
6597 if (!type && !i.memshift)
6598 type = fallback;
7091c612
JB
6599 if (type)
6600 {
6601 if (type->bitfield.zmmword)
6602 i.memshift = 6;
6603 else if (type->bitfield.ymmword)
6604 i.memshift = 5;
6605 else if (type->bitfield.xmmword)
6606 i.memshift = 4;
6607 }
6608
6609 /* For the check in fits_in_disp8(). */
6610 if (i.memshift == 0)
6611 i.memshift = -1;
6612 }
43234a1e
L
6613
6614 for (op = 0; op < i.operands; op++)
6615 if (operand_type_check (i.types[op], disp)
6616 && i.op[op].disps->X_op == O_constant)
6617 {
b5014f7a 6618 if (fits_in_disp8 (i.op[op].disps->X_add_number))
43234a1e 6619 {
b5014f7a
JB
6620 i.types[op].bitfield.disp8 = 1;
6621 return 0;
43234a1e 6622 }
b5014f7a 6623 i.types[op].bitfield.disp8 = 0;
43234a1e
L
6624 }
6625 }
b5014f7a
JB
6626
6627 i.memshift = 0;
43234a1e 6628
6c30d220
L
6629 return 0;
6630}
6631
da4977e0 6632/* Check if encoding requirements are met by the instruction. */
a683cc34
SP
6633
6634static int
da4977e0 6635VEX_check_encoding (const insn_template *t)
a683cc34 6636{
da4977e0
JB
6637 if (i.vec_encoding == vex_encoding_error)
6638 {
6639 i.error = unsupported;
6640 return 1;
6641 }
6642
86fa6981 6643 if (i.vec_encoding == vex_encoding_evex)
43234a1e 6644 {
86fa6981 6645 /* This instruction must be encoded with EVEX prefix. */
e771e7c9 6646 if (!is_evex_encoding (t))
86fa6981
L
6647 {
6648 i.error = unsupported;
6649 return 1;
6650 }
6651 return 0;
43234a1e
L
6652 }
6653
a683cc34 6654 if (!t->opcode_modifier.vex)
86fa6981
L
6655 {
6656 /* This instruction template doesn't have VEX prefix. */
6657 if (i.vec_encoding != vex_encoding_default)
6658 {
6659 i.error = unsupported;
6660 return 1;
6661 }
6662 return 0;
6663 }
a683cc34 6664
a683cc34
SP
6665 return 0;
6666}
6667
7b94647a
JB
6668/* Helper function for the progress() macro in match_template(). */
6669static INLINE enum i386_error progress (enum i386_error new,
6670 enum i386_error last,
6671 unsigned int line, unsigned int *line_p)
6672{
6673 if (line <= *line_p)
6674 return last;
6675 *line_p = line;
6676 return new;
6677}
6678
d3ce72d0 6679static const insn_template *
83b16ac6 6680match_template (char mnem_suffix)
29b0f896
AM
6681{
6682 /* Points to template once we've found it. */
d3ce72d0 6683 const insn_template *t;
40fb9820 6684 i386_operand_type overlap0, overlap1, overlap2, overlap3;
c0f3af97 6685 i386_operand_type overlap4;
29b0f896 6686 unsigned int found_reverse_match;
40fb9820 6687 i386_operand_type operand_types [MAX_OPERANDS];
539e75ad 6688 int addr_prefix_disp;
7b94647a
JB
6689 unsigned int j, size_match, check_register, errline = __LINE__;
6690 enum i386_error specific_error = number_of_operands_mismatch;
6691#define progress(err) progress (err, specific_error, __LINE__, &errline)
29b0f896 6692
c0f3af97
L
6693#if MAX_OPERANDS != 5
6694# error "MAX_OPERANDS must be 5."
f48ff2ae
L
6695#endif
6696
29b0f896 6697 found_reverse_match = 0;
539e75ad 6698 addr_prefix_disp = -1;
40fb9820 6699
45aa61fe 6700 for (t = current_templates->start; t < current_templates->end; t++)
29b0f896 6701 {
539e75ad 6702 addr_prefix_disp = -1;
dbbc8b7e 6703 found_reverse_match = 0;
539e75ad 6704
7b94647a 6705 /* Must have right number of operands. */
29b0f896
AM
6706 if (i.operands != t->operands)
6707 continue;
6708
50aecf8c 6709 /* Check processor support. */
7b94647a 6710 specific_error = progress (unsupported);
45a4bb20 6711 if (cpu_flags_match (t) != CPU_FLAGS_PERFECT_MATCH)
50aecf8c
L
6712 continue;
6713
e1d4d893 6714 /* Check AT&T mnemonic. */
7b94647a 6715 specific_error = progress (unsupported_with_intel_mnemonic);
e1d4d893 6716 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
1efbbeb4
L
6717 continue;
6718
4b5aaf5f 6719 /* Check AT&T/Intel syntax. */
7b94647a 6720 specific_error = progress (unsupported_syntax);
5c07affc 6721 if ((intel_syntax && t->opcode_modifier.attsyntax)
4b5aaf5f 6722 || (!intel_syntax && t->opcode_modifier.intelsyntax))
1efbbeb4
L
6723 continue;
6724
4b5aaf5f
L
6725 /* Check Intel64/AMD64 ISA. */
6726 switch (isa64)
6727 {
6728 default:
6729 /* Default: Don't accept Intel64. */
6730 if (t->opcode_modifier.isa64 == INTEL64)
6731 continue;
6732 break;
6733 case amd64:
6734 /* -mamd64: Don't accept Intel64 and Intel64 only. */
6735 if (t->opcode_modifier.isa64 >= INTEL64)
6736 continue;
6737 break;
6738 case intel64:
6739 /* -mintel64: Don't accept AMD64. */
5990e377 6740 if (t->opcode_modifier.isa64 == AMD64 && flag_code == CODE_64BIT)
4b5aaf5f
L
6741 continue;
6742 break;
6743 }
6744
dc2be329 6745 /* Check the suffix. */
7b94647a 6746 specific_error = progress (invalid_instruction_suffix);
7505bb03
JB
6747 if ((t->opcode_modifier.no_bsuf && mnem_suffix == BYTE_MNEM_SUFFIX)
6748 || (t->opcode_modifier.no_wsuf && mnem_suffix == WORD_MNEM_SUFFIX)
6749 || (t->opcode_modifier.no_lsuf && mnem_suffix == LONG_MNEM_SUFFIX)
6750 || (t->opcode_modifier.no_ssuf && mnem_suffix == SHORT_MNEM_SUFFIX)
6751 || (t->opcode_modifier.no_qsuf && mnem_suffix == QWORD_MNEM_SUFFIX))
83b16ac6 6752 continue;
29b0f896 6753
7b94647a 6754 specific_error = progress (operand_size_mismatch);
3ac21baa
JB
6755 size_match = operand_size_match (t);
6756 if (!size_match)
7d5e4556 6757 continue;
539e75ad 6758
6f2f06be
JB
6759 /* This is intentionally not
6760
0cfa3eb3 6761 if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
6f2f06be
JB
6762
6763 as the case of a missing * on the operand is accepted (perhaps with
6764 a warning, issued further down). */
7b94647a 6765 specific_error = progress (operand_type_mismatch);
0cfa3eb3 6766 if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
7b94647a 6767 continue;
6f2f06be 6768
a4d3acd2
JB
6769 /* In Intel syntax, normally we can check for memory operand size when
6770 there is no mnemonic suffix. But jmp and call have 2 different
6771 encodings with Dword memory operand size. Skip the "near" one
6772 (permitting a register operand) when "far" was requested. */
6773 if (i.far_branch
6774 && t->opcode_modifier.jump == JUMP_ABSOLUTE
6775 && t->operand_types[0].bitfield.class == Reg)
6776 continue;
6777
5c07affc
L
6778 for (j = 0; j < MAX_OPERANDS; j++)
6779 operand_types[j] = t->operand_types[j];
6780
9db83a32 6781 /* In general, don't allow 32-bit operands on pre-386. */
7b94647a
JB
6782 specific_error = progress (mnem_suffix ? invalid_instruction_suffix
6783 : operand_size_mismatch);
4873e243 6784 j = i.imm_operands + (t->operands > i.imm_operands + 1);
9db83a32
JB
6785 if (i.suffix == LONG_MNEM_SUFFIX
6786 && !cpu_arch_flags.bitfield.cpui386
45aa61fe 6787 && (intel_syntax
3cd7f3e3 6788 ? (t->opcode_modifier.mnemonicsize != IGNORESIZE
76d3f746
JB
6789 && !intel_float_operand (insn_name (t)))
6790 : intel_float_operand (insn_name (t)) != 2)
4873e243
JB
6791 && (t->operands == i.imm_operands
6792 || (operand_types[i.imm_operands].bitfield.class != RegMMX
6793 && operand_types[i.imm_operands].bitfield.class != RegSIMD
6794 && operand_types[i.imm_operands].bitfield.class != RegMask)
6795 || (operand_types[j].bitfield.class != RegMMX
6796 && operand_types[j].bitfield.class != RegSIMD
6797 && operand_types[j].bitfield.class != RegMask))
63112cd6 6798 && !t->opcode_modifier.sib)
192dc9c6
JB
6799 continue;
6800
29b0f896 6801 /* Do not verify operands when there are none. */
e365e234 6802 if (!t->operands)
da4977e0
JB
6803 {
6804 if (VEX_check_encoding (t))
6805 {
7b94647a 6806 specific_error = progress (i.error);
da4977e0
JB
6807 continue;
6808 }
6809
6810 /* We've found a match; break out of loop. */
6811 break;
6812 }
252b5132 6813
48bcea9f
JB
6814 if (!t->opcode_modifier.jump
6815 || t->opcode_modifier.jump == JUMP_ABSOLUTE)
6816 {
6817 /* There should be only one Disp operand. */
6818 for (j = 0; j < MAX_OPERANDS; j++)
6819 if (operand_type_check (operand_types[j], disp))
539e75ad 6820 break;
48bcea9f
JB
6821 if (j < MAX_OPERANDS)
6822 {
5b7c81bd 6823 bool override = (i.prefix[ADDR_PREFIX] != 0);
48bcea9f
JB
6824
6825 addr_prefix_disp = j;
6826
a775efc8
JB
6827 /* Address size prefix will turn Disp64 operand into Disp32 and
6828 Disp32/Disp16 one into Disp16/Disp32 respectively. */
48bcea9f 6829 switch (flag_code)
40fb9820 6830 {
48bcea9f
JB
6831 case CODE_16BIT:
6832 override = !override;
6833 /* Fall through. */
6834 case CODE_32BIT:
6835 if (operand_types[j].bitfield.disp32
6836 && operand_types[j].bitfield.disp16)
40fb9820 6837 {
48bcea9f
JB
6838 operand_types[j].bitfield.disp16 = override;
6839 operand_types[j].bitfield.disp32 = !override;
40fb9820 6840 }
a775efc8 6841 gas_assert (!operand_types[j].bitfield.disp64);
48bcea9f
JB
6842 break;
6843
6844 case CODE_64BIT:
a775efc8 6845 if (operand_types[j].bitfield.disp64)
40fb9820 6846 {
a775efc8 6847 gas_assert (!operand_types[j].bitfield.disp32);
48bcea9f 6848 operand_types[j].bitfield.disp32 = override;
a775efc8 6849 operand_types[j].bitfield.disp64 = !override;
40fb9820 6850 }
48bcea9f
JB
6851 operand_types[j].bitfield.disp16 = 0;
6852 break;
40fb9820 6853 }
539e75ad 6854 }
48bcea9f 6855 }
539e75ad 6856
56ffb741 6857 /* We check register size if needed. */
9c19e9ec 6858 if (t->opcode_modifier.checkoperandsize)
e2195274
JB
6859 {
6860 check_register = (1 << t->operands) - 1;
a5748e0d 6861 if (i.broadcast.type || i.broadcast.bytes)
5273a3cd 6862 check_register &= ~(1 << i.broadcast.operand);
e2195274
JB
6863 }
6864 else
6865 check_register = 0;
6866
c6fb90c8 6867 overlap0 = operand_type_and (i.types[0], operand_types[0]);
29b0f896
AM
6868 switch (t->operands)
6869 {
6870 case 1:
40fb9820 6871 if (!operand_type_match (overlap0, i.types[0]))
29b0f896 6872 continue;
ae9a0a51
JB
6873
6874 /* Allow the ModR/M encoding to be requested by using the {load} or
6875 {store} pseudo prefix on an applicable insn. */
6876 if (!t->opcode_modifier.modrm
6877 && i.reg_operands == 1
6878 && ((i.dir_encoding == dir_encoding_load
6879 && t->mnem_off != MN_pop)
6880 || (i.dir_encoding == dir_encoding_store
6881 && t->mnem_off != MN_push))
6882 /* Avoid BSWAP. */
6883 && t->mnem_off != MN_bswap)
6884 continue;
29b0f896 6885 break;
ae9a0a51 6886
29b0f896 6887 case 2:
33eaf5de 6888 /* xchg %eax, %eax is a special case. It is an alias for nop
8b38ad71
L
6889 only in 32bit mode and we can use opcode 0x90. In 64bit
6890 mode, we can't use 0x90 for xchg %eax, %eax since it should
6891 zero-extend %eax to %rax. */
ae9a0a51
JB
6892 if (t->base_opcode == 0x90
6893 && t->opcode_space == SPACE_BASE)
6894 {
6895 if (flag_code == CODE_64BIT
6896 && i.types[0].bitfield.instance == Accum
6897 && i.types[0].bitfield.dword
6898 && i.types[1].bitfield.instance == Accum)
6899 continue;
6900
6901 /* Allow the ModR/M encoding to be requested by using the
6902 {load} or {store} pseudo prefix. */
6903 if (i.dir_encoding == dir_encoding_load
6904 || i.dir_encoding == dir_encoding_store)
6905 continue;
6906 }
e3669c7f
JB
6907
6908 if (t->base_opcode == MOV_AX_DISP32
ddb62495 6909 && t->opcode_space == SPACE_BASE
69196391 6910 && t->mnem_off != MN_movabs)
e3669c7f
JB
6911 {
6912 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
6913 if (i.reloc[0] == BFD_RELOC_386_GOT32)
6914 continue;
6915
6916 /* xrelease mov %eax, <disp> is another special case. It must not
6917 match the accumulator-only encoding of mov. */
6918 if (i.hle_prefix)
6919 continue;
ae9a0a51
JB
6920
6921 /* Allow the ModR/M encoding to be requested by using a suitable
6922 {load} or {store} pseudo prefix. */
6923 if (i.dir_encoding == (i.types[0].bitfield.instance == Accum
6924 ? dir_encoding_store
6925 : dir_encoding_load)
6926 && !i.types[0].bitfield.disp64
6927 && !i.types[1].bitfield.disp64)
6928 continue;
6929 }
6930
6931 /* Allow the ModR/M encoding to be requested by using the {load} or
6932 {store} pseudo prefix on an applicable insn. */
6933 if (!t->opcode_modifier.modrm
6934 && i.reg_operands == 1
6935 && i.imm_operands == 1
6936 && (i.dir_encoding == dir_encoding_load
6937 || i.dir_encoding == dir_encoding_store)
6938 && t->opcode_space == SPACE_BASE)
6939 {
6940 if (t->base_opcode == 0xb0 /* mov $imm, %reg */
6941 && i.dir_encoding == dir_encoding_store)
6942 continue;
6943
6944 if ((t->base_opcode | 0x38) == 0x3c /* <alu> $imm, %acc */
6945 && (t->base_opcode != 0x3c /* cmp $imm, %acc */
6946 || i.dir_encoding == dir_encoding_load))
6947 continue;
6948
6949 if (t->base_opcode == 0xa8 /* test $imm, %acc */
6950 && i.dir_encoding == dir_encoding_load)
6951 continue;
e3669c7f 6952 }
f5eb1d70
JB
6953 /* Fall through. */
6954
6955 case 3:
3ac21baa
JB
6956 if (!(size_match & MATCH_STRAIGHT))
6957 goto check_reverse;
64c49ab3
JB
6958 /* Reverse direction of operands if swapping is possible in the first
6959 place (operands need to be symmetric) and
6960 - the load form is requested, and the template is a store form,
6961 - the store form is requested, and the template is a load form,
6962 - the non-default (swapped) form is requested. */
6963 overlap1 = operand_type_and (operand_types[0], operand_types[1]);
f5eb1d70 6964 if (t->opcode_modifier.d && i.reg_operands == i.operands
64c49ab3
JB
6965 && !operand_type_all_zero (&overlap1))
6966 switch (i.dir_encoding)
6967 {
6968 case dir_encoding_load:
6969 if (operand_type_check (operand_types[i.operands - 1], anymem)
dfd69174 6970 || t->opcode_modifier.regmem)
64c49ab3
JB
6971 goto check_reverse;
6972 break;
6973
6974 case dir_encoding_store:
6975 if (!operand_type_check (operand_types[i.operands - 1], anymem)
dfd69174 6976 && !t->opcode_modifier.regmem)
64c49ab3
JB
6977 goto check_reverse;
6978 break;
6979
6980 case dir_encoding_swap:
6981 goto check_reverse;
6982
6983 case dir_encoding_default:
6984 break;
6985 }
86fa6981 6986 /* If we want store form, we skip the current load. */
64c49ab3
JB
6987 if ((i.dir_encoding == dir_encoding_store
6988 || i.dir_encoding == dir_encoding_swap)
86fa6981
L
6989 && i.mem_operands == 0
6990 && t->opcode_modifier.load)
fa99fab2 6991 continue;
1a0670f3 6992 /* Fall through. */
f48ff2ae 6993 case 4:
c0f3af97 6994 case 5:
c6fb90c8 6995 overlap1 = operand_type_and (i.types[1], operand_types[1]);
40fb9820
L
6996 if (!operand_type_match (overlap0, i.types[0])
6997 || !operand_type_match (overlap1, i.types[1])
e2195274 6998 || ((check_register & 3) == 3
dc821c5f 6999 && !operand_type_register_match (i.types[0],
40fb9820 7000 operand_types[0],
dc821c5f 7001 i.types[1],
40fb9820 7002 operand_types[1])))
29b0f896 7003 {
7b94647a
JB
7004 specific_error = progress (i.error);
7005
29b0f896 7006 /* Check if other direction is valid ... */
38e314eb 7007 if (!t->opcode_modifier.d)
29b0f896
AM
7008 continue;
7009
dc1e8a47 7010 check_reverse:
3ac21baa
JB
7011 if (!(size_match & MATCH_REVERSE))
7012 continue;
29b0f896 7013 /* Try reversing direction of operands. */
aa180741 7014 j = t->cpu_flags.bitfield.cpufma4
5dab1799 7015 || t->cpu_flags.bitfield.cpuxop ? 1 : i.operands - 1;
8bd915b7
JB
7016 overlap0 = operand_type_and (i.types[0], operand_types[j]);
7017 overlap1 = operand_type_and (i.types[j], operand_types[0]);
c975cec5
JB
7018 overlap2 = operand_type_and (i.types[1], operand_types[1]);
7019 gas_assert (t->operands != 3 || !check_register);
40fb9820 7020 if (!operand_type_match (overlap0, i.types[0])
8bd915b7 7021 || !operand_type_match (overlap1, i.types[j])
c975cec5
JB
7022 || (t->operands == 3
7023 && !operand_type_match (overlap2, i.types[1]))
45664ddb 7024 || (check_register
dc821c5f 7025 && !operand_type_register_match (i.types[0],
8bd915b7
JB
7026 operand_types[j],
7027 i.types[j],
45664ddb 7028 operand_types[0])))
29b0f896
AM
7029 {
7030 /* Does not match either direction. */
7b94647a 7031 specific_error = progress (i.error);
29b0f896
AM
7032 continue;
7033 }
ac9226cf 7034 /* found_reverse_match holds which variant of D
29b0f896 7035 we've found. */
38e314eb
JB
7036 if (!t->opcode_modifier.d)
7037 found_reverse_match = 0;
7038 else if (operand_types[0].bitfield.tbyte)
ac9226cf 7039 {
4943d587
JB
7040 if (t->opcode_modifier.operandconstraint != UGH)
7041 found_reverse_match = Opcode_FloatD;
bd782808
JB
7042 else
7043 found_reverse_match = ~0;
ac9226cf 7044 /* FSUB{,R} and FDIV{,R} may need a 2nd bit flipped. */
bd782808 7045 if ((t->extension_opcode & 4)
ac9226cf
JB
7046 && (intel_syntax || intel_mnemonic))
7047 found_reverse_match |= Opcode_FloatR;
7048 }
aa180741 7049 else if (t->cpu_flags.bitfield.cpufma4
5dab1799 7050 || t->cpu_flags.bitfield.cpuxop)
8bd915b7
JB
7051 {
7052 found_reverse_match = Opcode_VexW;
7053 goto check_operands_345;
7054 }
ddb62495
JB
7055 else if (t->opcode_space != SPACE_BASE
7056 && (t->opcode_space != SPACE_0F
2c735193
JB
7057 /* MOV to/from CR/DR/TR, as an exception, follow
7058 the base opcode space encoding model. */
7059 || (t->base_opcode | 7) != 0x27))
dbbc8b7e 7060 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
2c735193 7061 ? Opcode_ExtD : Opcode_SIMD_IntD;
a33ef3c2 7062 else if (!t->opcode_modifier.commutative)
38e314eb 7063 found_reverse_match = Opcode_D;
a33ef3c2
JB
7064 else
7065 found_reverse_match = ~0;
29b0f896 7066 }
f48ff2ae 7067 else
29b0f896 7068 {
f48ff2ae 7069 /* Found a forward 2 operand match here. */
8bd915b7 7070 check_operands_345:
d1cbb4db
L
7071 switch (t->operands)
7072 {
c0f3af97 7073 case 5:
3d0738af 7074 overlap4 = operand_type_and (i.types[4], operand_types[4]);
c0f3af97 7075 if (!operand_type_match (overlap4, i.types[4])
dc821c5f 7076 || !operand_type_register_match (i.types[3],
c0f3af97 7077 operand_types[3],
c0f3af97
L
7078 i.types[4],
7079 operand_types[4]))
7b94647a
JB
7080 {
7081 specific_error = progress (i.error);
7082 continue;
7083 }
1a0670f3 7084 /* Fall through. */
f48ff2ae 7085 case 4:
3d0738af 7086 overlap3 = operand_type_and (i.types[3], operand_types[3]);
40fb9820 7087 if (!operand_type_match (overlap3, i.types[3])
e2195274
JB
7088 || ((check_register & 0xa) == 0xa
7089 && !operand_type_register_match (i.types[1],
f7768225
JB
7090 operand_types[1],
7091 i.types[3],
e2195274
JB
7092 operand_types[3]))
7093 || ((check_register & 0xc) == 0xc
7094 && !operand_type_register_match (i.types[2],
7095 operand_types[2],
7096 i.types[3],
7097 operand_types[3])))
7b94647a
JB
7098 {
7099 specific_error = progress (i.error);
7100 continue;
7101 }
1a0670f3 7102 /* Fall through. */
f48ff2ae 7103 case 3:
3d0738af 7104 overlap2 = operand_type_and (i.types[2], operand_types[2]);
40fb9820 7105 if (!operand_type_match (overlap2, i.types[2])
e2195274
JB
7106 || ((check_register & 5) == 5
7107 && !operand_type_register_match (i.types[0],
23e42951
JB
7108 operand_types[0],
7109 i.types[2],
e2195274
JB
7110 operand_types[2]))
7111 || ((check_register & 6) == 6
7112 && !operand_type_register_match (i.types[1],
7113 operand_types[1],
7114 i.types[2],
7115 operand_types[2])))
7b94647a
JB
7116 {
7117 specific_error = progress (i.error);
7118 continue;
7119 }
f48ff2ae
L
7120 break;
7121 }
29b0f896 7122 }
f48ff2ae 7123 /* Found either forward/reverse 2, 3 or 4 operand match here:
29b0f896
AM
7124 slip through to break. */
7125 }
c0f3af97 7126
9bb4d860
L
7127 /* Check if VEX/EVEX encoding requirements can be satisfied. */
7128 if (VEX_check_encoding (t))
da4977e0 7129 {
7b94647a 7130 specific_error = progress (i.error);
da4977e0
JB
7131 continue;
7132 }
7133
9bb4d860
L
7134 /* Check if vector operands are valid. */
7135 if (check_VecOperands (t))
5614d22c 7136 {
7b94647a 7137 specific_error = progress (i.error);
5614d22c
JB
7138 continue;
7139 }
a683cc34 7140
29b0f896
AM
7141 /* We've found a match; break out of loop. */
7142 break;
7143 }
7144
7b94647a
JB
7145#undef progress
7146
29b0f896
AM
7147 if (t == current_templates->end)
7148 {
7149 /* We found no match. */
04784e33 7150 i.error = specific_error;
fa99fab2 7151 return NULL;
29b0f896 7152 }
252b5132 7153
29b0f896
AM
7154 if (!quiet_warnings)
7155 {
7156 if (!intel_syntax
0cfa3eb3 7157 && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
76d3f746 7158 as_warn (_("indirect %s without `*'"), insn_name (t));
29b0f896 7159
40fb9820 7160 if (t->opcode_modifier.isprefix
3cd7f3e3 7161 && t->opcode_modifier.mnemonicsize == IGNORESIZE)
29b0f896
AM
7162 {
7163 /* Warn them that a data or address size prefix doesn't
7164 affect assembly of the next line of code. */
76d3f746 7165 as_warn (_("stand-alone `%s' prefix"), insn_name (t));
29b0f896
AM
7166 }
7167 }
7168
7169 /* Copy the template we found. */
9a182d04 7170 install_template (t);
539e75ad
L
7171
7172 if (addr_prefix_disp != -1)
7173 i.tm.operand_types[addr_prefix_disp]
7174 = operand_types[addr_prefix_disp];
7175
8bd915b7 7176 switch (found_reverse_match)
29b0f896 7177 {
8bd915b7
JB
7178 case 0:
7179 break;
7180
bd782808
JB
7181 case Opcode_FloatR:
7182 case Opcode_FloatR | Opcode_FloatD:
7183 i.tm.extension_opcode ^= Opcode_FloatR >> 3;
7184 found_reverse_match &= Opcode_FloatD;
7185
7186 /* Fall through. */
8bd915b7 7187 default:
dfd69174
JB
7188 /* If we found a reverse match we must alter the opcode direction
7189 bit and clear/flip the regmem modifier one. found_reverse_match
7190 holds bits to change (different for int & float insns). */
29b0f896
AM
7191
7192 i.tm.base_opcode ^= found_reverse_match;
7193
dfd69174
JB
7194 /* Certain SIMD insns have their load forms specified in the opcode
7195 table, and hence we need to _set_ RegMem instead of clearing it.
7196 We need to avoid setting the bit though on insns like KMOVW. */
7197 i.tm.opcode_modifier.regmem
7198 = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
7199 && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
7200 && !i.tm.opcode_modifier.regmem;
a33ef3c2
JB
7201
7202 /* Fall through. */
7203 case ~0:
7204 i.tm.operand_types[0] = operand_types[i.operands - 1];
7205 i.tm.operand_types[i.operands - 1] = operand_types[0];
8bd915b7
JB
7206 break;
7207
7208 case Opcode_VexW:
7209 /* Only the first two register operands need reversing, alongside
7210 flipping VEX.W. */
7211 i.tm.opcode_modifier.vexw ^= VEXW0 ^ VEXW1;
7212
7213 j = i.tm.operand_types[0].bitfield.imm8;
7214 i.tm.operand_types[j] = operand_types[j + 1];
7215 i.tm.operand_types[j + 1] = operand_types[j];
7216 break;
29b0f896
AM
7217 }
7218
fa99fab2 7219 return t;
29b0f896
AM
7220}
7221
7222static int
e3bb37b5 7223check_string (void)
29b0f896 7224{
51c8edf6
JB
7225 unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
7226 unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
8dc0818e 7227
5e042380 7228 if (i.seg[op] != NULL && i.seg[op] != reg_es)
29b0f896 7229 {
51c8edf6 7230 as_bad (_("`%s' operand %u must use `%ses' segment"),
76d3f746 7231 insn_name (&i.tm),
51c8edf6
JB
7232 intel_syntax ? i.tm.operands - es_op : es_op + 1,
7233 register_prefix);
7234 return 0;
29b0f896 7235 }
51c8edf6
JB
7236
7237 /* There's only ever one segment override allowed per instruction.
7238 This instruction possibly has a legal segment override on the
7239 second operand, so copy the segment to where non-string
7240 instructions store it, allowing common code. */
7241 i.seg[op] = i.seg[1];
7242
29b0f896
AM
7243 return 1;
7244}
7245
7246static int
543613e9 7247process_suffix (void)
29b0f896 7248{
7fc69528 7249 bool is_movx = false;
8b65b895 7250
29b0f896
AM
7251 /* If matched instruction specifies an explicit instruction mnemonic
7252 suffix, use it. */
673fe0f0 7253 if (i.tm.opcode_modifier.size == SIZE16)
40fb9820 7254 i.suffix = WORD_MNEM_SUFFIX;
673fe0f0 7255 else if (i.tm.opcode_modifier.size == SIZE32)
40fb9820 7256 i.suffix = LONG_MNEM_SUFFIX;
673fe0f0 7257 else if (i.tm.opcode_modifier.size == SIZE64)
40fb9820 7258 i.suffix = QWORD_MNEM_SUFFIX;
13e600d0 7259 else if (i.reg_operands
c8f8eebc 7260 && (i.operands > 1 || i.types[0].bitfield.class == Reg)
255571cd 7261 && i.tm.opcode_modifier.operandconstraint != ADDR_PREFIX_OP_REG)
29b0f896 7262 {
65fca059 7263 unsigned int numop = i.operands;
389d00a5
JB
7264
7265 /* MOVSX/MOVZX */
ddb62495 7266 is_movx = (i.tm.opcode_space == SPACE_0F
389d00a5 7267 && (i.tm.base_opcode | 8) == 0xbe)
ddb62495 7268 || (i.tm.opcode_space == SPACE_BASE
389d00a5
JB
7269 && i.tm.base_opcode == 0x63
7270 && i.tm.cpu_flags.bitfield.cpu64);
7271
65fca059
JB
7272 /* movsx/movzx want only their source operand considered here, for the
7273 ambiguity checking below. The suffix will be replaced afterwards
7274 to represent the destination (register). */
389d00a5 7275 if (is_movx && (i.tm.opcode_modifier.w || i.tm.base_opcode == 0x63))
65fca059
JB
7276 --i.operands;
7277
643bb870 7278 /* crc32 needs REX.W set regardless of suffix / source operand size. */
7fc69528 7279 if (i.tm.mnem_off == MN_crc32 && i.tm.operand_types[1].bitfield.qword)
643bb870
JB
7280 i.rex |= REX_W;
7281
29b0f896 7282 /* If there's no instruction mnemonic suffix we try to invent one
13e600d0 7283 based on GPR operands. */
29b0f896
AM
7284 if (!i.suffix)
7285 {
7286 /* We take i.suffix from the last register operand specified,
7287 Destination register type is more significant than source
381d071f
L
7288 register type. crc32 in SSE4.2 prefers source register
7289 type. */
7fc69528 7290 unsigned int op = i.tm.mnem_off == MN_crc32 ? 1 : i.operands;
20592a94 7291
1a035124
JB
7292 while (op--)
7293 if (i.tm.operand_types[op].bitfield.instance == InstanceNone
7294 || i.tm.operand_types[op].bitfield.instance == Accum)
7295 {
7296 if (i.types[op].bitfield.class != Reg)
7297 continue;
7298 if (i.types[op].bitfield.byte)
7299 i.suffix = BYTE_MNEM_SUFFIX;
7300 else if (i.types[op].bitfield.word)
7301 i.suffix = WORD_MNEM_SUFFIX;
7302 else if (i.types[op].bitfield.dword)
7303 i.suffix = LONG_MNEM_SUFFIX;
7304 else if (i.types[op].bitfield.qword)
7305 i.suffix = QWORD_MNEM_SUFFIX;
7306 else
7307 continue;
7308 break;
7309 }
65fca059
JB
7310
7311 /* As an exception, movsx/movzx silently default to a byte source
7312 in AT&T mode. */
389d00a5 7313 if (is_movx && i.tm.opcode_modifier.w && !i.suffix && !intel_syntax)
65fca059 7314 i.suffix = BYTE_MNEM_SUFFIX;
29b0f896
AM
7315 }
7316 else if (i.suffix == BYTE_MNEM_SUFFIX)
7317 {
1cb0ab18 7318 if (!check_byte_reg ())
29b0f896
AM
7319 return 0;
7320 }
7321 else if (i.suffix == LONG_MNEM_SUFFIX)
7322 {
1cb0ab18 7323 if (!check_long_reg ())
29b0f896
AM
7324 return 0;
7325 }
7326 else if (i.suffix == QWORD_MNEM_SUFFIX)
7327 {
1cb0ab18 7328 if (!check_qword_reg ())
29b0f896
AM
7329 return 0;
7330 }
7331 else if (i.suffix == WORD_MNEM_SUFFIX)
7332 {
1cb0ab18 7333 if (!check_word_reg ())
29b0f896
AM
7334 return 0;
7335 }
3cd7f3e3
L
7336 else if (intel_syntax
7337 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE)
29b0f896
AM
7338 /* Do nothing if the instruction is going to ignore the prefix. */
7339 ;
7340 else
7341 abort ();
65fca059
JB
7342
7343 /* Undo the movsx/movzx change done above. */
7344 i.operands = numop;
29b0f896 7345 }
3cd7f3e3
L
7346 else if (i.tm.opcode_modifier.mnemonicsize == DEFAULTSIZE
7347 && !i.suffix)
29b0f896 7348 {
13e600d0
JB
7349 i.suffix = stackop_size;
7350 if (stackop_size == LONG_MNEM_SUFFIX)
06f74c5c
L
7351 {
7352 /* stackop_size is set to LONG_MNEM_SUFFIX for the
7353 .code16gcc directive to support 16-bit mode with
7354 32-bit address. For IRET without a suffix, generate
7355 16-bit IRET (opcode 0xcf) to return from an interrupt
7356 handler. */
13e600d0
JB
7357 if (i.tm.base_opcode == 0xcf)
7358 {
7359 i.suffix = WORD_MNEM_SUFFIX;
7360 as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
7361 }
7362 /* Warn about changed behavior for segment register push/pop. */
7363 else if ((i.tm.base_opcode | 1) == 0x07)
7364 as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
76d3f746 7365 insn_name (&i.tm));
06f74c5c 7366 }
29b0f896 7367 }
c006a730 7368 else if (!i.suffix
0cfa3eb3
JB
7369 && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
7370 || i.tm.opcode_modifier.jump == JUMP_BYTE
7371 || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
ddb62495 7372 || (i.tm.opcode_space == SPACE_0F
389d00a5 7373 && i.tm.base_opcode == 0x01 /* [ls][gi]dt */
64e74474 7374 && i.tm.extension_opcode <= 3)))
9306ca4a
JB
7375 {
7376 switch (flag_code)
7377 {
7378 case CODE_64BIT:
40fb9820 7379 if (!i.tm.opcode_modifier.no_qsuf)
9306ca4a 7380 {
828c2a25
JB
7381 if (i.tm.opcode_modifier.jump == JUMP_BYTE
7382 || i.tm.opcode_modifier.no_lsuf)
7383 i.suffix = QWORD_MNEM_SUFFIX;
9306ca4a
JB
7384 break;
7385 }
1a0670f3 7386 /* Fall through. */
9306ca4a 7387 case CODE_32BIT:
40fb9820 7388 if (!i.tm.opcode_modifier.no_lsuf)
9306ca4a
JB
7389 i.suffix = LONG_MNEM_SUFFIX;
7390 break;
7391 case CODE_16BIT:
40fb9820 7392 if (!i.tm.opcode_modifier.no_wsuf)
9306ca4a
JB
7393 i.suffix = WORD_MNEM_SUFFIX;
7394 break;
7395 }
7396 }
252b5132 7397
c006a730 7398 if (!i.suffix
3cd7f3e3 7399 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
873494c8
JB
7400 /* Also cover lret/retf/iret in 64-bit mode. */
7401 || (flag_code == CODE_64BIT
7402 && !i.tm.opcode_modifier.no_lsuf
7403 && !i.tm.opcode_modifier.no_qsuf))
3cd7f3e3 7404 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
8bbb3ad8
JB
7405 /* Explicit sizing prefixes are assumed to disambiguate insns. */
7406 && !i.prefix[DATA_PREFIX] && !(i.prefix[REX_PREFIX] & REX_W)
62b3f548
JB
7407 /* Accept FLDENV et al without suffix. */
7408 && (i.tm.opcode_modifier.no_ssuf || i.tm.opcode_modifier.floatmf))
29b0f896 7409 {
6c0946d0 7410 unsigned int suffixes, evex = 0;
c006a730
JB
7411
7412 suffixes = !i.tm.opcode_modifier.no_bsuf;
7413 if (!i.tm.opcode_modifier.no_wsuf)
7414 suffixes |= 1 << 1;
7415 if (!i.tm.opcode_modifier.no_lsuf)
7416 suffixes |= 1 << 2;
c006a730
JB
7417 if (!i.tm.opcode_modifier.no_ssuf)
7418 suffixes |= 1 << 4;
7419 if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
7420 suffixes |= 1 << 5;
7421
6c0946d0
JB
7422 /* For [XYZ]MMWORD operands inspect operand sizes. While generally
7423 also suitable for AT&T syntax mode, it was requested that this be
7424 restricted to just Intel syntax. */
a5748e0d
JB
7425 if (intel_syntax && is_any_vex_encoding (&i.tm)
7426 && !i.broadcast.type && !i.broadcast.bytes)
6c0946d0 7427 {
b9915cbc 7428 unsigned int op;
6c0946d0 7429
b9915cbc 7430 for (op = 0; op < i.tm.operands; ++op)
6c0946d0 7431 {
b9915cbc
JB
7432 if (is_evex_encoding (&i.tm)
7433 && !cpu_arch_flags.bitfield.cpuavx512vl)
6c0946d0 7434 {
b9915cbc
JB
7435 if (i.tm.operand_types[op].bitfield.ymmword)
7436 i.tm.operand_types[op].bitfield.xmmword = 0;
7437 if (i.tm.operand_types[op].bitfield.zmmword)
7438 i.tm.operand_types[op].bitfield.ymmword = 0;
7439 if (!i.tm.opcode_modifier.evex
7440 || i.tm.opcode_modifier.evex == EVEXDYN)
7441 i.tm.opcode_modifier.evex = EVEX512;
7442 }
6c0946d0 7443
b9915cbc
JB
7444 if (i.tm.operand_types[op].bitfield.xmmword
7445 + i.tm.operand_types[op].bitfield.ymmword
7446 + i.tm.operand_types[op].bitfield.zmmword < 2)
7447 continue;
6c0946d0 7448
b9915cbc
JB
7449 /* Any properly sized operand disambiguates the insn. */
7450 if (i.types[op].bitfield.xmmword
7451 || i.types[op].bitfield.ymmword
7452 || i.types[op].bitfield.zmmword)
7453 {
7454 suffixes &= ~(7 << 6);
7455 evex = 0;
7456 break;
7457 }
6c0946d0 7458
b9915cbc
JB
7459 if ((i.flags[op] & Operand_Mem)
7460 && i.tm.operand_types[op].bitfield.unspecified)
7461 {
7462 if (i.tm.operand_types[op].bitfield.xmmword)
7463 suffixes |= 1 << 6;
7464 if (i.tm.operand_types[op].bitfield.ymmword)
7465 suffixes |= 1 << 7;
7466 if (i.tm.operand_types[op].bitfield.zmmword)
7467 suffixes |= 1 << 8;
7468 if (is_evex_encoding (&i.tm))
7469 evex = EVEX512;
6c0946d0
JB
7470 }
7471 }
7472 }
7473
7474 /* Are multiple suffixes / operand sizes allowed? */
c006a730 7475 if (suffixes & (suffixes - 1))
9306ca4a 7476 {
873494c8 7477 if (intel_syntax
3cd7f3e3 7478 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
873494c8 7479 || operand_check == check_error))
9306ca4a 7480 {
76d3f746 7481 as_bad (_("ambiguous operand size for `%s'"), insn_name (&i.tm));
9306ca4a
JB
7482 return 0;
7483 }
c006a730 7484 if (operand_check == check_error)
9306ca4a 7485 {
c006a730 7486 as_bad (_("no instruction mnemonic suffix given and "
76d3f746 7487 "no register operands; can't size `%s'"), insn_name (&i.tm));
9306ca4a
JB
7488 return 0;
7489 }
c006a730 7490 if (operand_check == check_warning)
873494c8
JB
7491 as_warn (_("%s; using default for `%s'"),
7492 intel_syntax
7493 ? _("ambiguous operand size")
7494 : _("no instruction mnemonic suffix given and "
7495 "no register operands"),
76d3f746 7496 insn_name (&i.tm));
c006a730
JB
7497
7498 if (i.tm.opcode_modifier.floatmf)
7499 i.suffix = SHORT_MNEM_SUFFIX;
389d00a5 7500 else if (is_movx)
65fca059 7501 /* handled below */;
6c0946d0
JB
7502 else if (evex)
7503 i.tm.opcode_modifier.evex = evex;
c006a730
JB
7504 else if (flag_code == CODE_16BIT)
7505 i.suffix = WORD_MNEM_SUFFIX;
1a035124 7506 else if (!i.tm.opcode_modifier.no_lsuf)
c006a730 7507 i.suffix = LONG_MNEM_SUFFIX;
1a035124
JB
7508 else
7509 i.suffix = QWORD_MNEM_SUFFIX;
9306ca4a 7510 }
29b0f896 7511 }
252b5132 7512
389d00a5 7513 if (is_movx)
65fca059
JB
7514 {
7515 /* In Intel syntax, movsx/movzx must have a "suffix" (checked above).
7516 In AT&T syntax, if there is no suffix (warned about above), the default
7517 will be byte extension. */
7518 if (i.tm.opcode_modifier.w && i.suffix && i.suffix != BYTE_MNEM_SUFFIX)
7519 i.tm.base_opcode |= 1;
7520
7521 /* For further processing, the suffix should represent the destination
7522 (register). This is already the case when one was used with
7523 mov[sz][bw]*, but we need to replace it for mov[sz]x, or if there was
7524 no suffix to begin with. */
7525 if (i.tm.opcode_modifier.w || i.tm.base_opcode == 0x63 || !i.suffix)
7526 {
7527 if (i.types[1].bitfield.word)
7528 i.suffix = WORD_MNEM_SUFFIX;
7529 else if (i.types[1].bitfield.qword)
7530 i.suffix = QWORD_MNEM_SUFFIX;
7531 else
7532 i.suffix = LONG_MNEM_SUFFIX;
7533
7534 i.tm.opcode_modifier.w = 0;
7535 }
7536 }
7537
50128d0c
JB
7538 if (!i.tm.opcode_modifier.modrm && i.reg_operands && i.tm.operands < 3)
7539 i.short_form = (i.tm.operand_types[0].bitfield.class == Reg)
7540 != (i.tm.operand_types[1].bitfield.class == Reg);
7541
d2224064
JB
7542 /* Change the opcode based on the operand size given by i.suffix. */
7543 switch (i.suffix)
29b0f896 7544 {
d2224064
JB
7545 /* Size floating point instruction. */
7546 case LONG_MNEM_SUFFIX:
7547 if (i.tm.opcode_modifier.floatmf)
7548 {
7549 i.tm.base_opcode ^= 4;
7550 break;
7551 }
7552 /* fall through */
7553 case WORD_MNEM_SUFFIX:
7554 case QWORD_MNEM_SUFFIX:
29b0f896 7555 /* It's not a byte, select word/dword operation. */
40fb9820 7556 if (i.tm.opcode_modifier.w)
29b0f896 7557 {
50128d0c 7558 if (i.short_form)
29b0f896
AM
7559 i.tm.base_opcode |= 8;
7560 else
7561 i.tm.base_opcode |= 1;
7562 }
d2224064
JB
7563 /* fall through */
7564 case SHORT_MNEM_SUFFIX:
29b0f896
AM
7565 /* Now select between word & dword operations via the operand
7566 size prefix, except for instructions that will ignore this
7567 prefix anyway. */
c8f8eebc 7568 if (i.suffix != QWORD_MNEM_SUFFIX
3cd7f3e3 7569 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
c8f8eebc
JB
7570 && !i.tm.opcode_modifier.floatmf
7571 && !is_any_vex_encoding (&i.tm)
7572 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
7573 || (flag_code == CODE_64BIT
7574 && i.tm.opcode_modifier.jump == JUMP_BYTE)))
24eab124
AM
7575 {
7576 unsigned int prefix = DATA_PREFIX_OPCODE;
543613e9 7577
0cfa3eb3 7578 if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
29b0f896 7579 prefix = ADDR_PREFIX_OPCODE;
252b5132 7580
29b0f896
AM
7581 if (!add_prefix (prefix))
7582 return 0;
24eab124 7583 }
252b5132 7584
29b0f896
AM
7585 /* Set mode64 for an operand. */
7586 if (i.suffix == QWORD_MNEM_SUFFIX
9146926a 7587 && flag_code == CODE_64BIT
d2224064 7588 && !i.tm.opcode_modifier.norex64
4ed21b58 7589 && !i.tm.opcode_modifier.vexw
46e883c5 7590 /* Special case for xchg %rax,%rax. It is NOP and doesn't
d2224064
JB
7591 need rex64. */
7592 && ! (i.operands == 2
7593 && i.tm.base_opcode == 0x90
ddb62495 7594 && i.tm.opcode_space == SPACE_BASE
75e5731b
JB
7595 && i.types[0].bitfield.instance == Accum
7596 && i.types[0].bitfield.qword
44732014 7597 && i.types[1].bitfield.instance == Accum))
d2224064 7598 i.rex |= REX_W;
3e73aa7c 7599
d2224064 7600 break;
8bbb3ad8
JB
7601
7602 case 0:
f9a6a8f0 7603 /* Select word/dword/qword operation with explicit data sizing prefix
8bbb3ad8
JB
7604 when there are no suitable register operands. */
7605 if (i.tm.opcode_modifier.w
7606 && (i.prefix[DATA_PREFIX] || (i.prefix[REX_PREFIX] & REX_W))
7607 && (!i.reg_operands
7608 || (i.reg_operands == 1
7609 /* ShiftCount */
7610 && (i.tm.operand_types[0].bitfield.instance == RegC
7611 /* InOutPortReg */
7612 || i.tm.operand_types[0].bitfield.instance == RegD
7613 || i.tm.operand_types[1].bitfield.instance == RegD
7fc69528 7614 || i.tm.mnem_off == MN_crc32))))
8bbb3ad8
JB
7615 i.tm.base_opcode |= 1;
7616 break;
29b0f896 7617 }
7ecd2f8b 7618
255571cd 7619 if (i.tm.opcode_modifier.operandconstraint == ADDR_PREFIX_OP_REG)
c0a30a9f 7620 {
c8f8eebc
JB
7621 gas_assert (!i.suffix);
7622 gas_assert (i.reg_operands);
c0a30a9f 7623
c8f8eebc
JB
7624 if (i.tm.operand_types[0].bitfield.instance == Accum
7625 || i.operands == 1)
7626 {
7627 /* The address size override prefix changes the size of the
7628 first operand. */
7629 if (flag_code == CODE_64BIT
7630 && i.op[0].regs->reg_type.bitfield.word)
7631 {
7632 as_bad (_("16-bit addressing unavailable for `%s'"),
76d3f746 7633 insn_name (&i.tm));
c8f8eebc
JB
7634 return 0;
7635 }
7636
7637 if ((flag_code == CODE_32BIT
7638 ? i.op[0].regs->reg_type.bitfield.word
7639 : i.op[0].regs->reg_type.bitfield.dword)
7640 && !add_prefix (ADDR_PREFIX_OPCODE))
7641 return 0;
7642 }
c0a30a9f
L
7643 else
7644 {
c8f8eebc
JB
7645 /* Check invalid register operand when the address size override
7646 prefix changes the size of register operands. */
7647 unsigned int op;
7648 enum { need_word, need_dword, need_qword } need;
7649
27f13469 7650 /* Check the register operand for the address size prefix if
b3a3496f 7651 the memory operand has no real registers, like symbol, DISP
829f3fe1 7652 or bogus (x32-only) symbol(%rip) when symbol(%eip) is meant. */
27f13469
L
7653 if (i.mem_operands == 1
7654 && i.reg_operands == 1
7655 && i.operands == 2
27f13469 7656 && i.types[1].bitfield.class == Reg
b3a3496f
L
7657 && (flag_code == CODE_32BIT
7658 ? i.op[1].regs->reg_type.bitfield.word
7659 : i.op[1].regs->reg_type.bitfield.dword)
7660 && ((i.base_reg == NULL && i.index_reg == NULL)
829f3fe1
JB
7661#if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
7662 || (x86_elf_abi == X86_64_X32_ABI
7663 && i.base_reg
b3a3496f
L
7664 && i.base_reg->reg_num == RegIP
7665 && i.base_reg->reg_type.bitfield.qword))
829f3fe1
JB
7666#else
7667 || 0)
7668#endif
27f13469
L
7669 && !add_prefix (ADDR_PREFIX_OPCODE))
7670 return 0;
7671
c8f8eebc
JB
7672 if (flag_code == CODE_32BIT)
7673 need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
7674 else if (i.prefix[ADDR_PREFIX])
c0a30a9f
L
7675 need = need_dword;
7676 else
7677 need = flag_code == CODE_64BIT ? need_qword : need_word;
c0a30a9f 7678
c8f8eebc
JB
7679 for (op = 0; op < i.operands; op++)
7680 {
7681 if (i.types[op].bitfield.class != Reg)
7682 continue;
7683
7684 switch (need)
7685 {
7686 case need_word:
7687 if (i.op[op].regs->reg_type.bitfield.word)
7688 continue;
7689 break;
7690 case need_dword:
7691 if (i.op[op].regs->reg_type.bitfield.dword)
7692 continue;
7693 break;
7694 case need_qword:
7695 if (i.op[op].regs->reg_type.bitfield.qword)
7696 continue;
7697 break;
7698 }
7699
7700 as_bad (_("invalid register operand size for `%s'"),
76d3f746 7701 insn_name (&i.tm));
c8f8eebc
JB
7702 return 0;
7703 }
7704 }
c0a30a9f
L
7705 }
7706
29b0f896
AM
7707 return 1;
7708}
3e73aa7c 7709
29b0f896 7710static int
543613e9 7711check_byte_reg (void)
29b0f896
AM
7712{
7713 int op;
543613e9 7714
29b0f896
AM
7715 for (op = i.operands; --op >= 0;)
7716 {
dc821c5f 7717 /* Skip non-register operands. */
bab6aec1 7718 if (i.types[op].bitfield.class != Reg)
dc821c5f
JB
7719 continue;
7720
29b0f896
AM
7721 /* If this is an eight bit register, it's OK. If it's the 16 or
7722 32 bit version of an eight bit register, we will just use the
7723 low portion, and that's OK too. */
dc821c5f 7724 if (i.types[op].bitfield.byte)
29b0f896
AM
7725 continue;
7726
5a819eb9 7727 /* I/O port address operands are OK too. */
75e5731b
JB
7728 if (i.tm.operand_types[op].bitfield.instance == RegD
7729 && i.tm.operand_types[op].bitfield.word)
5a819eb9
JB
7730 continue;
7731
9706160a 7732 /* crc32 only wants its source operand checked here. */
7fc69528 7733 if (i.tm.mnem_off == MN_crc32 && op != 0)
9344ff29
L
7734 continue;
7735
29b0f896 7736 /* Any other register is bad. */
73c76375
JB
7737 as_bad (_("`%s%s' not allowed with `%s%c'"),
7738 register_prefix, i.op[op].regs->reg_name,
76d3f746 7739 insn_name (&i.tm), i.suffix);
73c76375 7740 return 0;
29b0f896
AM
7741 }
7742 return 1;
7743}
7744
7745static int
e3bb37b5 7746check_long_reg (void)
29b0f896
AM
7747{
7748 int op;
7749
7750 for (op = i.operands; --op >= 0;)
dc821c5f 7751 /* Skip non-register operands. */
bab6aec1 7752 if (i.types[op].bitfield.class != Reg)
dc821c5f 7753 continue;
29b0f896
AM
7754 /* Reject eight bit registers, except where the template requires
7755 them. (eg. movzb) */
dc821c5f 7756 else if (i.types[op].bitfield.byte
bab6aec1 7757 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7758 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f
JB
7759 && (i.tm.operand_types[op].bitfield.word
7760 || i.tm.operand_types[op].bitfield.dword))
29b0f896 7761 {
a540244d
L
7762 as_bad (_("`%s%s' not allowed with `%s%c'"),
7763 register_prefix,
29b0f896 7764 i.op[op].regs->reg_name,
76d3f746 7765 insn_name (&i.tm),
29b0f896
AM
7766 i.suffix);
7767 return 0;
7768 }
be4c5e58
L
7769 /* Error if the e prefix on a general reg is missing. */
7770 else if (i.types[op].bitfield.word
bab6aec1 7771 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7772 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f 7773 && i.tm.operand_types[op].bitfield.dword)
29b0f896 7774 {
be4c5e58
L
7775 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7776 register_prefix, i.op[op].regs->reg_name,
7777 i.suffix);
7778 return 0;
252b5132 7779 }
e4630f71 7780 /* Warn if the r prefix on a general reg is present. */
dc821c5f 7781 else if (i.types[op].bitfield.qword
bab6aec1 7782 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7783 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f 7784 && i.tm.operand_types[op].bitfield.dword)
252b5132 7785 {
1cb0ab18
JB
7786 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7787 register_prefix, i.op[op].regs->reg_name, i.suffix);
7788 return 0;
29b0f896
AM
7789 }
7790 return 1;
7791}
252b5132 7792
29b0f896 7793static int
e3bb37b5 7794check_qword_reg (void)
29b0f896
AM
7795{
7796 int op;
252b5132 7797
29b0f896 7798 for (op = i.operands; --op >= 0; )
dc821c5f 7799 /* Skip non-register operands. */
bab6aec1 7800 if (i.types[op].bitfield.class != Reg)
dc821c5f 7801 continue;
29b0f896
AM
7802 /* Reject eight bit registers, except where the template requires
7803 them. (eg. movzb) */
dc821c5f 7804 else if (i.types[op].bitfield.byte
bab6aec1 7805 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7806 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f
JB
7807 && (i.tm.operand_types[op].bitfield.word
7808 || i.tm.operand_types[op].bitfield.dword))
29b0f896 7809 {
a540244d
L
7810 as_bad (_("`%s%s' not allowed with `%s%c'"),
7811 register_prefix,
29b0f896 7812 i.op[op].regs->reg_name,
76d3f746 7813 insn_name (&i.tm),
29b0f896
AM
7814 i.suffix);
7815 return 0;
7816 }
e4630f71 7817 /* Warn if the r prefix on a general reg is missing. */
dc821c5f
JB
7818 else if ((i.types[op].bitfield.word
7819 || i.types[op].bitfield.dword)
bab6aec1 7820 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7821 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f 7822 && i.tm.operand_types[op].bitfield.qword)
29b0f896
AM
7823 {
7824 /* Prohibit these changes in the 64bit mode, since the
7825 lowering is more complicated. */
1cb0ab18
JB
7826 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7827 register_prefix, i.op[op].regs->reg_name, i.suffix);
7828 return 0;
252b5132 7829 }
29b0f896
AM
7830 return 1;
7831}
252b5132 7832
29b0f896 7833static int
e3bb37b5 7834check_word_reg (void)
29b0f896
AM
7835{
7836 int op;
7837 for (op = i.operands; --op >= 0;)
dc821c5f 7838 /* Skip non-register operands. */
bab6aec1 7839 if (i.types[op].bitfield.class != Reg)
dc821c5f 7840 continue;
29b0f896
AM
7841 /* Reject eight bit registers, except where the template requires
7842 them. (eg. movzb) */
dc821c5f 7843 else if (i.types[op].bitfield.byte
bab6aec1 7844 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7845 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f
JB
7846 && (i.tm.operand_types[op].bitfield.word
7847 || i.tm.operand_types[op].bitfield.dword))
29b0f896 7848 {
a540244d
L
7849 as_bad (_("`%s%s' not allowed with `%s%c'"),
7850 register_prefix,
29b0f896 7851 i.op[op].regs->reg_name,
76d3f746 7852 insn_name (&i.tm),
29b0f896
AM
7853 i.suffix);
7854 return 0;
7855 }
9706160a
JB
7856 /* Error if the e or r prefix on a general reg is present. */
7857 else if ((i.types[op].bitfield.dword
dc821c5f 7858 || i.types[op].bitfield.qword)
bab6aec1 7859 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7860 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f 7861 && i.tm.operand_types[op].bitfield.word)
252b5132 7862 {
9706160a
JB
7863 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7864 register_prefix, i.op[op].regs->reg_name,
7865 i.suffix);
7866 return 0;
29b0f896
AM
7867 }
7868 return 1;
7869}
252b5132 7870
29b0f896 7871static int
40fb9820 7872update_imm (unsigned int j)
29b0f896 7873{
bc0844ae 7874 i386_operand_type overlap = i.types[j];
c34d1cc9
JB
7875
7876 if (i.tm.operand_types[j].bitfield.imm8
7877 && i.tm.operand_types[j].bitfield.imm8s
7878 && overlap.bitfield.imm8 && overlap.bitfield.imm8s)
7879 {
7880 /* This combination is used on 8-bit immediates where e.g. $~0 is
7881 desirable to permit. We're past operand type matching, so simply
7882 put things back in the shape they were before introducing the
7883 distinction between Imm8, Imm8S, and Imm8|Imm8S. */
7884 overlap.bitfield.imm8s = 0;
7885 }
7886
be1643ff
JB
7887 if (overlap.bitfield.imm8
7888 + overlap.bitfield.imm8s
7889 + overlap.bitfield.imm16
7890 + overlap.bitfield.imm32
7891 + overlap.bitfield.imm32s
7892 + overlap.bitfield.imm64 > 1)
29b0f896 7893 {
05909f23
JB
7894 static const i386_operand_type imm16 = { .bitfield = { .imm16 = 1 } };
7895 static const i386_operand_type imm32 = { .bitfield = { .imm32 = 1 } };
7896 static const i386_operand_type imm32s = { .bitfield = { .imm32s = 1 } };
7897 static const i386_operand_type imm16_32 = { .bitfield =
7898 { .imm16 = 1, .imm32 = 1 }
7899 };
7900 static const i386_operand_type imm16_32s = { .bitfield =
7901 { .imm16 = 1, .imm32s = 1 }
7902 };
7903 static const i386_operand_type imm16_32_32s = { .bitfield =
7904 { .imm16 = 1, .imm32 = 1, .imm32s = 1 }
7905 };
7906
29b0f896
AM
7907 if (i.suffix)
7908 {
40fb9820
L
7909 i386_operand_type temp;
7910
0dfbf9d7 7911 operand_type_set (&temp, 0);
7ab9ffdd 7912 if (i.suffix == BYTE_MNEM_SUFFIX)
40fb9820
L
7913 {
7914 temp.bitfield.imm8 = overlap.bitfield.imm8;
7915 temp.bitfield.imm8s = overlap.bitfield.imm8s;
7916 }
7917 else if (i.suffix == WORD_MNEM_SUFFIX)
7918 temp.bitfield.imm16 = overlap.bitfield.imm16;
7919 else if (i.suffix == QWORD_MNEM_SUFFIX)
7920 {
7921 temp.bitfield.imm64 = overlap.bitfield.imm64;
7922 temp.bitfield.imm32s = overlap.bitfield.imm32s;
7923 }
7924 else
7925 temp.bitfield.imm32 = overlap.bitfield.imm32;
7926 overlap = temp;
29b0f896 7927 }
0dfbf9d7
L
7928 else if (operand_type_equal (&overlap, &imm16_32_32s)
7929 || operand_type_equal (&overlap, &imm16_32)
7930 || operand_type_equal (&overlap, &imm16_32s))
29b0f896 7931 {
40fb9820 7932 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
65da13b5 7933 overlap = imm16;
40fb9820 7934 else
65da13b5 7935 overlap = imm32s;
29b0f896 7936 }
8bbb3ad8
JB
7937 else if (i.prefix[REX_PREFIX] & REX_W)
7938 overlap = operand_type_and (overlap, imm32s);
7939 else if (i.prefix[DATA_PREFIX])
7940 overlap = operand_type_and (overlap,
7941 flag_code != CODE_16BIT ? imm16 : imm32);
be1643ff
JB
7942 if (overlap.bitfield.imm8
7943 + overlap.bitfield.imm8s
7944 + overlap.bitfield.imm16
7945 + overlap.bitfield.imm32
7946 + overlap.bitfield.imm32s
7947 + overlap.bitfield.imm64 != 1)
29b0f896 7948 {
4eed87de
AM
7949 as_bad (_("no instruction mnemonic suffix given; "
7950 "can't determine immediate size"));
29b0f896
AM
7951 return 0;
7952 }
7953 }
40fb9820 7954 i.types[j] = overlap;
29b0f896 7955
40fb9820
L
7956 return 1;
7957}
7958
7959static int
7960finalize_imm (void)
7961{
bc0844ae 7962 unsigned int j, n;
29b0f896 7963
bc0844ae
L
7964 /* Update the first 2 immediate operands. */
7965 n = i.operands > 2 ? 2 : i.operands;
7966 if (n)
7967 {
7968 for (j = 0; j < n; j++)
7969 if (update_imm (j) == 0)
7970 return 0;
40fb9820 7971
bc0844ae
L
7972 /* The 3rd operand can't be immediate operand. */
7973 gas_assert (operand_type_check (i.types[2], imm) == 0);
7974 }
29b0f896
AM
7975
7976 return 1;
7977}
7978
0a3eba42
JB
7979static INLINE void set_rex_vrex (const reg_entry *r, unsigned int rex_bit,
7980 bool do_sse2avx)
7981{
7982 if (r->reg_flags & RegRex)
7983 {
7984 if (i.rex & rex_bit)
7985 as_bad (_("same type of prefix used twice"));
7986 i.rex |= rex_bit;
7987 }
7988 else if (do_sse2avx && (i.rex & rex_bit) && i.vex.register_specifier)
7989 {
7990 gas_assert (i.vex.register_specifier == r);
7991 i.vex.register_specifier += 8;
7992 }
7993
7994 if (r->reg_flags & RegVRex)
7995 i.vrex |= rex_bit;
7996}
7997
29b0f896 7998static int
e3bb37b5 7999process_operands (void)
29b0f896
AM
8000{
8001 /* Default segment register this instruction will use for memory
8002 accesses. 0 means unknown. This is only for optimizing out
8003 unnecessary segment overrides. */
5e042380 8004 const reg_entry *default_seg = NULL;
29b0f896 8005
31b4cda3
JB
8006 /* We only need to check those implicit registers for instructions
8007 with 3 operands or less. */
8008 if (i.operands <= 3)
8009 for (unsigned int j = 0; j < i.operands; j++)
8010 if (i.types[j].bitfield.instance != InstanceNone)
8011 i.reg_operands--;
8012
a5aeccd9
JB
8013 if (i.tm.opcode_modifier.sse2avx)
8014 {
8015 /* Legacy encoded insns allow explicit REX prefixes, so these prefixes
8016 need converting. */
8017 i.rex |= i.prefix[REX_PREFIX] & (REX_W | REX_R | REX_X | REX_B);
8018 i.prefix[REX_PREFIX] = 0;
8019 i.rex_encoding = 0;
8020 }
c423d21a
JB
8021 /* ImmExt should be processed after SSE2AVX. */
8022 else if (i.tm.opcode_modifier.immext)
8023 process_immext ();
a5aeccd9 8024
2426c15f 8025 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
29b0f896 8026 {
05909f23
JB
8027 static const i386_operand_type regxmm = {
8028 .bitfield = { .class = RegSIMD, .xmmword = 1 }
8029 };
91d6fa6a
NC
8030 unsigned int dupl = i.operands;
8031 unsigned int dest = dupl - 1;
9fcfb3d7
L
8032 unsigned int j;
8033
c0f3af97 8034 /* The destination must be an xmm register. */
9c2799c2 8035 gas_assert (i.reg_operands
91d6fa6a 8036 && MAX_OPERANDS > dupl
7ab9ffdd 8037 && operand_type_equal (&i.types[dest], &regxmm));
c0f3af97 8038
75e5731b 8039 if (i.tm.operand_types[0].bitfield.instance == Accum
1b54b8d7 8040 && i.tm.operand_types[0].bitfield.xmmword)
e2ec9d29 8041 {
95dfdd85
JB
8042 /* Keep xmm0 for instructions with VEX prefix and 3
8043 sources. */
8044 i.tm.operand_types[0].bitfield.instance = InstanceNone;
8045 i.tm.operand_types[0].bitfield.class = RegSIMD;
31b4cda3 8046 i.reg_operands++;
95dfdd85 8047 goto duplicate;
c0f3af97 8048 }
95dfdd85
JB
8049
8050 if (i.tm.opcode_modifier.operandconstraint == IMPLICIT_1ST_XMM0)
7ab9ffdd 8051 {
aa180741 8052 gas_assert ((MAX_OPERANDS - 1) > dupl);
c0f3af97
L
8053
8054 /* Add the implicit xmm0 for instructions with VEX prefix
8055 and 3 sources. */
8056 for (j = i.operands; j > 0; j--)
8057 {
8058 i.op[j] = i.op[j - 1];
8059 i.types[j] = i.types[j - 1];
8060 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
8dc0818e 8061 i.flags[j] = i.flags[j - 1];
c0f3af97
L
8062 }
8063 i.op[0].regs
629310ab 8064 = (const reg_entry *) str_hash_find (reg_hash, "xmm0");
7ab9ffdd 8065 i.types[0] = regxmm;
c0f3af97
L
8066 i.tm.operand_types[0] = regxmm;
8067
8068 i.operands += 2;
8069 i.reg_operands += 2;
8070 i.tm.operands += 2;
8071
91d6fa6a 8072 dupl++;
c0f3af97 8073 dest++;
91d6fa6a
NC
8074 i.op[dupl] = i.op[dest];
8075 i.types[dupl] = i.types[dest];
8076 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
8dc0818e 8077 i.flags[dupl] = i.flags[dest];
e2ec9d29 8078 }
c0f3af97
L
8079 else
8080 {
dc1e8a47 8081 duplicate:
c0f3af97
L
8082 i.operands++;
8083 i.reg_operands++;
8084 i.tm.operands++;
8085
91d6fa6a
NC
8086 i.op[dupl] = i.op[dest];
8087 i.types[dupl] = i.types[dest];
8088 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
8dc0818e 8089 i.flags[dupl] = i.flags[dest];
c0f3af97
L
8090 }
8091
8092 if (i.tm.opcode_modifier.immext)
8093 process_immext ();
8094 }
75e5731b 8095 else if (i.tm.operand_types[0].bitfield.instance == Accum
bd782808 8096 && i.tm.opcode_modifier.modrm)
c0f3af97
L
8097 {
8098 unsigned int j;
8099
9fcfb3d7
L
8100 for (j = 1; j < i.operands; j++)
8101 {
8102 i.op[j - 1] = i.op[j];
8103 i.types[j - 1] = i.types[j];
8104
8105 /* We need to adjust fields in i.tm since they are used by
8106 build_modrm_byte. */
8107 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
8dc0818e
JB
8108
8109 i.flags[j - 1] = i.flags[j];
9fcfb3d7
L
8110 }
8111
31b4cda3
JB
8112 /* No adjustment to i.reg_operands: This was already done at the top
8113 of the function. */
e2ec9d29 8114 i.operands--;
e2ec9d29
L
8115 i.tm.operands--;
8116 }
255571cd 8117 else if (i.tm.opcode_modifier.operandconstraint == IMPLICIT_QUAD_GROUP)
920d2ddc 8118 {
a477a8c4
JB
8119 unsigned int regnum, first_reg_in_group, last_reg_in_group;
8120
920d2ddc 8121 /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
3528c362 8122 gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
a477a8c4
JB
8123 regnum = register_number (i.op[1].regs);
8124 first_reg_in_group = regnum & ~3;
8125 last_reg_in_group = first_reg_in_group + 3;
8126 if (regnum != first_reg_in_group)
8127 as_warn (_("source register `%s%s' implicitly denotes"
8128 " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
8129 register_prefix, i.op[1].regs->reg_name,
8130 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
8131 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
76d3f746 8132 insn_name (&i.tm));
a477a8c4 8133 }
255571cd 8134 else if (i.tm.opcode_modifier.operandconstraint == REG_KLUDGE)
e2ec9d29
L
8135 {
8136 /* The imul $imm, %reg instruction is converted into
8137 imul $imm, %reg, %reg, and the clr %reg instruction
8138 is converted into xor %reg, %reg. */
8139
8140 unsigned int first_reg_op;
8141
8142 if (operand_type_check (i.types[0], reg))
8143 first_reg_op = 0;
8144 else
8145 first_reg_op = 1;
8146 /* Pretend we saw the extra register operand. */
9c2799c2 8147 gas_assert (i.reg_operands == 1
7ab9ffdd 8148 && i.op[first_reg_op + 1].regs == 0);
e2ec9d29
L
8149 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
8150 i.types[first_reg_op + 1] = i.types[first_reg_op];
8151 i.operands++;
8152 i.reg_operands++;
29b0f896
AM
8153 }
8154
85b80b0f 8155 if (i.tm.opcode_modifier.modrm)
29b0f896
AM
8156 {
8157 /* The opcode is completed (modulo i.tm.extension_opcode which
52271982
AM
8158 must be put into the modrm byte). Now, we make the modrm and
8159 index base bytes based on all the info we've collected. */
29b0f896
AM
8160
8161 default_seg = build_modrm_byte ();
bd782808
JB
8162
8163 if (!quiet_warnings && i.tm.opcode_modifier.operandconstraint == UGH)
8164 {
8165 /* Warn about some common errors, but press on regardless. */
8166 if (i.operands == 2)
8167 {
8168 /* Reversed arguments on faddp or fmulp. */
8169 as_warn (_("translating to `%s %s%s,%s%s'"), insn_name (&i.tm),
8170 register_prefix, i.op[!intel_syntax].regs->reg_name,
8171 register_prefix, i.op[intel_syntax].regs->reg_name);
8172 }
8173 else if (i.tm.opcode_modifier.mnemonicsize == IGNORESIZE)
8174 {
8175 /* Extraneous `l' suffix on fp insn. */
8176 as_warn (_("translating to `%s %s%s'"), insn_name (&i.tm),
8177 register_prefix, i.op[0].regs->reg_name);
8178 }
8179 }
29b0f896 8180 }
00cee14f 8181 else if (i.types[0].bitfield.class == SReg)
85b80b0f
JB
8182 {
8183 if (flag_code != CODE_64BIT
8184 ? i.tm.base_opcode == POP_SEG_SHORT
8185 && i.op[0].regs->reg_num == 1
389d00a5 8186 : (i.tm.base_opcode | 1) == (POP_SEG386_SHORT & 0xff)
85b80b0f
JB
8187 && i.op[0].regs->reg_num < 4)
8188 {
8189 as_bad (_("you can't `%s %s%s'"),
76d3f746 8190 insn_name (&i.tm), register_prefix, i.op[0].regs->reg_name);
85b80b0f
JB
8191 return 0;
8192 }
389d00a5 8193 if (i.op[0].regs->reg_num > 3
ddb62495 8194 && i.tm.opcode_space == SPACE_BASE )
85b80b0f 8195 {
389d00a5 8196 i.tm.base_opcode ^= (POP_SEG_SHORT ^ POP_SEG386_SHORT) & 0xff;
ddb62495 8197 i.tm.opcode_space = SPACE_0F;
85b80b0f
JB
8198 }
8199 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
8200 }
ddb62495 8201 else if (i.tm.opcode_space == SPACE_BASE
389d00a5 8202 && (i.tm.base_opcode & ~3) == MOV_AX_DISP32)
29b0f896 8203 {
5e042380 8204 default_seg = reg_ds;
29b0f896 8205 }
40fb9820 8206 else if (i.tm.opcode_modifier.isstring)
29b0f896
AM
8207 {
8208 /* For the string instructions that allow a segment override
8209 on one of their operands, the default segment is ds. */
5e042380 8210 default_seg = reg_ds;
29b0f896 8211 }
50128d0c 8212 else if (i.short_form)
85b80b0f 8213 {
bd782808 8214 /* The register operand is in operand 0 or 1. */
4943d587 8215 const reg_entry *r = i.op[0].regs;
85b80b0f 8216
4943d587
JB
8217 if (i.imm_operands
8218 || (r->reg_type.bitfield.instance == Accum && i.op[1].regs))
8219 r = i.op[1].regs;
85b80b0f 8220 /* Register goes in low 3 bits of opcode. */
4943d587 8221 i.tm.base_opcode |= r->reg_num;
0a3eba42 8222 set_rex_vrex (r, REX_B, false);
85b80b0f 8223 }
29b0f896 8224
514a8bb0 8225 if ((i.seg[0] || i.prefix[SEG_PREFIX])
7fc69528 8226 && i.tm.mnem_off == MN_lea)
92334ad2
JB
8227 {
8228 if (!quiet_warnings)
76d3f746 8229 as_warn (_("segment override on `%s' is ineffectual"), insn_name (&i.tm));
739d7649 8230 if (optimize && !i.no_optimize)
92334ad2
JB
8231 {
8232 i.seg[0] = NULL;
8233 i.prefix[SEG_PREFIX] = 0;
8234 }
8235 }
52271982
AM
8236
8237 /* If a segment was explicitly specified, and the specified segment
b6773884
JB
8238 is neither the default nor the one already recorded from a prefix,
8239 use an opcode prefix to select it. If we never figured out what
8240 the default segment is, then default_seg will be zero at this
8241 point, and the specified segment prefix will always be used. */
8242 if (i.seg[0]
8243 && i.seg[0] != default_seg
5e042380 8244 && i386_seg_prefixes[i.seg[0]->reg_num] != i.prefix[SEG_PREFIX])
29b0f896 8245 {
5e042380 8246 if (!add_prefix (i386_seg_prefixes[i.seg[0]->reg_num]))
29b0f896
AM
8247 return 0;
8248 }
8249 return 1;
8250}
8251
5e042380 8252static const reg_entry *
e3bb37b5 8253build_modrm_byte (void)
29b0f896 8254{
5e042380 8255 const reg_entry *default_seg = NULL;
c0f3af97 8256 unsigned int source, dest;
aa180741 8257 bool vex_3_sources = (i.reg_operands + i.mem_operands == 4);
c0f3af97 8258
c0f3af97
L
8259 if (vex_3_sources)
8260 {
91d6fa6a 8261 unsigned int nds, reg_slot;
4c2c6516 8262 expressionS *exp;
c0f3af97 8263
6b8d3588 8264 dest = i.operands - 1;
c0f3af97 8265 nds = dest - 1;
922d8de8 8266
a683cc34 8267 /* There are 2 kinds of instructions:
bed3d976 8268 1. 5 operands: 4 register operands or 3 register operands
9d3bf266 8269 plus 1 memory operand plus one Imm4 operand, VexXDS, and
bed3d976 8270 VexW0 or VexW1. The destination must be either XMM, YMM or
43234a1e 8271 ZMM register.
bed3d976 8272 2. 4 operands: 4 register operands or 3 register operands
2f1bada2 8273 plus 1 memory operand, with VexXDS. */
aa180741 8274 gas_assert (i.tm.opcode_modifier.vexvvvv == VEXXDS
dcd7e323 8275 && i.tm.opcode_modifier.vexw
3528c362 8276 && i.tm.operand_types[dest].bitfield.class == RegSIMD);
a683cc34 8277
48db9223
JB
8278 /* If VexW1 is set, the first non-immediate operand is the source and
8279 the second non-immediate one is encoded in the immediate operand. */
8280 if (i.tm.opcode_modifier.vexw == VEXW1)
8281 {
8282 source = i.imm_operands;
8283 reg_slot = i.imm_operands + 1;
8284 }
8285 else
8286 {
8287 source = i.imm_operands + 1;
8288 reg_slot = i.imm_operands;
8289 }
8290
a683cc34 8291 if (i.imm_operands == 0)
bed3d976
JB
8292 {
8293 /* When there is no immediate operand, generate an 8bit
8294 immediate operand to encode the first operand. */
8295 exp = &im_expressions[i.imm_operands++];
8296 i.op[i.operands].imms = exp;
be1643ff 8297 i.types[i.operands].bitfield.imm8 = 1;
bed3d976
JB
8298 i.operands++;
8299
3528c362 8300 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
bed3d976
JB
8301 exp->X_op = O_constant;
8302 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
43234a1e
L
8303 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
8304 }
922d8de8 8305 else
bed3d976 8306 {
9d3bf266
JB
8307 gas_assert (i.imm_operands == 1);
8308 gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
8309 gas_assert (!i.tm.opcode_modifier.immext);
a683cc34 8310
9d3bf266
JB
8311 /* Turn on Imm8 again so that output_imm will generate it. */
8312 i.types[0].bitfield.imm8 = 1;
bed3d976 8313
3528c362 8314 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
9d3bf266 8315 i.op[0].imms->X_add_number
bed3d976 8316 |= register_number (i.op[reg_slot].regs) << 4;
43234a1e 8317 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
bed3d976 8318 }
a683cc34 8319
3528c362 8320 gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
dae39acc 8321 i.vex.register_specifier = i.op[nds].regs;
c0f3af97
L
8322 }
8323 else
8324 source = dest = 0;
29b0f896
AM
8325
8326 /* i.reg_operands MUST be the number of real register operands;
c0f3af97
L
8327 implicit registers do not count. If there are 3 register
8328 operands, it must be a instruction with VexNDS. For a
8329 instruction with VexNDD, the destination register is encoded
8330 in VEX prefix. If there are 4 register operands, it must be
8331 a instruction with VEX prefix and 3 sources. */
7ab9ffdd
L
8332 if (i.mem_operands == 0
8333 && ((i.reg_operands == 2
2426c15f 8334 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7ab9ffdd 8335 || (i.reg_operands == 3
2426c15f 8336 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7ab9ffdd 8337 || (i.reg_operands == 4 && vex_3_sources)))
29b0f896 8338 {
cab737b9
L
8339 switch (i.operands)
8340 {
8341 case 2:
8342 source = 0;
8343 break;
8344 case 3:
c81128dc
L
8345 /* When there are 3 operands, one of them may be immediate,
8346 which may be the first or the last operand. Otherwise,
c0f3af97
L
8347 the first operand must be shift count register (cl) or it
8348 is an instruction with VexNDS. */
9c2799c2 8349 gas_assert (i.imm_operands == 1
7ab9ffdd 8350 || (i.imm_operands == 0
2426c15f 8351 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
75e5731b
JB
8352 || (i.types[0].bitfield.instance == RegC
8353 && i.types[0].bitfield.byte))));
40fb9820 8354 if (operand_type_check (i.types[0], imm)
75e5731b
JB
8355 || (i.types[0].bitfield.instance == RegC
8356 && i.types[0].bitfield.byte))
40fb9820
L
8357 source = 1;
8358 else
8359 source = 0;
cab737b9
L
8360 break;
8361 case 4:
368d64cc
L
8362 /* When there are 4 operands, the first two must be 8bit
8363 immediate operands. The source operand will be the 3rd
c0f3af97
L
8364 one.
8365
8366 For instructions with VexNDS, if the first operand
8367 an imm8, the source operand is the 2nd one. If the last
8368 operand is imm8, the source operand is the first one. */
9c2799c2 8369 gas_assert ((i.imm_operands == 2
7ab9ffdd
L
8370 && i.types[0].bitfield.imm8
8371 && i.types[1].bitfield.imm8)
2426c15f 8372 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7ab9ffdd
L
8373 && i.imm_operands == 1
8374 && (i.types[0].bitfield.imm8
c34d1cc9 8375 || i.types[0].bitfield.imm8s
cf665fee 8376 || i.types[i.operands - 1].bitfield.imm8)));
9f2670f2
L
8377 if (i.imm_operands == 2)
8378 source = 2;
8379 else
c0f3af97
L
8380 {
8381 if (i.types[0].bitfield.imm8)
8382 source = 1;
8383 else
8384 source = 0;
8385 }
c0f3af97
L
8386 break;
8387 case 5:
cf665fee
JB
8388 gas_assert (!is_evex_encoding (&i.tm));
8389 gas_assert (i.imm_operands == 1 && vex_3_sources);
cab737b9
L
8390 break;
8391 default:
8392 abort ();
8393 }
8394
c0f3af97
L
8395 if (!vex_3_sources)
8396 {
8397 dest = source + 1;
8398
2426c15f 8399 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
c0f3af97 8400 {
43234a1e 8401 /* For instructions with VexNDS, the register-only source
c5d0745b 8402 operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
dfd69174 8403 register. It is encoded in VEX prefix. */
f12dc422
L
8404
8405 i386_operand_type op;
8406 unsigned int vvvv;
8407
c2ecccb3 8408 /* Swap two source operands if needed. */
255571cd 8409 if (i.tm.opcode_modifier.operandconstraint == SWAP_SOURCES)
f12dc422
L
8410 {
8411 vvvv = source;
8412 source = dest;
8413 }
8414 else
8415 vvvv = dest;
8416
8417 op = i.tm.operand_types[vvvv];
c0f3af97 8418 if ((dest + 1) >= i.operands
bab6aec1 8419 || ((op.bitfield.class != Reg
dc821c5f 8420 || (!op.bitfield.dword && !op.bitfield.qword))
3528c362 8421 && op.bitfield.class != RegSIMD
c0f327b8 8422 && op.bitfield.class != RegMask))
c0f3af97 8423 abort ();
f12dc422 8424 i.vex.register_specifier = i.op[vvvv].regs;
c0f3af97
L
8425 dest++;
8426 }
8427 }
29b0f896
AM
8428
8429 i.rm.mode = 3;
dfd69174
JB
8430 /* One of the register operands will be encoded in the i.rm.reg
8431 field, the other in the combined i.rm.mode and i.rm.regmem
29b0f896
AM
8432 fields. If no form of this instruction supports a memory
8433 destination operand, then we assume the source operand may
8434 sometimes be a memory operand and so we need to store the
8435 destination in the i.rm.reg field. */
dfd69174 8436 if (!i.tm.opcode_modifier.regmem
40fb9820 8437 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
29b0f896
AM
8438 {
8439 i.rm.reg = i.op[dest].regs->reg_num;
8440 i.rm.regmem = i.op[source].regs->reg_num;
a5aeccd9 8441 set_rex_vrex (i.op[dest].regs, REX_R, i.tm.opcode_modifier.sse2avx);
5b7c81bd 8442 set_rex_vrex (i.op[source].regs, REX_B, false);
29b0f896
AM
8443 }
8444 else
8445 {
8446 i.rm.reg = i.op[source].regs->reg_num;
8447 i.rm.regmem = i.op[dest].regs->reg_num;
a5aeccd9 8448 set_rex_vrex (i.op[dest].regs, REX_B, i.tm.opcode_modifier.sse2avx);
5b7c81bd 8449 set_rex_vrex (i.op[source].regs, REX_R, false);
29b0f896 8450 }
e0c7f900 8451 if (flag_code != CODE_64BIT && (i.rex & REX_R))
c4a530c5 8452 {
4a5c67ed 8453 if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
c4a530c5 8454 abort ();
e0c7f900 8455 i.rex &= ~REX_R;
c4a530c5
JB
8456 add_prefix (LOCK_PREFIX_OPCODE);
8457 }
29b0f896
AM
8458 }
8459 else
8460 { /* If it's not 2 reg operands... */
c0f3af97
L
8461 unsigned int mem;
8462
29b0f896
AM
8463 if (i.mem_operands)
8464 {
8465 unsigned int fake_zero_displacement = 0;
99018f42 8466 unsigned int op;
4eed87de 8467
7ab9ffdd 8468 for (op = 0; op < i.operands; op++)
8dc0818e 8469 if (i.flags[op] & Operand_Mem)
7ab9ffdd 8470 break;
7ab9ffdd 8471 gas_assert (op < i.operands);
29b0f896 8472
63112cd6 8473 if (i.tm.opcode_modifier.sib)
6c30d220 8474 {
260cd341
LC
8475 /* The index register of VSIB shouldn't be RegIZ. */
8476 if (i.tm.opcode_modifier.sib != SIBMEM
8477 && i.index_reg->reg_num == RegIZ)
6c30d220
L
8478 abort ();
8479
8480 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8481 if (!i.base_reg)
8482 {
8483 i.sib.base = NO_BASE_REGISTER;
8484 i.sib.scale = i.log2_scale_factor;
2f2be86b 8485 i.types[op] = operand_type_and_not (i.types[op], anydisp);
a775efc8 8486 i.types[op].bitfield.disp32 = 1;
6c30d220 8487 }
260cd341
LC
8488
8489 /* Since the mandatory SIB always has index register, so
8490 the code logic remains unchanged. The non-mandatory SIB
8491 without index register is allowed and will be handled
8492 later. */
8493 if (i.index_reg)
8494 {
8495 if (i.index_reg->reg_num == RegIZ)
8496 i.sib.index = NO_INDEX_REGISTER;
8497 else
8498 i.sib.index = i.index_reg->reg_num;
5b7c81bd 8499 set_rex_vrex (i.index_reg, REX_X, false);
260cd341 8500 }
6c30d220
L
8501 }
8502
5e042380 8503 default_seg = reg_ds;
29b0f896
AM
8504
8505 if (i.base_reg == 0)
8506 {
8507 i.rm.mode = 0;
8508 if (!i.disp_operands)
9bb129e8 8509 fake_zero_displacement = 1;
29b0f896
AM
8510 if (i.index_reg == 0)
8511 {
260cd341
LC
8512 /* Both check for VSIB and mandatory non-vector SIB. */
8513 gas_assert (!i.tm.opcode_modifier.sib
8514 || i.tm.opcode_modifier.sib == SIBMEM);
29b0f896 8515 /* Operand is just <disp> */
2f2be86b 8516 i.types[op] = operand_type_and_not (i.types[op], anydisp);
20f0a1fc 8517 if (flag_code == CODE_64BIT)
29b0f896
AM
8518 {
8519 /* 64bit mode overwrites the 32bit absolute
8520 addressing by RIP relative addressing and
8521 absolute addressing is encoded by one of the
8522 redundant SIB forms. */
8523 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8524 i.sib.base = NO_BASE_REGISTER;
8525 i.sib.index = NO_INDEX_REGISTER;
a775efc8 8526 i.types[op].bitfield.disp32 = 1;
20f0a1fc 8527 }
fc225355
L
8528 else if ((flag_code == CODE_16BIT)
8529 ^ (i.prefix[ADDR_PREFIX] != 0))
20f0a1fc
NC
8530 {
8531 i.rm.regmem = NO_BASE_REGISTER_16;
2f2be86b 8532 i.types[op].bitfield.disp16 = 1;
20f0a1fc
NC
8533 }
8534 else
8535 {
8536 i.rm.regmem = NO_BASE_REGISTER;
2f2be86b 8537 i.types[op].bitfield.disp32 = 1;
29b0f896
AM
8538 }
8539 }
63112cd6 8540 else if (!i.tm.opcode_modifier.sib)
29b0f896 8541 {
6c30d220 8542 /* !i.base_reg && i.index_reg */
e968fc9b 8543 if (i.index_reg->reg_num == RegIZ)
db51cc60
L
8544 i.sib.index = NO_INDEX_REGISTER;
8545 else
8546 i.sib.index = i.index_reg->reg_num;
29b0f896
AM
8547 i.sib.base = NO_BASE_REGISTER;
8548 i.sib.scale = i.log2_scale_factor;
8549 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
2f2be86b 8550 i.types[op] = operand_type_and_not (i.types[op], anydisp);
a775efc8 8551 i.types[op].bitfield.disp32 = 1;
29b0f896 8552 if ((i.index_reg->reg_flags & RegRex) != 0)
161a04f6 8553 i.rex |= REX_X;
29b0f896
AM
8554 }
8555 }
8556 /* RIP addressing for 64bit mode. */
e968fc9b 8557 else if (i.base_reg->reg_num == RegIP)
29b0f896 8558 {
63112cd6 8559 gas_assert (!i.tm.opcode_modifier.sib);
29b0f896 8560 i.rm.regmem = NO_BASE_REGISTER;
40fb9820
L
8561 i.types[op].bitfield.disp8 = 0;
8562 i.types[op].bitfield.disp16 = 0;
a775efc8 8563 i.types[op].bitfield.disp32 = 1;
40fb9820 8564 i.types[op].bitfield.disp64 = 0;
71903a11 8565 i.flags[op] |= Operand_PCrel;
20f0a1fc
NC
8566 if (! i.disp_operands)
8567 fake_zero_displacement = 1;
29b0f896 8568 }
dc821c5f 8569 else if (i.base_reg->reg_type.bitfield.word)
29b0f896 8570 {
63112cd6 8571 gas_assert (!i.tm.opcode_modifier.sib);
29b0f896
AM
8572 switch (i.base_reg->reg_num)
8573 {
8574 case 3: /* (%bx) */
8575 if (i.index_reg == 0)
8576 i.rm.regmem = 7;
8577 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
8578 i.rm.regmem = i.index_reg->reg_num - 6;
8579 break;
8580 case 5: /* (%bp) */
5e042380 8581 default_seg = reg_ss;
29b0f896
AM
8582 if (i.index_reg == 0)
8583 {
8584 i.rm.regmem = 6;
40fb9820 8585 if (operand_type_check (i.types[op], disp) == 0)
29b0f896
AM
8586 {
8587 /* fake (%bp) into 0(%bp) */
41eb8e88 8588 if (i.disp_encoding == disp_encoding_16bit)
1a02d6b0
L
8589 i.types[op].bitfield.disp16 = 1;
8590 else
8591 i.types[op].bitfield.disp8 = 1;
252b5132 8592 fake_zero_displacement = 1;
29b0f896
AM
8593 }
8594 }
8595 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
8596 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
8597 break;
8598 default: /* (%si) -> 4 or (%di) -> 5 */
8599 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
8600 }
41eb8e88
L
8601 if (!fake_zero_displacement
8602 && !i.disp_operands
8603 && i.disp_encoding)
8604 {
8605 fake_zero_displacement = 1;
8606 if (i.disp_encoding == disp_encoding_8bit)
8607 i.types[op].bitfield.disp8 = 1;
8608 else
8609 i.types[op].bitfield.disp16 = 1;
8610 }
29b0f896
AM
8611 i.rm.mode = mode_from_disp_size (i.types[op]);
8612 }
8613 else /* i.base_reg and 32/64 bit mode */
8614 {
a9aabc23 8615 if (operand_type_check (i.types[op], disp))
40fb9820 8616 {
73053c1f
JB
8617 i.types[op].bitfield.disp16 = 0;
8618 i.types[op].bitfield.disp64 = 0;
a775efc8 8619 i.types[op].bitfield.disp32 = 1;
40fb9820 8620 }
20f0a1fc 8621
63112cd6 8622 if (!i.tm.opcode_modifier.sib)
6c30d220 8623 i.rm.regmem = i.base_reg->reg_num;
29b0f896 8624 if ((i.base_reg->reg_flags & RegRex) != 0)
161a04f6 8625 i.rex |= REX_B;
29b0f896
AM
8626 i.sib.base = i.base_reg->reg_num;
8627 /* x86-64 ignores REX prefix bit here to avoid decoder
8628 complications. */
848930b2
JB
8629 if (!(i.base_reg->reg_flags & RegRex)
8630 && (i.base_reg->reg_num == EBP_REG_NUM
8631 || i.base_reg->reg_num == ESP_REG_NUM))
5e042380 8632 default_seg = reg_ss;
848930b2 8633 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
29b0f896 8634 {
848930b2 8635 fake_zero_displacement = 1;
1a02d6b0
L
8636 if (i.disp_encoding == disp_encoding_32bit)
8637 i.types[op].bitfield.disp32 = 1;
8638 else
8639 i.types[op].bitfield.disp8 = 1;
29b0f896
AM
8640 }
8641 i.sib.scale = i.log2_scale_factor;
8642 if (i.index_reg == 0)
8643 {
260cd341
LC
8644 /* Only check for VSIB. */
8645 gas_assert (i.tm.opcode_modifier.sib != VECSIB128
8646 && i.tm.opcode_modifier.sib != VECSIB256
8647 && i.tm.opcode_modifier.sib != VECSIB512);
8648
29b0f896
AM
8649 /* <disp>(%esp) becomes two byte modrm with no index
8650 register. We've already stored the code for esp
8651 in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
8652 Any base register besides %esp will not use the
8653 extra modrm byte. */
8654 i.sib.index = NO_INDEX_REGISTER;
29b0f896 8655 }
63112cd6 8656 else if (!i.tm.opcode_modifier.sib)
29b0f896 8657 {
e968fc9b 8658 if (i.index_reg->reg_num == RegIZ)
db51cc60
L
8659 i.sib.index = NO_INDEX_REGISTER;
8660 else
8661 i.sib.index = i.index_reg->reg_num;
29b0f896
AM
8662 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8663 if ((i.index_reg->reg_flags & RegRex) != 0)
161a04f6 8664 i.rex |= REX_X;
29b0f896 8665 }
67a4f2b7
AO
8666
8667 if (i.disp_operands
8668 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
8669 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
8670 i.rm.mode = 0;
8671 else
a501d77e
L
8672 {
8673 if (!fake_zero_displacement
8674 && !i.disp_operands
8675 && i.disp_encoding)
8676 {
8677 fake_zero_displacement = 1;
8678 if (i.disp_encoding == disp_encoding_8bit)
8679 i.types[op].bitfield.disp8 = 1;
8680 else
8681 i.types[op].bitfield.disp32 = 1;
8682 }
8683 i.rm.mode = mode_from_disp_size (i.types[op]);
8684 }
29b0f896 8685 }
252b5132 8686
29b0f896
AM
8687 if (fake_zero_displacement)
8688 {
8689 /* Fakes a zero displacement assuming that i.types[op]
8690 holds the correct displacement size. */
8691 expressionS *exp;
8692
9c2799c2 8693 gas_assert (i.op[op].disps == 0);
29b0f896
AM
8694 exp = &disp_expressions[i.disp_operands++];
8695 i.op[op].disps = exp;
8696 exp->X_op = O_constant;
8697 exp->X_add_number = 0;
8698 exp->X_add_symbol = (symbolS *) 0;
8699 exp->X_op_symbol = (symbolS *) 0;
8700 }
c0f3af97
L
8701
8702 mem = op;
29b0f896 8703 }
c0f3af97
L
8704 else
8705 mem = ~0;
252b5132 8706
5dab1799 8707 if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
f88c9eb0
SP
8708 {
8709 i.vex.register_specifier = i.op[2].regs;
8710 if (!i.mem_operands)
8711 {
8712 i.rm.mode = 3;
8713 i.rm.regmem = i.op[1].regs->reg_num;
8714 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8715 i.rex |= REX_B;
8716 }
8717 }
29b0f896
AM
8718 /* Fill in i.rm.reg or i.rm.regmem field with register operand
8719 (if any) based on i.tm.extension_opcode. Again, we must be
8720 careful to make sure that segment/control/debug/test/MMX
8721 registers are coded into the i.rm.reg field. */
f88c9eb0 8722 else if (i.reg_operands)
29b0f896 8723 {
99018f42 8724 unsigned int op;
7ab9ffdd
L
8725 unsigned int vex_reg = ~0;
8726
8727 for (op = 0; op < i.operands; op++)
921eafea
L
8728 if (i.types[op].bitfield.class == Reg
8729 || i.types[op].bitfield.class == RegBND
8730 || i.types[op].bitfield.class == RegMask
8731 || i.types[op].bitfield.class == SReg
8732 || i.types[op].bitfield.class == RegCR
8733 || i.types[op].bitfield.class == RegDR
8734 || i.types[op].bitfield.class == RegTR
8735 || i.types[op].bitfield.class == RegSIMD
8736 || i.types[op].bitfield.class == RegMMX)
8737 break;
c0209578 8738
7ab9ffdd
L
8739 if (vex_3_sources)
8740 op = dest;
2426c15f 8741 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7ab9ffdd
L
8742 {
8743 /* For instructions with VexNDS, the register-only
8744 source operand is encoded in VEX prefix. */
8745 gas_assert (mem != (unsigned int) ~0);
c0f3af97 8746
a93e3234 8747 if (op > mem || i.tm.cpu_flags.bitfield.cpucmpccxadd)
c0f3af97 8748 {
7ab9ffdd
L
8749 vex_reg = op++;
8750 gas_assert (op < i.operands);
c0f3af97
L
8751 }
8752 else
c0f3af97 8753 {
f12dc422
L
8754 /* Check register-only source operand when two source
8755 operands are swapped. */
8756 if (!i.tm.operand_types[op].bitfield.baseindex
8757 && i.tm.operand_types[op + 1].bitfield.baseindex)
8758 {
8759 vex_reg = op;
8760 op += 2;
8761 gas_assert (mem == (vex_reg + 1)
8762 && op < i.operands);
8763 }
8764 else
8765 {
8766 vex_reg = op + 1;
8767 gas_assert (vex_reg < i.operands);
8768 }
c0f3af97 8769 }
7ab9ffdd 8770 }
2426c15f 8771 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
7ab9ffdd 8772 {
f12dc422 8773 /* For instructions with VexNDD, the register destination
7ab9ffdd 8774 is encoded in VEX prefix. */
f12dc422
L
8775 if (i.mem_operands == 0)
8776 {
8777 /* There is no memory operand. */
8778 gas_assert ((op + 2) == i.operands);
8779 vex_reg = op + 1;
8780 }
8781 else
8d63c93e 8782 {
ed438a93
JB
8783 /* There are only 2 non-immediate operands. */
8784 gas_assert (op < i.imm_operands + 2
8785 && i.operands == i.imm_operands + 2);
8786 vex_reg = i.imm_operands + 1;
f12dc422 8787 }
7ab9ffdd
L
8788 }
8789 else
8790 gas_assert (op < i.operands);
99018f42 8791
7ab9ffdd
L
8792 if (vex_reg != (unsigned int) ~0)
8793 {
f12dc422 8794 i386_operand_type *type = &i.tm.operand_types[vex_reg];
7ab9ffdd 8795
bab6aec1 8796 if ((type->bitfield.class != Reg
dc821c5f 8797 || (!type->bitfield.dword && !type->bitfield.qword))
3528c362 8798 && type->bitfield.class != RegSIMD
c0f327b8 8799 && type->bitfield.class != RegMask)
7ab9ffdd 8800 abort ();
f88c9eb0 8801
7ab9ffdd
L
8802 i.vex.register_specifier = i.op[vex_reg].regs;
8803 }
8804
1b9f0c97
L
8805 /* Don't set OP operand twice. */
8806 if (vex_reg != op)
7ab9ffdd 8807 {
1b9f0c97
L
8808 /* If there is an extension opcode to put here, the
8809 register number must be put into the regmem field. */
8810 if (i.tm.extension_opcode != None)
8811 {
8812 i.rm.regmem = i.op[op].regs->reg_num;
a5aeccd9
JB
8813 set_rex_vrex (i.op[op].regs, REX_B,
8814 i.tm.opcode_modifier.sse2avx);
1b9f0c97
L
8815 }
8816 else
8817 {
8818 i.rm.reg = i.op[op].regs->reg_num;
a5aeccd9
JB
8819 set_rex_vrex (i.op[op].regs, REX_R,
8820 i.tm.opcode_modifier.sse2avx);
1b9f0c97 8821 }
7ab9ffdd 8822 }
252b5132 8823
29b0f896
AM
8824 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
8825 must set it to 3 to indicate this is a register operand
8826 in the regmem field. */
8827 if (!i.mem_operands)
8828 i.rm.mode = 3;
8829 }
252b5132 8830
29b0f896 8831 /* Fill in i.rm.reg field with extension opcode (if any). */
c1e679ec 8832 if (i.tm.extension_opcode != None)
29b0f896
AM
8833 i.rm.reg = i.tm.extension_opcode;
8834 }
8835 return default_seg;
8836}
252b5132 8837
48ef937e
JB
8838static INLINE void
8839frag_opcode_byte (unsigned char byte)
8840{
8841 if (now_seg != absolute_section)
8842 FRAG_APPEND_1_CHAR (byte);
8843 else
8844 ++abs_section_offset;
8845}
8846
376cd056
JB
8847static unsigned int
8848flip_code16 (unsigned int code16)
8849{
8850 gas_assert (i.tm.operands == 1);
8851
8852 return !(i.prefix[REX_PREFIX] & REX_W)
8853 && (code16 ? i.tm.operand_types[0].bitfield.disp32
376cd056
JB
8854 : i.tm.operand_types[0].bitfield.disp16)
8855 ? CODE16 : 0;
8856}
8857
29b0f896 8858static void
e3bb37b5 8859output_branch (void)
29b0f896
AM
8860{
8861 char *p;
f8a5c266 8862 int size;
29b0f896
AM
8863 int code16;
8864 int prefix;
8865 relax_substateT subtype;
8866 symbolS *sym;
8867 offsetT off;
8868
48ef937e
JB
8869 if (now_seg == absolute_section)
8870 {
8871 as_bad (_("relaxable branches not supported in absolute section"));
8872 return;
8873 }
8874
f8a5c266 8875 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
1a42a9fe 8876 size = i.disp_encoding > disp_encoding_8bit ? BIG : SMALL;
29b0f896
AM
8877
8878 prefix = 0;
8879 if (i.prefix[DATA_PREFIX] != 0)
252b5132 8880 {
29b0f896
AM
8881 prefix = 1;
8882 i.prefixes -= 1;
376cd056 8883 code16 ^= flip_code16(code16);
252b5132 8884 }
29b0f896
AM
8885 /* Pentium4 branch hints. */
8886 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8887 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
2f66722d 8888 {
29b0f896
AM
8889 prefix++;
8890 i.prefixes--;
8891 }
8892 if (i.prefix[REX_PREFIX] != 0)
8893 {
8894 prefix++;
8895 i.prefixes--;
2f66722d
AM
8896 }
8897
7e8b059b
L
8898 /* BND prefixed jump. */
8899 if (i.prefix[BND_PREFIX] != 0)
8900 {
6cb0a70e
JB
8901 prefix++;
8902 i.prefixes--;
7e8b059b
L
8903 }
8904
f2810fe0 8905 if (i.prefixes != 0)
76d3f746 8906 as_warn (_("skipping prefixes on `%s'"), insn_name (&i.tm));
29b0f896
AM
8907
8908 /* It's always a symbol; End frag & setup for relax.
8909 Make sure there is enough room in this frag for the largest
8910 instruction we may generate in md_convert_frag. This is 2
8911 bytes for the opcode and room for the prefix and largest
8912 displacement. */
8913 frag_grow (prefix + 2 + 4);
8914 /* Prefix and 1 opcode byte go in fr_fix. */
8915 p = frag_more (prefix + 1);
8916 if (i.prefix[DATA_PREFIX] != 0)
8917 *p++ = DATA_PREFIX_OPCODE;
8918 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
8919 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
8920 *p++ = i.prefix[SEG_PREFIX];
6cb0a70e
JB
8921 if (i.prefix[BND_PREFIX] != 0)
8922 *p++ = BND_PREFIX_OPCODE;
29b0f896
AM
8923 if (i.prefix[REX_PREFIX] != 0)
8924 *p++ = i.prefix[REX_PREFIX];
8925 *p = i.tm.base_opcode;
8926
8927 if ((unsigned char) *p == JUMP_PC_RELATIVE)
f8a5c266 8928 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
40fb9820 8929 else if (cpu_arch_flags.bitfield.cpui386)
f8a5c266 8930 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
29b0f896 8931 else
f8a5c266 8932 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
29b0f896 8933 subtype |= code16;
3e73aa7c 8934
29b0f896
AM
8935 sym = i.op[0].disps->X_add_symbol;
8936 off = i.op[0].disps->X_add_number;
3e73aa7c 8937
29b0f896
AM
8938 if (i.op[0].disps->X_op != O_constant
8939 && i.op[0].disps->X_op != O_symbol)
3e73aa7c 8940 {
29b0f896
AM
8941 /* Handle complex expressions. */
8942 sym = make_expr_symbol (i.op[0].disps);
8943 off = 0;
8944 }
3e73aa7c 8945
1ef3994a
JB
8946 frag_now->tc_frag_data.code64 = flag_code == CODE_64BIT;
8947
29b0f896
AM
8948 /* 1 possible extra opcode + 4 byte displacement go in var part.
8949 Pass reloc in fr_var. */
d258b828 8950 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
29b0f896 8951}
3e73aa7c 8952
bd7ab16b
L
8953#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8954/* Return TRUE iff PLT32 relocation should be used for branching to
8955 symbol S. */
8956
5b7c81bd 8957static bool
bd7ab16b
L
8958need_plt32_p (symbolS *s)
8959{
8960 /* PLT32 relocation is ELF only. */
8961 if (!IS_ELF)
5b7c81bd 8962 return false;
bd7ab16b 8963
a5def729
RO
8964#ifdef TE_SOLARIS
8965 /* Don't emit PLT32 relocation on Solaris: neither native linker nor
8966 krtld support it. */
5b7c81bd 8967 return false;
a5def729
RO
8968#endif
8969
bd7ab16b
L
8970 /* Since there is no need to prepare for PLT branch on x86-64, we
8971 can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
8972 be used as a marker for 32-bit PC-relative branches. */
8973 if (!object_64bit)
5b7c81bd 8974 return false;
bd7ab16b 8975
44365e88 8976 if (s == NULL)
5b7c81bd 8977 return false;
44365e88 8978
bd7ab16b
L
8979 /* Weak or undefined symbol need PLT32 relocation. */
8980 if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
5b7c81bd 8981 return true;
bd7ab16b
L
8982
8983 /* Non-global symbol doesn't need PLT32 relocation. */
8984 if (! S_IS_EXTERNAL (s))
5b7c81bd 8985 return false;
bd7ab16b
L
8986
8987 /* Other global symbols need PLT32 relocation. NB: Symbol with
8988 non-default visibilities are treated as normal global symbol
8989 so that PLT32 relocation can be used as a marker for 32-bit
8990 PC-relative branches. It is useful for linker relaxation. */
5b7c81bd 8991 return true;
bd7ab16b
L
8992}
8993#endif
8994
29b0f896 8995static void
e3bb37b5 8996output_jump (void)
29b0f896
AM
8997{
8998 char *p;
8999 int size;
3e02c1cc 9000 fixS *fixP;
bd7ab16b 9001 bfd_reloc_code_real_type jump_reloc = i.reloc[0];
29b0f896 9002
0cfa3eb3 9003 if (i.tm.opcode_modifier.jump == JUMP_BYTE)
29b0f896
AM
9004 {
9005 /* This is a loop or jecxz type instruction. */
9006 size = 1;
9007 if (i.prefix[ADDR_PREFIX] != 0)
9008 {
48ef937e 9009 frag_opcode_byte (ADDR_PREFIX_OPCODE);
29b0f896
AM
9010 i.prefixes -= 1;
9011 }
9012 /* Pentium4 branch hints. */
9013 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
9014 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
9015 {
48ef937e 9016 frag_opcode_byte (i.prefix[SEG_PREFIX]);
29b0f896 9017 i.prefixes--;
3e73aa7c
JH
9018 }
9019 }
29b0f896
AM
9020 else
9021 {
9022 int code16;
3e73aa7c 9023
29b0f896
AM
9024 code16 = 0;
9025 if (flag_code == CODE_16BIT)
9026 code16 = CODE16;
3e73aa7c 9027
29b0f896
AM
9028 if (i.prefix[DATA_PREFIX] != 0)
9029 {
48ef937e 9030 frag_opcode_byte (DATA_PREFIX_OPCODE);
29b0f896 9031 i.prefixes -= 1;
376cd056 9032 code16 ^= flip_code16(code16);
29b0f896 9033 }
252b5132 9034
29b0f896
AM
9035 size = 4;
9036 if (code16)
9037 size = 2;
9038 }
9fcc94b6 9039
6cb0a70e
JB
9040 /* BND prefixed jump. */
9041 if (i.prefix[BND_PREFIX] != 0)
29b0f896 9042 {
48ef937e 9043 frag_opcode_byte (i.prefix[BND_PREFIX]);
29b0f896
AM
9044 i.prefixes -= 1;
9045 }
252b5132 9046
6cb0a70e 9047 if (i.prefix[REX_PREFIX] != 0)
7e8b059b 9048 {
48ef937e 9049 frag_opcode_byte (i.prefix[REX_PREFIX]);
7e8b059b
L
9050 i.prefixes -= 1;
9051 }
9052
f2810fe0 9053 if (i.prefixes != 0)
76d3f746 9054 as_warn (_("skipping prefixes on `%s'"), insn_name (&i.tm));
e0890092 9055
48ef937e
JB
9056 if (now_seg == absolute_section)
9057 {
9a182d04 9058 abs_section_offset += i.opcode_length + size;
48ef937e
JB
9059 return;
9060 }
9061
9a182d04
JB
9062 p = frag_more (i.opcode_length + size);
9063 switch (i.opcode_length)
42164a71
L
9064 {
9065 case 2:
9066 *p++ = i.tm.base_opcode >> 8;
1a0670f3 9067 /* Fall through. */
42164a71
L
9068 case 1:
9069 *p++ = i.tm.base_opcode;
9070 break;
9071 default:
9072 abort ();
9073 }
e0890092 9074
bd7ab16b 9075#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1ef3994a
JB
9076 if (flag_code == CODE_64BIT && size == 4
9077 && jump_reloc == NO_RELOC && i.op[0].disps->X_add_number == 0
bd7ab16b
L
9078 && need_plt32_p (i.op[0].disps->X_add_symbol))
9079 jump_reloc = BFD_RELOC_X86_64_PLT32;
9080#endif
9081
9082 jump_reloc = reloc (size, 1, 1, jump_reloc);
9083
3e02c1cc 9084 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
bd7ab16b 9085 i.op[0].disps, 1, jump_reloc);
3e02c1cc 9086
eb19308f
JB
9087 /* All jumps handled here are signed, but don't unconditionally use a
9088 signed limit check for 32 and 16 bit jumps as we want to allow wrap
9089 around at 4G (outside of 64-bit mode) and 64k (except for XBEGIN)
9090 respectively. */
9091 switch (size)
9092 {
9093 case 1:
9094 fixP->fx_signed = 1;
9095 break;
9096
9097 case 2:
7fc69528 9098 if (i.tm.mnem_off == MN_xbegin)
eb19308f
JB
9099 fixP->fx_signed = 1;
9100 break;
9101
9102 case 4:
9103 if (flag_code == CODE_64BIT)
9104 fixP->fx_signed = 1;
9105 break;
9106 }
29b0f896 9107}
e0890092 9108
29b0f896 9109static void
e3bb37b5 9110output_interseg_jump (void)
29b0f896
AM
9111{
9112 char *p;
9113 int size;
9114 int prefix;
9115 int code16;
252b5132 9116
29b0f896
AM
9117 code16 = 0;
9118 if (flag_code == CODE_16BIT)
9119 code16 = CODE16;
a217f122 9120
29b0f896
AM
9121 prefix = 0;
9122 if (i.prefix[DATA_PREFIX] != 0)
9123 {
9124 prefix = 1;
9125 i.prefixes -= 1;
9126 code16 ^= CODE16;
9127 }
6cb0a70e
JB
9128
9129 gas_assert (!i.prefix[REX_PREFIX]);
252b5132 9130
29b0f896
AM
9131 size = 4;
9132 if (code16)
9133 size = 2;
252b5132 9134
f2810fe0 9135 if (i.prefixes != 0)
76d3f746 9136 as_warn (_("skipping prefixes on `%s'"), insn_name (&i.tm));
252b5132 9137
48ef937e
JB
9138 if (now_seg == absolute_section)
9139 {
9140 abs_section_offset += prefix + 1 + 2 + size;
9141 return;
9142 }
9143
29b0f896
AM
9144 /* 1 opcode; 2 segment; offset */
9145 p = frag_more (prefix + 1 + 2 + size);
3e73aa7c 9146
29b0f896
AM
9147 if (i.prefix[DATA_PREFIX] != 0)
9148 *p++ = DATA_PREFIX_OPCODE;
252b5132 9149
29b0f896
AM
9150 if (i.prefix[REX_PREFIX] != 0)
9151 *p++ = i.prefix[REX_PREFIX];
252b5132 9152
29b0f896
AM
9153 *p++ = i.tm.base_opcode;
9154 if (i.op[1].imms->X_op == O_constant)
9155 {
9156 offsetT n = i.op[1].imms->X_add_number;
252b5132 9157
29b0f896
AM
9158 if (size == 2
9159 && !fits_in_unsigned_word (n)
9160 && !fits_in_signed_word (n))
9161 {
9162 as_bad (_("16-bit jump out of range"));
9163 return;
9164 }
9165 md_number_to_chars (p, n, size);
9166 }
9167 else
9168 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
d258b828 9169 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
6d96a594
C
9170
9171 p += size;
9172 if (i.op[0].imms->X_op == O_constant)
9173 md_number_to_chars (p, (valueT) i.op[0].imms->X_add_number, 2);
9174 else
9175 fix_new_exp (frag_now, p - frag_now->fr_literal, 2,
9176 i.op[0].imms, 0, reloc (2, 0, 0, i.reloc[0]));
29b0f896 9177}
a217f122 9178
b4a3a7b4
L
9179#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9180void
9181x86_cleanup (void)
9182{
9183 char *p;
9184 asection *seg = now_seg;
9185 subsegT subseg = now_subseg;
9186 asection *sec;
9187 unsigned int alignment, align_size_1;
9188 unsigned int isa_1_descsz, feature_2_descsz, descsz;
9189 unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
9190 unsigned int padding;
9191
1273b2f8 9192 if (!IS_ELF || !x86_used_note)
b4a3a7b4
L
9193 return;
9194
b4a3a7b4
L
9195 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
9196
9197 /* The .note.gnu.property section layout:
9198
9199 Field Length Contents
9200 ---- ---- ----
9201 n_namsz 4 4
9202 n_descsz 4 The note descriptor size
9203 n_type 4 NT_GNU_PROPERTY_TYPE_0
9204 n_name 4 "GNU"
9205 n_desc n_descsz The program property array
9206 .... .... ....
9207 */
9208
9209 /* Create the .note.gnu.property section. */
9210 sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
fd361982 9211 bfd_set_section_flags (sec,
b4a3a7b4
L
9212 (SEC_ALLOC
9213 | SEC_LOAD
9214 | SEC_DATA
9215 | SEC_HAS_CONTENTS
9216 | SEC_READONLY));
9217
9218 if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
9219 {
9220 align_size_1 = 7;
9221 alignment = 3;
9222 }
9223 else
9224 {
9225 align_size_1 = 3;
9226 alignment = 2;
9227 }
9228
fd361982 9229 bfd_set_section_alignment (sec, alignment);
b4a3a7b4
L
9230 elf_section_type (sec) = SHT_NOTE;
9231
1273b2f8
L
9232 /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
9233 + 4-byte data */
9234 isa_1_descsz_raw = 4 + 4 + 4;
9235 /* Align GNU_PROPERTY_X86_ISA_1_USED. */
9236 isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
b4a3a7b4
L
9237
9238 feature_2_descsz_raw = isa_1_descsz;
9239 /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
1273b2f8 9240 + 4-byte data */
b4a3a7b4
L
9241 feature_2_descsz_raw += 4 + 4 + 4;
9242 /* Align GNU_PROPERTY_X86_FEATURE_2_USED. */
9243 feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
9244 & ~align_size_1);
9245
9246 descsz = feature_2_descsz;
9247 /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz. */
9248 p = frag_more (4 + 4 + 4 + 4 + descsz);
9249
9250 /* Write n_namsz. */
9251 md_number_to_chars (p, (valueT) 4, 4);
9252
9253 /* Write n_descsz. */
9254 md_number_to_chars (p + 4, (valueT) descsz, 4);
9255
9256 /* Write n_type. */
9257 md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
9258
9259 /* Write n_name. */
9260 memcpy (p + 4 * 3, "GNU", 4);
9261
1273b2f8
L
9262 /* Write 4-byte type. */
9263 md_number_to_chars (p + 4 * 4,
9264 (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
b4a3a7b4 9265
1273b2f8
L
9266 /* Write 4-byte data size. */
9267 md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
b4a3a7b4 9268
1273b2f8
L
9269 /* Write 4-byte data. */
9270 md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
b4a3a7b4 9271
1273b2f8
L
9272 /* Zero out paddings. */
9273 padding = isa_1_descsz - isa_1_descsz_raw;
9274 if (padding)
9275 memset (p + 4 * 7, 0, padding);
b4a3a7b4
L
9276
9277 /* Write 4-byte type. */
9278 md_number_to_chars (p + isa_1_descsz + 4 * 4,
9279 (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
9280
9281 /* Write 4-byte data size. */
9282 md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
9283
9284 /* Write 4-byte data. */
9285 md_number_to_chars (p + isa_1_descsz + 4 * 6,
9286 (valueT) x86_feature_2_used, 4);
9287
9288 /* Zero out paddings. */
9289 padding = feature_2_descsz - feature_2_descsz_raw;
9290 if (padding)
9291 memset (p + isa_1_descsz + 4 * 7, 0, padding);
9292
9293 /* We probably can't restore the current segment, for there likely
9294 isn't one yet... */
9295 if (seg && subseg)
9296 subseg_set (seg, subseg);
9297}
b52c4ee4
IB
9298
9299bool
9300x86_support_sframe_p (void)
9301{
3e3e792a 9302 /* At this time, SFrame stack trace is supported for AMD64 ABI only. */
b52c4ee4
IB
9303 return (x86_elf_abi == X86_64_ABI);
9304}
9305
9306bool
9307x86_sframe_ra_tracking_p (void)
9308{
9309 /* In AMD64, return address is always stored on the stack at a fixed offset
9310 from the CFA (provided via x86_sframe_cfa_ra_offset ()).
9311 Do not track explicitly via an SFrame Frame Row Entry. */
9312 return false;
9313}
9314
9315offsetT
9316x86_sframe_cfa_ra_offset (void)
9317{
9318 gas_assert (x86_elf_abi == X86_64_ABI);
9319 return (offsetT) -8;
9320}
9321
9322unsigned char
9323x86_sframe_get_abi_arch (void)
9324{
9325 unsigned char sframe_abi_arch = 0;
9326
9327 if (x86_support_sframe_p ())
9328 {
9329 gas_assert (!target_big_endian);
9330 sframe_abi_arch = SFRAME_ABI_AMD64_ENDIAN_LITTLE;
9331 }
9332
9333 return sframe_abi_arch;
9334}
9335
b4a3a7b4
L
9336#endif
9337
9c33702b
JB
9338static unsigned int
9339encoding_length (const fragS *start_frag, offsetT start_off,
9340 const char *frag_now_ptr)
9341{
9342 unsigned int len = 0;
9343
9344 if (start_frag != frag_now)
9345 {
9346 const fragS *fr = start_frag;
9347
9348 do {
9349 len += fr->fr_fix;
9350 fr = fr->fr_next;
9351 } while (fr && fr != frag_now);
9352 }
9353
9354 return len - start_off + (frag_now_ptr - frag_now->fr_literal);
9355}
9356
e379e5f3 9357/* Return 1 for test, and, cmp, add, sub, inc and dec which may
79d72f45
HL
9358 be macro-fused with conditional jumps.
9359 NB: If TEST/AND/CMP/ADD/SUB/INC/DEC is of RIP relative address,
9360 or is one of the following format:
9361
9362 cmp m, imm
9363 add m, imm
9364 sub m, imm
9365 test m, imm
9366 and m, imm
9367 inc m
9368 dec m
9369
9370 it is unfusible. */
e379e5f3
L
9371
9372static int
79d72f45 9373maybe_fused_with_jcc_p (enum mf_cmp_kind* mf_cmp_p)
e379e5f3
L
9374{
9375 /* No RIP address. */
9376 if (i.base_reg && i.base_reg->reg_num == RegIP)
9377 return 0;
9378
389d00a5 9379 /* No opcodes outside of base encoding space. */
ddb62495 9380 if (i.tm.opcode_space != SPACE_BASE)
e379e5f3
L
9381 return 0;
9382
79d72f45
HL
9383 /* add, sub without add/sub m, imm. */
9384 if (i.tm.base_opcode <= 5
e379e5f3
L
9385 || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
9386 || ((i.tm.base_opcode | 3) == 0x83
79d72f45 9387 && (i.tm.extension_opcode == 0x5
e379e5f3 9388 || i.tm.extension_opcode == 0x0)))
79d72f45
HL
9389 {
9390 *mf_cmp_p = mf_cmp_alu_cmp;
9391 return !(i.mem_operands && i.imm_operands);
9392 }
e379e5f3 9393
79d72f45
HL
9394 /* and without and m, imm. */
9395 if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
9396 || ((i.tm.base_opcode | 3) == 0x83
9397 && i.tm.extension_opcode == 0x4))
9398 {
9399 *mf_cmp_p = mf_cmp_test_and;
9400 return !(i.mem_operands && i.imm_operands);
9401 }
9402
9403 /* test without test m imm. */
e379e5f3
L
9404 if ((i.tm.base_opcode | 1) == 0x85
9405 || (i.tm.base_opcode | 1) == 0xa9
9406 || ((i.tm.base_opcode | 1) == 0xf7
79d72f45
HL
9407 && i.tm.extension_opcode == 0))
9408 {
9409 *mf_cmp_p = mf_cmp_test_and;
9410 return !(i.mem_operands && i.imm_operands);
9411 }
9412
9413 /* cmp without cmp m, imm. */
9414 if ((i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
e379e5f3
L
9415 || ((i.tm.base_opcode | 3) == 0x83
9416 && (i.tm.extension_opcode == 0x7)))
79d72f45
HL
9417 {
9418 *mf_cmp_p = mf_cmp_alu_cmp;
9419 return !(i.mem_operands && i.imm_operands);
9420 }
e379e5f3 9421
79d72f45 9422 /* inc, dec without inc/dec m. */
e379e5f3
L
9423 if ((i.tm.cpu_flags.bitfield.cpuno64
9424 && (i.tm.base_opcode | 0xf) == 0x4f)
9425 || ((i.tm.base_opcode | 1) == 0xff
9426 && i.tm.extension_opcode <= 0x1))
79d72f45
HL
9427 {
9428 *mf_cmp_p = mf_cmp_incdec;
9429 return !i.mem_operands;
9430 }
e379e5f3
L
9431
9432 return 0;
9433}
9434
9435/* Return 1 if a FUSED_JCC_PADDING frag should be generated. */
9436
9437static int
79d72f45 9438add_fused_jcc_padding_frag_p (enum mf_cmp_kind* mf_cmp_p)
e379e5f3
L
9439{
9440 /* NB: Don't work with COND_JUMP86 without i386. */
9441 if (!align_branch_power
9442 || now_seg == absolute_section
9443 || !cpu_arch_flags.bitfield.cpui386
9444 || !(align_branch & align_branch_fused_bit))
9445 return 0;
9446
79d72f45 9447 if (maybe_fused_with_jcc_p (mf_cmp_p))
e379e5f3
L
9448 {
9449 if (last_insn.kind == last_insn_other
9450 || last_insn.seg != now_seg)
9451 return 1;
9452 if (flag_debug)
9453 as_warn_where (last_insn.file, last_insn.line,
9454 _("`%s` skips -malign-branch-boundary on `%s`"),
76d3f746 9455 last_insn.name, insn_name (&i.tm));
e379e5f3
L
9456 }
9457
9458 return 0;
9459}
9460
9461/* Return 1 if a BRANCH_PREFIX frag should be generated. */
9462
9463static int
9464add_branch_prefix_frag_p (void)
9465{
9466 /* NB: Don't work with COND_JUMP86 without i386. Don't add prefix
9467 to PadLock instructions since they include prefixes in opcode. */
9468 if (!align_branch_power
9469 || !align_branch_prefix_size
9470 || now_seg == absolute_section
9471 || i.tm.cpu_flags.bitfield.cpupadlock
9472 || !cpu_arch_flags.bitfield.cpui386)
9473 return 0;
9474
9475 /* Don't add prefix if it is a prefix or there is no operand in case
9476 that segment prefix is special. */
9477 if (!i.operands || i.tm.opcode_modifier.isprefix)
9478 return 0;
9479
9480 if (last_insn.kind == last_insn_other
9481 || last_insn.seg != now_seg)
9482 return 1;
9483
9484 if (flag_debug)
9485 as_warn_where (last_insn.file, last_insn.line,
9486 _("`%s` skips -malign-branch-boundary on `%s`"),
76d3f746 9487 last_insn.name, insn_name (&i.tm));
e379e5f3
L
9488
9489 return 0;
9490}
9491
9492/* Return 1 if a BRANCH_PADDING frag should be generated. */
9493
9494static int
79d72f45
HL
9495add_branch_padding_frag_p (enum align_branch_kind *branch_p,
9496 enum mf_jcc_kind *mf_jcc_p)
e379e5f3
L
9497{
9498 int add_padding;
9499
9500 /* NB: Don't work with COND_JUMP86 without i386. */
9501 if (!align_branch_power
9502 || now_seg == absolute_section
389d00a5 9503 || !cpu_arch_flags.bitfield.cpui386
ddb62495 9504 || i.tm.opcode_space != SPACE_BASE)
e379e5f3
L
9505 return 0;
9506
9507 add_padding = 0;
9508
9509 /* Check for jcc and direct jmp. */
9510 if (i.tm.opcode_modifier.jump == JUMP)
9511 {
9512 if (i.tm.base_opcode == JUMP_PC_RELATIVE)
9513 {
9514 *branch_p = align_branch_jmp;
9515 add_padding = align_branch & align_branch_jmp_bit;
9516 }
9517 else
9518 {
79d72f45
HL
9519 /* Because J<cc> and JN<cc> share same group in macro-fusible table,
9520 igore the lowest bit. */
9521 *mf_jcc_p = (i.tm.base_opcode & 0x0e) >> 1;
e379e5f3
L
9522 *branch_p = align_branch_jcc;
9523 if ((align_branch & align_branch_jcc_bit))
9524 add_padding = 1;
9525 }
9526 }
e379e5f3
L
9527 else if ((i.tm.base_opcode | 1) == 0xc3)
9528 {
9529 /* Near ret. */
9530 *branch_p = align_branch_ret;
9531 if ((align_branch & align_branch_ret_bit))
9532 add_padding = 1;
9533 }
9534 else
9535 {
9536 /* Check for indirect jmp, direct and indirect calls. */
9537 if (i.tm.base_opcode == 0xe8)
9538 {
9539 /* Direct call. */
9540 *branch_p = align_branch_call;
9541 if ((align_branch & align_branch_call_bit))
9542 add_padding = 1;
9543 }
9544 else if (i.tm.base_opcode == 0xff
9545 && (i.tm.extension_opcode == 2
9546 || i.tm.extension_opcode == 4))
9547 {
9548 /* Indirect call and jmp. */
9549 *branch_p = align_branch_indirect;
9550 if ((align_branch & align_branch_indirect_bit))
9551 add_padding = 1;
9552 }
9553
9554 if (add_padding
9555 && i.disp_operands
9556 && tls_get_addr
9557 && (i.op[0].disps->X_op == O_symbol
9558 || (i.op[0].disps->X_op == O_subtract
9559 && i.op[0].disps->X_op_symbol == GOT_symbol)))
9560 {
9561 symbolS *s = i.op[0].disps->X_add_symbol;
9562 /* No padding to call to global or undefined tls_get_addr. */
9563 if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
9564 && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
9565 return 0;
9566 }
9567 }
9568
9569 if (add_padding
9570 && last_insn.kind != last_insn_other
9571 && last_insn.seg == now_seg)
9572 {
9573 if (flag_debug)
9574 as_warn_where (last_insn.file, last_insn.line,
9575 _("`%s` skips -malign-branch-boundary on `%s`"),
76d3f746 9576 last_insn.name, insn_name (&i.tm));
e379e5f3
L
9577 return 0;
9578 }
9579
9580 return add_padding;
9581}
9582
29b0f896 9583static void
e3bb37b5 9584output_insn (void)
29b0f896 9585{
2bbd9c25
JJ
9586 fragS *insn_start_frag;
9587 offsetT insn_start_off;
e379e5f3
L
9588 fragS *fragP = NULL;
9589 enum align_branch_kind branch = align_branch_none;
79d72f45
HL
9590 /* The initializer is arbitrary just to avoid uninitialized error.
9591 it's actually either assigned in add_branch_padding_frag_p
9592 or never be used. */
9593 enum mf_jcc_kind mf_jcc = mf_jcc_jo;
2bbd9c25 9594
b4a3a7b4 9595#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
48ef937e 9596 if (IS_ELF && x86_used_note && now_seg != absolute_section)
b4a3a7b4 9597 {
32930e4e
L
9598 if ((i.xstate & xstate_tmm) == xstate_tmm
9599 || i.tm.cpu_flags.bitfield.cpuamx_tile)
9600 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_TMM;
9601
b4a3a7b4
L
9602 if (i.tm.cpu_flags.bitfield.cpu8087
9603 || i.tm.cpu_flags.bitfield.cpu287
9604 || i.tm.cpu_flags.bitfield.cpu387
9605 || i.tm.cpu_flags.bitfield.cpu687
9606 || i.tm.cpu_flags.bitfield.cpufisttp)
9607 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
014d61ea 9608
921eafea 9609 if ((i.xstate & xstate_mmx)
7fc69528
JB
9610 || i.tm.mnem_off == MN_emms
9611 || i.tm.mnem_off == MN_femms)
b4a3a7b4 9612 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
014d61ea 9613
32930e4e
L
9614 if (i.index_reg)
9615 {
9616 if (i.index_reg->reg_type.bitfield.zmmword)
9617 i.xstate |= xstate_zmm;
9618 else if (i.index_reg->reg_type.bitfield.ymmword)
9619 i.xstate |= xstate_ymm;
9620 else if (i.index_reg->reg_type.bitfield.xmmword)
9621 i.xstate |= xstate_xmm;
9622 }
014d61ea
JB
9623
9624 /* vzeroall / vzeroupper */
9625 if (i.tm.base_opcode == 0x77 && i.tm.cpu_flags.bitfield.cpuavx)
9626 i.xstate |= xstate_ymm;
9627
c4694f17 9628 if ((i.xstate & xstate_xmm)
389d00a5
JB
9629 /* ldmxcsr / stmxcsr / vldmxcsr / vstmxcsr */
9630 || (i.tm.base_opcode == 0xae
9631 && (i.tm.cpu_flags.bitfield.cpusse
9632 || i.tm.cpu_flags.bitfield.cpuavx))
c4694f17
TG
9633 || i.tm.cpu_flags.bitfield.cpuwidekl
9634 || i.tm.cpu_flags.bitfield.cpukl)
b4a3a7b4 9635 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
014d61ea 9636
921eafea 9637 if ((i.xstate & xstate_ymm) == xstate_ymm)
b4a3a7b4 9638 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
921eafea 9639 if ((i.xstate & xstate_zmm) == xstate_zmm)
b4a3a7b4 9640 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
6225c532 9641 if (i.mask.reg || (i.xstate & xstate_mask) == xstate_mask)
32930e4e 9642 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MASK;
b4a3a7b4
L
9643 if (i.tm.cpu_flags.bitfield.cpufxsr)
9644 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
9645 if (i.tm.cpu_flags.bitfield.cpuxsave)
9646 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
9647 if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
9648 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
9649 if (i.tm.cpu_flags.bitfield.cpuxsavec)
9650 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
b0ab0693
L
9651
9652 if (x86_feature_2_used
9653 || i.tm.cpu_flags.bitfield.cpucmov
9654 || i.tm.cpu_flags.bitfield.cpusyscall
7fc69528 9655 || i.tm.mnem_off == MN_cmpxchg8b)
b0ab0693
L
9656 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_BASELINE;
9657 if (i.tm.cpu_flags.bitfield.cpusse3
9658 || i.tm.cpu_flags.bitfield.cpussse3
9659 || i.tm.cpu_flags.bitfield.cpusse4_1
9660 || i.tm.cpu_flags.bitfield.cpusse4_2
9661 || i.tm.cpu_flags.bitfield.cpucx16
9662 || i.tm.cpu_flags.bitfield.cpupopcnt
9663 /* LAHF-SAHF insns in 64-bit mode. */
9664 || (flag_code == CODE_64BIT
35648716 9665 && (i.tm.base_opcode | 1) == 0x9f
ddb62495 9666 && i.tm.opcode_space == SPACE_BASE))
b0ab0693
L
9667 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_V2;
9668 if (i.tm.cpu_flags.bitfield.cpuavx
9669 || i.tm.cpu_flags.bitfield.cpuavx2
a9860005
JB
9670 /* Any VEX encoded insns execpt for AVX512F, AVX512BW, AVX512DQ,
9671 XOP, FMA4, LPW, TBM, and AMX. */
b0ab0693
L
9672 || (i.tm.opcode_modifier.vex
9673 && !i.tm.cpu_flags.bitfield.cpuavx512f
9674 && !i.tm.cpu_flags.bitfield.cpuavx512bw
9675 && !i.tm.cpu_flags.bitfield.cpuavx512dq
a9860005
JB
9676 && !i.tm.cpu_flags.bitfield.cpuxop
9677 && !i.tm.cpu_flags.bitfield.cpufma4
b0ab0693
L
9678 && !i.tm.cpu_flags.bitfield.cpulwp
9679 && !i.tm.cpu_flags.bitfield.cputbm
9680 && !(x86_feature_2_used & GNU_PROPERTY_X86_FEATURE_2_TMM))
9681 || i.tm.cpu_flags.bitfield.cpuf16c
9682 || i.tm.cpu_flags.bitfield.cpufma
9683 || i.tm.cpu_flags.bitfield.cpulzcnt
9684 || i.tm.cpu_flags.bitfield.cpumovbe
9685 || i.tm.cpu_flags.bitfield.cpuxsaves
9686 || (x86_feature_2_used
9687 & (GNU_PROPERTY_X86_FEATURE_2_XSAVE
9688 | GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT
9689 | GNU_PROPERTY_X86_FEATURE_2_XSAVEC)) != 0)
9690 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_V3;
9691 if (i.tm.cpu_flags.bitfield.cpuavx512f
9692 || i.tm.cpu_flags.bitfield.cpuavx512bw
9693 || i.tm.cpu_flags.bitfield.cpuavx512dq
9694 || i.tm.cpu_flags.bitfield.cpuavx512vl
a9860005
JB
9695 /* Any EVEX encoded insns except for AVX512ER, AVX512PF,
9696 AVX512-4FMAPS, and AVX512-4VNNIW. */
b0ab0693
L
9697 || (i.tm.opcode_modifier.evex
9698 && !i.tm.cpu_flags.bitfield.cpuavx512er
9699 && !i.tm.cpu_flags.bitfield.cpuavx512pf
a9860005 9700 && !i.tm.cpu_flags.bitfield.cpuavx512_4fmaps
b0ab0693
L
9701 && !i.tm.cpu_flags.bitfield.cpuavx512_4vnniw))
9702 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_V4;
b4a3a7b4
L
9703 }
9704#endif
9705
29b0f896
AM
9706 /* Tie dwarf2 debug info to the address at the start of the insn.
9707 We can't do this after the insn has been output as the current
9708 frag may have been closed off. eg. by frag_var. */
9709 dwarf2_emit_insn (0);
9710
2bbd9c25
JJ
9711 insn_start_frag = frag_now;
9712 insn_start_off = frag_now_fix ();
9713
79d72f45 9714 if (add_branch_padding_frag_p (&branch, &mf_jcc))
e379e5f3
L
9715 {
9716 char *p;
9717 /* Branch can be 8 bytes. Leave some room for prefixes. */
9718 unsigned int max_branch_padding_size = 14;
9719
9720 /* Align section to boundary. */
9721 record_alignment (now_seg, align_branch_power);
9722
9723 /* Make room for padding. */
9724 frag_grow (max_branch_padding_size);
9725
9726 /* Start of the padding. */
9727 p = frag_more (0);
9728
9729 fragP = frag_now;
9730
9731 frag_var (rs_machine_dependent, max_branch_padding_size, 0,
9732 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
9733 NULL, 0, p);
9734
79d72f45 9735 fragP->tc_frag_data.mf_type = mf_jcc;
e379e5f3
L
9736 fragP->tc_frag_data.branch_type = branch;
9737 fragP->tc_frag_data.max_bytes = max_branch_padding_size;
9738 }
9739
d59a54c2
JB
9740 if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT)
9741 && !pre_386_16bit_warned)
9742 {
9743 as_warn (_("use .code16 to ensure correct addressing mode"));
9744 pre_386_16bit_warned = true;
9745 }
9746
29b0f896 9747 /* Output jumps. */
0cfa3eb3 9748 if (i.tm.opcode_modifier.jump == JUMP)
29b0f896 9749 output_branch ();
0cfa3eb3
JB
9750 else if (i.tm.opcode_modifier.jump == JUMP_BYTE
9751 || i.tm.opcode_modifier.jump == JUMP_DWORD)
29b0f896 9752 output_jump ();
0cfa3eb3 9753 else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
29b0f896
AM
9754 output_interseg_jump ();
9755 else
9756 {
9757 /* Output normal instructions here. */
9758 char *p;
9759 unsigned char *q;
47465058 9760 unsigned int j;
79d72f45 9761 enum mf_cmp_kind mf_cmp;
4dffcebc 9762
e4e00185 9763 if (avoid_fence
389d00a5
JB
9764 && (i.tm.base_opcode == 0xaee8
9765 || i.tm.base_opcode == 0xaef0
9766 || i.tm.base_opcode == 0xaef8))
48ef937e
JB
9767 {
9768 /* Encode lfence, mfence, and sfence as
9769 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
47f4115a 9770 if (flag_code == CODE_16BIT)
76d3f746 9771 as_bad (_("Cannot convert `%s' in 16-bit mode"), insn_name (&i.tm));
47f4115a
JB
9772 else if (omit_lock_prefix)
9773 as_bad (_("Cannot convert `%s' with `-momit-lock-prefix=yes' in effect"),
76d3f746 9774 insn_name (&i.tm));
47f4115a 9775 else if (now_seg != absolute_section)
48ef937e
JB
9776 {
9777 offsetT val = 0x240483f0ULL;
9778
9779 p = frag_more (5);
9780 md_number_to_chars (p, val, 5);
9781 }
9782 else
9783 abs_section_offset += 5;
9784 return;
9785 }
e4e00185 9786
d022bddd
IT
9787 /* Some processors fail on LOCK prefix. This options makes
9788 assembler ignore LOCK prefix and serves as a workaround. */
9789 if (omit_lock_prefix)
9790 {
35648716
JB
9791 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE
9792 && i.tm.opcode_modifier.isprefix)
d022bddd
IT
9793 return;
9794 i.prefix[LOCK_PREFIX] = 0;
9795 }
9796
e379e5f3
L
9797 if (branch)
9798 /* Skip if this is a branch. */
9799 ;
79d72f45 9800 else if (add_fused_jcc_padding_frag_p (&mf_cmp))
e379e5f3
L
9801 {
9802 /* Make room for padding. */
9803 frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
9804 p = frag_more (0);
9805
9806 fragP = frag_now;
9807
9808 frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
9809 ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
9810 NULL, 0, p);
9811
79d72f45 9812 fragP->tc_frag_data.mf_type = mf_cmp;
e379e5f3
L
9813 fragP->tc_frag_data.branch_type = align_branch_fused;
9814 fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
9815 }
9816 else if (add_branch_prefix_frag_p ())
9817 {
9818 unsigned int max_prefix_size = align_branch_prefix_size;
9819
9820 /* Make room for padding. */
9821 frag_grow (max_prefix_size);
9822 p = frag_more (0);
9823
9824 fragP = frag_now;
9825
9826 frag_var (rs_machine_dependent, max_prefix_size, 0,
9827 ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
9828 NULL, 0, p);
9829
9830 fragP->tc_frag_data.max_bytes = max_prefix_size;
9831 }
9832
43234a1e
L
9833 /* Since the VEX/EVEX prefix contains the implicit prefix, we
9834 don't need the explicit prefix. */
cf665fee 9835 if (!is_any_vex_encoding (&i.tm))
bc4bd9ab 9836 {
7b47a312 9837 switch (i.tm.opcode_modifier.opcodeprefix)
bc4bd9ab 9838 {
7b47a312
L
9839 case PREFIX_0X66:
9840 add_prefix (0x66);
9841 break;
9842 case PREFIX_0XF2:
9843 add_prefix (0xf2);
9844 break;
9845 case PREFIX_0XF3:
8b65b895
L
9846 if (!i.tm.cpu_flags.bitfield.cpupadlock
9847 || (i.prefix[REP_PREFIX] != 0xf3))
9848 add_prefix (0xf3);
c0f3af97 9849 break;
7b47a312 9850 case PREFIX_NONE:
9a182d04 9851 switch (i.opcode_length)
c0f3af97 9852 {
7b47a312 9853 case 2:
7b47a312 9854 break;
9a182d04 9855 case 1:
7b47a312 9856 /* Check for pseudo prefixes. */
9a182d04
JB
9857 if (!i.tm.opcode_modifier.isprefix || i.tm.base_opcode)
9858 break;
7b47a312
L
9859 as_bad_where (insn_start_frag->fr_file,
9860 insn_start_frag->fr_line,
9861 _("pseudo prefix without instruction"));
9862 return;
9863 default:
9864 abort ();
4dffcebc 9865 }
c0f3af97 9866 break;
c0f3af97
L
9867 default:
9868 abort ();
bc4bd9ab 9869 }
c0f3af97 9870
6d19a37a 9871#if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
cf61b747
L
9872 /* For x32, add a dummy REX_OPCODE prefix for mov/add with
9873 R_X86_64_GOTTPOFF relocation so that linker can safely
14470f07
L
9874 perform IE->LE optimization. A dummy REX_OPCODE prefix
9875 is also needed for lea with R_X86_64_GOTPC32_TLSDESC
9876 relocation for GDesc -> IE/LE optimization. */
cf61b747
L
9877 if (x86_elf_abi == X86_64_X32_ABI
9878 && i.operands == 2
14470f07
L
9879 && (i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
9880 || i.reloc[0] == BFD_RELOC_X86_64_GOTPC32_TLSDESC)
cf61b747
L
9881 && i.prefix[REX_PREFIX] == 0)
9882 add_prefix (REX_OPCODE);
6d19a37a 9883#endif
cf61b747 9884
c0f3af97
L
9885 /* The prefix bytes. */
9886 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
9887 if (*q)
48ef937e 9888 frag_opcode_byte (*q);
0f10071e 9889 }
ae5c1c7b 9890 else
c0f3af97
L
9891 {
9892 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
9893 if (*q)
9894 switch (j)
9895 {
c0f3af97
L
9896 case SEG_PREFIX:
9897 case ADDR_PREFIX:
48ef937e 9898 frag_opcode_byte (*q);
c0f3af97
L
9899 break;
9900 default:
9901 /* There should be no other prefixes for instructions
9902 with VEX prefix. */
9903 abort ();
9904 }
9905
43234a1e
L
9906 /* For EVEX instructions i.vrex should become 0 after
9907 build_evex_prefix. For VEX instructions upper 16 registers
9908 aren't available, so VREX should be 0. */
9909 if (i.vrex)
9910 abort ();
c0f3af97 9911 /* Now the VEX prefix. */
48ef937e
JB
9912 if (now_seg != absolute_section)
9913 {
9914 p = frag_more (i.vex.length);
9915 for (j = 0; j < i.vex.length; j++)
9916 p[j] = i.vex.bytes[j];
9917 }
9918 else
9919 abs_section_offset += i.vex.length;
c0f3af97 9920 }
252b5132 9921
29b0f896 9922 /* Now the opcode; be careful about word order here! */
389d00a5
JB
9923 j = i.opcode_length;
9924 if (!i.vex.length)
ddb62495 9925 switch (i.tm.opcode_space)
389d00a5
JB
9926 {
9927 case SPACE_BASE:
9928 break;
9929 case SPACE_0F:
9930 ++j;
9931 break;
9932 case SPACE_0F38:
9933 case SPACE_0F3A:
9934 j += 2;
9935 break;
9936 default:
9937 abort ();
9938 }
9939
48ef937e 9940 if (now_seg == absolute_section)
389d00a5
JB
9941 abs_section_offset += j;
9942 else if (j == 1)
29b0f896
AM
9943 {
9944 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
9945 }
9946 else
9947 {
389d00a5
JB
9948 p = frag_more (j);
9949 if (!i.vex.length
ddb62495 9950 && i.tm.opcode_space != SPACE_BASE)
389d00a5
JB
9951 {
9952 *p++ = 0x0f;
ddb62495
JB
9953 if (i.tm.opcode_space != SPACE_0F)
9954 *p++ = i.tm.opcode_space == SPACE_0F38
389d00a5
JB
9955 ? 0x38 : 0x3a;
9956 }
9957
9a182d04 9958 switch (i.opcode_length)
331d2d0d 9959 {
4dffcebc 9960 case 2:
389d00a5
JB
9961 /* Put out high byte first: can't use md_number_to_chars! */
9962 *p++ = (i.tm.base_opcode >> 8) & 0xff;
9963 /* Fall through. */
9964 case 1:
9965 *p = i.tm.base_opcode & 0xff;
4dffcebc
L
9966 break;
9967 default:
9968 abort ();
9969 break;
331d2d0d 9970 }
0f10071e 9971
29b0f896 9972 }
3e73aa7c 9973
29b0f896 9974 /* Now the modrm byte and sib byte (if present). */
40fb9820 9975 if (i.tm.opcode_modifier.modrm)
29b0f896 9976 {
48ef937e
JB
9977 frag_opcode_byte ((i.rm.regmem << 0)
9978 | (i.rm.reg << 3)
9979 | (i.rm.mode << 6));
29b0f896
AM
9980 /* If i.rm.regmem == ESP (4)
9981 && i.rm.mode != (Register mode)
9982 && not 16 bit
9983 ==> need second modrm byte. */
9984 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
9985 && i.rm.mode != 3
dc821c5f 9986 && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
48ef937e
JB
9987 frag_opcode_byte ((i.sib.base << 0)
9988 | (i.sib.index << 3)
9989 | (i.sib.scale << 6));
29b0f896 9990 }
3e73aa7c 9991
29b0f896 9992 if (i.disp_operands)
2bbd9c25 9993 output_disp (insn_start_frag, insn_start_off);
3e73aa7c 9994
29b0f896 9995 if (i.imm_operands)
2bbd9c25 9996 output_imm (insn_start_frag, insn_start_off);
9c33702b
JB
9997
9998 /*
9999 * frag_now_fix () returning plain abs_section_offset when we're in the
10000 * absolute section, and abs_section_offset not getting updated as data
10001 * gets added to the frag breaks the logic below.
10002 */
10003 if (now_seg != absolute_section)
10004 {
10005 j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
10006 if (j > 15)
10007 as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
10008 j);
e379e5f3
L
10009 else if (fragP)
10010 {
10011 /* NB: Don't add prefix with GOTPC relocation since
10012 output_disp() above depends on the fixed encoding
10013 length. Can't add prefix with TLS relocation since
10014 it breaks TLS linker optimization. */
10015 unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
10016 /* Prefix count on the current instruction. */
10017 unsigned int count = i.vex.length;
10018 unsigned int k;
10019 for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
10020 /* REX byte is encoded in VEX/EVEX prefix. */
10021 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
10022 count++;
10023
10024 /* Count prefixes for extended opcode maps. */
10025 if (!i.vex.length)
ddb62495 10026 switch (i.tm.opcode_space)
e379e5f3 10027 {
389d00a5 10028 case SPACE_BASE:
e379e5f3 10029 break;
389d00a5
JB
10030 case SPACE_0F:
10031 count++;
e379e5f3 10032 break;
389d00a5
JB
10033 case SPACE_0F38:
10034 case SPACE_0F3A:
10035 count += 2;
e379e5f3
L
10036 break;
10037 default:
10038 abort ();
10039 }
10040
10041 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
10042 == BRANCH_PREFIX)
10043 {
10044 /* Set the maximum prefix size in BRANCH_PREFIX
10045 frag. */
10046 if (fragP->tc_frag_data.max_bytes > max)
10047 fragP->tc_frag_data.max_bytes = max;
10048 if (fragP->tc_frag_data.max_bytes > count)
10049 fragP->tc_frag_data.max_bytes -= count;
10050 else
10051 fragP->tc_frag_data.max_bytes = 0;
10052 }
10053 else
10054 {
10055 /* Remember the maximum prefix size in FUSED_JCC_PADDING
10056 frag. */
10057 unsigned int max_prefix_size;
10058 if (align_branch_prefix_size > max)
10059 max_prefix_size = max;
10060 else
10061 max_prefix_size = align_branch_prefix_size;
10062 if (max_prefix_size > count)
10063 fragP->tc_frag_data.max_prefix_length
10064 = max_prefix_size - count;
10065 }
10066
10067 /* Use existing segment prefix if possible. Use CS
10068 segment prefix in 64-bit mode. In 32-bit mode, use SS
10069 segment prefix with ESP/EBP base register and use DS
10070 segment prefix without ESP/EBP base register. */
10071 if (i.prefix[SEG_PREFIX])
10072 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
10073 else if (flag_code == CODE_64BIT)
10074 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
10075 else if (i.base_reg
10076 && (i.base_reg->reg_num == 4
10077 || i.base_reg->reg_num == 5))
10078 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
10079 else
10080 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
10081 }
9c33702b 10082 }
29b0f896 10083 }
252b5132 10084
e379e5f3
L
10085 /* NB: Don't work with COND_JUMP86 without i386. */
10086 if (align_branch_power
10087 && now_seg != absolute_section
10088 && cpu_arch_flags.bitfield.cpui386)
10089 {
10090 /* Terminate each frag so that we can add prefix and check for
10091 fused jcc. */
10092 frag_wane (frag_now);
10093 frag_new (0);
10094 }
10095
29b0f896
AM
10096#ifdef DEBUG386
10097 if (flag_debug)
10098 {
7b81dfbb 10099 pi ("" /*line*/, &i);
29b0f896
AM
10100 }
10101#endif /* DEBUG386 */
10102}
252b5132 10103
e205caa7
L
10104/* Return the size of the displacement operand N. */
10105
10106static int
10107disp_size (unsigned int n)
10108{
10109 int size = 4;
43234a1e 10110
b5014f7a 10111 if (i.types[n].bitfield.disp64)
40fb9820
L
10112 size = 8;
10113 else if (i.types[n].bitfield.disp8)
10114 size = 1;
10115 else if (i.types[n].bitfield.disp16)
10116 size = 2;
e205caa7
L
10117 return size;
10118}
10119
10120/* Return the size of the immediate operand N. */
10121
10122static int
10123imm_size (unsigned int n)
10124{
10125 int size = 4;
40fb9820
L
10126 if (i.types[n].bitfield.imm64)
10127 size = 8;
10128 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
10129 size = 1;
10130 else if (i.types[n].bitfield.imm16)
10131 size = 2;
e205caa7
L
10132 return size;
10133}
10134
29b0f896 10135static void
64e74474 10136output_disp (fragS *insn_start_frag, offsetT insn_start_off)
29b0f896
AM
10137{
10138 char *p;
10139 unsigned int n;
252b5132 10140
29b0f896
AM
10141 for (n = 0; n < i.operands; n++)
10142 {
b5014f7a 10143 if (operand_type_check (i.types[n], disp))
29b0f896 10144 {
48ef937e
JB
10145 int size = disp_size (n);
10146
10147 if (now_seg == absolute_section)
10148 abs_section_offset += size;
10149 else if (i.op[n].disps->X_op == O_constant)
29b0f896 10150 {
43234a1e 10151 offsetT val = i.op[n].disps->X_add_number;
252b5132 10152
629cfaf1
JB
10153 val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
10154 size);
29b0f896
AM
10155 p = frag_more (size);
10156 md_number_to_chars (p, val, size);
10157 }
10158 else
10159 {
f86103b7 10160 enum bfd_reloc_code_real reloc_type;
a775efc8
JB
10161 bool pcrel = (i.flags[n] & Operand_PCrel) != 0;
10162 bool sign = (flag_code == CODE_64BIT && size == 4
10163 && (!want_disp32 (&i.tm)
10164 || (i.tm.opcode_modifier.jump && !i.jumpabsolute
10165 && !i.types[n].bitfield.baseindex)))
10166 || pcrel;
02a86693 10167 fixS *fixP;
29b0f896 10168
e205caa7 10169 /* We can't have 8 bit displacement here. */
9c2799c2 10170 gas_assert (!i.types[n].bitfield.disp8);
e205caa7 10171
29b0f896
AM
10172 /* The PC relative address is computed relative
10173 to the instruction boundary, so in case immediate
10174 fields follows, we need to adjust the value. */
10175 if (pcrel && i.imm_operands)
10176 {
29b0f896 10177 unsigned int n1;
e205caa7 10178 int sz = 0;
252b5132 10179
29b0f896 10180 for (n1 = 0; n1 < i.operands; n1++)
40fb9820 10181 if (operand_type_check (i.types[n1], imm))
252b5132 10182 {
e205caa7
L
10183 /* Only one immediate is allowed for PC
10184 relative address. */
9c2799c2 10185 gas_assert (sz == 0);
e205caa7
L
10186 sz = imm_size (n1);
10187 i.op[n].disps->X_add_number -= sz;
252b5132 10188 }
29b0f896 10189 /* We should find the immediate. */
9c2799c2 10190 gas_assert (sz != 0);
29b0f896 10191 }
520dc8e8 10192
29b0f896 10193 p = frag_more (size);
d258b828 10194 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
d6ab8113 10195 if (GOT_symbol
2bbd9c25 10196 && GOT_symbol == i.op[n].disps->X_add_symbol
d6ab8113 10197 && (((reloc_type == BFD_RELOC_32
7b81dfbb
AJ
10198 || reloc_type == BFD_RELOC_X86_64_32S
10199 || (reloc_type == BFD_RELOC_64
10200 && object_64bit))
d6ab8113
JB
10201 && (i.op[n].disps->X_op == O_symbol
10202 || (i.op[n].disps->X_op == O_add
10203 && ((symbol_get_value_expression
10204 (i.op[n].disps->X_op_symbol)->X_op)
10205 == O_subtract))))
10206 || reloc_type == BFD_RELOC_32_PCREL))
2bbd9c25 10207 {
4fa24527 10208 if (!object_64bit)
7b81dfbb
AJ
10209 {
10210 reloc_type = BFD_RELOC_386_GOTPC;
5b7c81bd 10211 i.has_gotpc_tls_reloc = true;
98da05bf 10212 i.op[n].disps->X_add_number +=
d583596c 10213 encoding_length (insn_start_frag, insn_start_off, p);
7b81dfbb
AJ
10214 }
10215 else if (reloc_type == BFD_RELOC_64)
10216 reloc_type = BFD_RELOC_X86_64_GOTPC64;
d6ab8113 10217 else
7b81dfbb
AJ
10218 /* Don't do the adjustment for x86-64, as there
10219 the pcrel addressing is relative to the _next_
10220 insn, and that is taken care of in other code. */
d6ab8113 10221 reloc_type = BFD_RELOC_X86_64_GOTPC32;
2bbd9c25 10222 }
e379e5f3
L
10223 else if (align_branch_power)
10224 {
10225 switch (reloc_type)
10226 {
10227 case BFD_RELOC_386_TLS_GD:
10228 case BFD_RELOC_386_TLS_LDM:
10229 case BFD_RELOC_386_TLS_IE:
10230 case BFD_RELOC_386_TLS_IE_32:
10231 case BFD_RELOC_386_TLS_GOTIE:
10232 case BFD_RELOC_386_TLS_GOTDESC:
10233 case BFD_RELOC_386_TLS_DESC_CALL:
10234 case BFD_RELOC_X86_64_TLSGD:
10235 case BFD_RELOC_X86_64_TLSLD:
10236 case BFD_RELOC_X86_64_GOTTPOFF:
10237 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
10238 case BFD_RELOC_X86_64_TLSDESC_CALL:
5b7c81bd 10239 i.has_gotpc_tls_reloc = true;
e379e5f3
L
10240 default:
10241 break;
10242 }
10243 }
02a86693
L
10244 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
10245 size, i.op[n].disps, pcrel,
10246 reloc_type);
eb19308f
JB
10247
10248 if (flag_code == CODE_64BIT && size == 4 && pcrel
10249 && !i.prefix[ADDR_PREFIX])
10250 fixP->fx_signed = 1;
10251
02a86693
L
10252 /* Check for "call/jmp *mem", "mov mem, %reg",
10253 "test %reg, mem" and "binop mem, %reg" where binop
10254 is one of adc, add, and, cmp, or, sbb, sub, xor
e60f4d3b
L
10255 instructions without data prefix. Always generate
10256 R_386_GOT32X for "sym*GOT" operand in 32-bit mode. */
10257 if (i.prefix[DATA_PREFIX] == 0
10258 && (generate_relax_relocations
10259 || (!object_64bit
10260 && i.rm.mode == 0
10261 && i.rm.regmem == 5))
0cb4071e
L
10262 && (i.rm.mode == 2
10263 || (i.rm.mode == 0 && i.rm.regmem == 5))
ddb62495 10264 && i.tm.opcode_space == SPACE_BASE
02a86693
L
10265 && ((i.operands == 1
10266 && i.tm.base_opcode == 0xff
10267 && (i.rm.reg == 2 || i.rm.reg == 4))
10268 || (i.operands == 2
10269 && (i.tm.base_opcode == 0x8b
10270 || i.tm.base_opcode == 0x85
2ae4c703 10271 || (i.tm.base_opcode & ~0x38) == 0x03))))
02a86693
L
10272 {
10273 if (object_64bit)
10274 {
10275 fixP->fx_tcbit = i.rex != 0;
10276 if (i.base_reg
e968fc9b 10277 && (i.base_reg->reg_num == RegIP))
02a86693
L
10278 fixP->fx_tcbit2 = 1;
10279 }
10280 else
10281 fixP->fx_tcbit2 = 1;
10282 }
29b0f896
AM
10283 }
10284 }
10285 }
10286}
252b5132 10287
29b0f896 10288static void
64e74474 10289output_imm (fragS *insn_start_frag, offsetT insn_start_off)
29b0f896
AM
10290{
10291 char *p;
10292 unsigned int n;
252b5132 10293
29b0f896
AM
10294 for (n = 0; n < i.operands; n++)
10295 {
40fb9820 10296 if (operand_type_check (i.types[n], imm))
29b0f896 10297 {
48ef937e
JB
10298 int size = imm_size (n);
10299
10300 if (now_seg == absolute_section)
10301 abs_section_offset += size;
10302 else if (i.op[n].imms->X_op == O_constant)
29b0f896 10303 {
29b0f896 10304 offsetT val;
b4cac588 10305
29b0f896
AM
10306 val = offset_in_range (i.op[n].imms->X_add_number,
10307 size);
10308 p = frag_more (size);
10309 md_number_to_chars (p, val, size);
10310 }
10311 else
10312 {
10313 /* Not absolute_section.
10314 Need a 32-bit fixup (don't support 8bit
10315 non-absolute imms). Try to support other
10316 sizes ... */
f86103b7 10317 enum bfd_reloc_code_real reloc_type;
e205caa7 10318 int sign;
29b0f896 10319
40fb9820 10320 if (i.types[n].bitfield.imm32s
a7d61044 10321 && (i.suffix == QWORD_MNEM_SUFFIX
40fb9820 10322 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
29b0f896 10323 sign = 1;
e205caa7
L
10324 else
10325 sign = 0;
520dc8e8 10326
29b0f896 10327 p = frag_more (size);
d258b828 10328 reloc_type = reloc (size, 0, sign, i.reloc[n]);
f86103b7 10329
2bbd9c25
JJ
10330 /* This is tough to explain. We end up with this one if we
10331 * have operands that look like
10332 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
10333 * obtain the absolute address of the GOT, and it is strongly
10334 * preferable from a performance point of view to avoid using
10335 * a runtime relocation for this. The actual sequence of
10336 * instructions often look something like:
10337 *
10338 * call .L66
10339 * .L66:
10340 * popl %ebx
10341 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
10342 *
10343 * The call and pop essentially return the absolute address
10344 * of the label .L66 and store it in %ebx. The linker itself
10345 * will ultimately change the first operand of the addl so
10346 * that %ebx points to the GOT, but to keep things simple, the
10347 * .o file must have this operand set so that it generates not
10348 * the absolute address of .L66, but the absolute address of
10349 * itself. This allows the linker itself simply treat a GOTPC
10350 * relocation as asking for a pcrel offset to the GOT to be
10351 * added in, and the addend of the relocation is stored in the
10352 * operand field for the instruction itself.
10353 *
10354 * Our job here is to fix the operand so that it would add
10355 * the correct offset so that %ebx would point to itself. The
10356 * thing that is tricky is that .-.L66 will point to the
10357 * beginning of the instruction, so we need to further modify
10358 * the operand so that it will point to itself. There are
10359 * other cases where you have something like:
10360 *
10361 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
10362 *
10363 * and here no correction would be required. Internally in
10364 * the assembler we treat operands of this form as not being
10365 * pcrel since the '.' is explicitly mentioned, and I wonder
10366 * whether it would simplify matters to do it this way. Who
10367 * knows. In earlier versions of the PIC patches, the
10368 * pcrel_adjust field was used to store the correction, but
10369 * since the expression is not pcrel, I felt it would be
10370 * confusing to do it this way. */
10371
d6ab8113 10372 if ((reloc_type == BFD_RELOC_32
7b81dfbb
AJ
10373 || reloc_type == BFD_RELOC_X86_64_32S
10374 || reloc_type == BFD_RELOC_64)
29b0f896
AM
10375 && GOT_symbol
10376 && GOT_symbol == i.op[n].imms->X_add_symbol
10377 && (i.op[n].imms->X_op == O_symbol
10378 || (i.op[n].imms->X_op == O_add
10379 && ((symbol_get_value_expression
10380 (i.op[n].imms->X_op_symbol)->X_op)
10381 == O_subtract))))
10382 {
4fa24527 10383 if (!object_64bit)
d6ab8113 10384 reloc_type = BFD_RELOC_386_GOTPC;
7b81dfbb 10385 else if (size == 4)
d6ab8113 10386 reloc_type = BFD_RELOC_X86_64_GOTPC32;
7b81dfbb
AJ
10387 else if (size == 8)
10388 reloc_type = BFD_RELOC_X86_64_GOTPC64;
5b7c81bd 10389 i.has_gotpc_tls_reloc = true;
d583596c
JB
10390 i.op[n].imms->X_add_number +=
10391 encoding_length (insn_start_frag, insn_start_off, p);
29b0f896 10392 }
29b0f896
AM
10393 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
10394 i.op[n].imms, 0, reloc_type);
10395 }
10396 }
10397 }
252b5132
RH
10398}
10399\f
d182319b
JB
10400/* x86_cons_fix_new is called via the expression parsing code when a
10401 reloc is needed. We use this hook to get the correct .got reloc. */
d182319b
JB
10402static int cons_sign = -1;
10403
10404void
e3bb37b5 10405x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
62ebcb5c 10406 expressionS *exp, bfd_reloc_code_real_type r)
d182319b 10407{
d258b828 10408 r = reloc (len, 0, cons_sign, r);
d182319b
JB
10409
10410#ifdef TE_PE
10411 if (exp->X_op == O_secrel)
10412 {
10413 exp->X_op = O_symbol;
10414 r = BFD_RELOC_32_SECREL;
10415 }
145667f8
MH
10416 else if (exp->X_op == O_secidx)
10417 r = BFD_RELOC_16_SECIDX;
d182319b
JB
10418#endif
10419
10420 fix_new_exp (frag, off, len, exp, 0, r);
10421}
10422
357d1bd8
L
10423/* Export the ABI address size for use by TC_ADDRESS_BYTES for the
10424 purpose of the `.dc.a' internal pseudo-op. */
10425
10426int
10427x86_address_bytes (void)
10428{
10429 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
10430 return 4;
10431 return stdoutput->arch_info->bits_per_address / 8;
10432}
10433
deea4973
JB
10434#if (!(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
10435 || defined (LEX_AT)) && !defined (TE_PE)
d258b828 10436# define lex_got(reloc, adjust, types) NULL
718ddfc0 10437#else
f3c180ae
AM
10438/* Parse operands of the form
10439 <symbol>@GOTOFF+<nnn>
10440 and similar .plt or .got references.
10441
10442 If we find one, set up the correct relocation in RELOC and copy the
10443 input string, minus the `@GOTOFF' into a malloc'd buffer for
10444 parsing by the calling routine. Return this buffer, and if ADJUST
10445 is non-null set it to the length of the string we removed from the
10446 input line. Otherwise return NULL. */
10447static char *
91d6fa6a 10448lex_got (enum bfd_reloc_code_real *rel,
64e74474 10449 int *adjust,
d258b828 10450 i386_operand_type *types)
f3c180ae 10451{
7b81dfbb
AJ
10452 /* Some of the relocations depend on the size of what field is to
10453 be relocated. But in our callers i386_immediate and i386_displacement
10454 we don't yet know the operand size (this will be set by insn
10455 matching). Hence we record the word32 relocation here,
10456 and adjust the reloc according to the real size in reloc(). */
145667f8
MH
10457 static const struct
10458 {
f3c180ae 10459 const char *str;
cff8d58a 10460 int len;
4fa24527 10461 const enum bfd_reloc_code_real rel[2];
40fb9820 10462 const i386_operand_type types64;
5b7c81bd 10463 bool need_GOT_symbol;
145667f8
MH
10464 }
10465 gotrel[] =
10466 {
05909f23
JB
10467
10468#define OPERAND_TYPE_IMM32_32S_DISP32 { .bitfield = \
10469 { .imm32 = 1, .imm32s = 1, .disp32 = 1 } }
10470#define OPERAND_TYPE_IMM32_32S_64_DISP32 { .bitfield = \
10471 { .imm32 = 1, .imm32s = 1, .imm64 = 1, .disp32 = 1 } }
10472#define OPERAND_TYPE_IMM32_32S_64_DISP32_64 { .bitfield = \
10473 { .imm32 = 1, .imm32s = 1, .imm64 = 1, .disp32 = 1, .disp64 = 1 } }
10474#define OPERAND_TYPE_IMM64_DISP64 { .bitfield = \
10475 { .imm64 = 1, .disp64 = 1 } }
10476
deea4973 10477#ifndef TE_PE
8ce3d284 10478#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8fd4256d
L
10479 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
10480 BFD_RELOC_SIZE32 },
05909f23 10481 { .bitfield = { .imm32 = 1, .imm64 = 1 } }, false },
8ce3d284 10482#endif
cff8d58a
L
10483 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
10484 BFD_RELOC_X86_64_PLTOFF64 },
05909f23 10485 { .bitfield = { .imm64 = 1 } }, true },
cff8d58a
L
10486 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
10487 BFD_RELOC_X86_64_PLT32 },
a775efc8 10488 OPERAND_TYPE_IMM32_32S_DISP32, false },
cff8d58a
L
10489 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
10490 BFD_RELOC_X86_64_GOTPLT64 },
5b7c81bd 10491 OPERAND_TYPE_IMM64_DISP64, true },
cff8d58a
L
10492 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
10493 BFD_RELOC_X86_64_GOTOFF64 },
5b7c81bd 10494 OPERAND_TYPE_IMM64_DISP64, true },
cff8d58a
L
10495 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
10496 BFD_RELOC_X86_64_GOTPCREL },
a775efc8 10497 OPERAND_TYPE_IMM32_32S_DISP32, true },
cff8d58a
L
10498 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
10499 BFD_RELOC_X86_64_TLSGD },
a775efc8 10500 OPERAND_TYPE_IMM32_32S_DISP32, true },
cff8d58a
L
10501 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
10502 _dummy_first_bfd_reloc_code_real },
5b7c81bd 10503 OPERAND_TYPE_NONE, true },
cff8d58a
L
10504 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
10505 BFD_RELOC_X86_64_TLSLD },
a775efc8 10506 OPERAND_TYPE_IMM32_32S_DISP32, true },
cff8d58a
L
10507 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
10508 BFD_RELOC_X86_64_GOTTPOFF },
a775efc8 10509 OPERAND_TYPE_IMM32_32S_DISP32, true },
cff8d58a
L
10510 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
10511 BFD_RELOC_X86_64_TPOFF32 },
a775efc8 10512 OPERAND_TYPE_IMM32_32S_64_DISP32_64, true },
cff8d58a
L
10513 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
10514 _dummy_first_bfd_reloc_code_real },
5b7c81bd 10515 OPERAND_TYPE_NONE, true },
cff8d58a
L
10516 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
10517 BFD_RELOC_X86_64_DTPOFF32 },
a775efc8 10518 OPERAND_TYPE_IMM32_32S_64_DISP32_64, true },
cff8d58a
L
10519 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
10520 _dummy_first_bfd_reloc_code_real },
5b7c81bd 10521 OPERAND_TYPE_NONE, true },
cff8d58a
L
10522 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
10523 _dummy_first_bfd_reloc_code_real },
5b7c81bd 10524 OPERAND_TYPE_NONE, true },
cff8d58a
L
10525 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
10526 BFD_RELOC_X86_64_GOT32 },
a775efc8 10527 OPERAND_TYPE_IMM32_32S_64_DISP32, true },
cff8d58a
L
10528 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
10529 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
a775efc8 10530 OPERAND_TYPE_IMM32_32S_DISP32, true },
cff8d58a
L
10531 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
10532 BFD_RELOC_X86_64_TLSDESC_CALL },
a775efc8 10533 OPERAND_TYPE_IMM32_32S_DISP32, true },
deea4973
JB
10534#else /* TE_PE */
10535 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
10536 BFD_RELOC_32_SECREL },
a775efc8 10537 OPERAND_TYPE_IMM32_32S_64_DISP32_64, false },
deea4973 10538#endif
05909f23
JB
10539
10540#undef OPERAND_TYPE_IMM32_32S_DISP32
10541#undef OPERAND_TYPE_IMM32_32S_64_DISP32
10542#undef OPERAND_TYPE_IMM32_32S_64_DISP32_64
10543#undef OPERAND_TYPE_IMM64_DISP64
10544
f3c180ae
AM
10545 };
10546 char *cp;
10547 unsigned int j;
10548
deea4973 10549#if defined (OBJ_MAYBE_ELF) && !defined (TE_PE)
718ddfc0
JB
10550 if (!IS_ELF)
10551 return NULL;
d382c579 10552#endif
718ddfc0 10553
f3c180ae 10554 for (cp = input_line_pointer; *cp != '@'; cp++)
67c11a9b 10555 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
f3c180ae
AM
10556 return NULL;
10557
47465058 10558 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
f3c180ae 10559 {
cff8d58a 10560 int len = gotrel[j].len;
28f81592 10561 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
f3c180ae 10562 {
4fa24527 10563 if (gotrel[j].rel[object_64bit] != 0)
f3c180ae 10564 {
28f81592
AM
10565 int first, second;
10566 char *tmpbuf, *past_reloc;
f3c180ae 10567
91d6fa6a 10568 *rel = gotrel[j].rel[object_64bit];
f3c180ae 10569
3956db08
JB
10570 if (types)
10571 {
10572 if (flag_code != CODE_64BIT)
40fb9820
L
10573 {
10574 types->bitfield.imm32 = 1;
10575 types->bitfield.disp32 = 1;
10576 }
3956db08
JB
10577 else
10578 *types = gotrel[j].types64;
10579 }
10580
844bf810 10581 if (gotrel[j].need_GOT_symbol && GOT_symbol == NULL)
f3c180ae
AM
10582 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
10583
28f81592 10584 /* The length of the first part of our input line. */
f3c180ae 10585 first = cp - input_line_pointer;
28f81592
AM
10586
10587 /* The second part goes from after the reloc token until
67c11a9b 10588 (and including) an end_of_line char or comma. */
28f81592 10589 past_reloc = cp + 1 + len;
67c11a9b
AM
10590 cp = past_reloc;
10591 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10592 ++cp;
10593 second = cp + 1 - past_reloc;
28f81592
AM
10594
10595 /* Allocate and copy string. The trailing NUL shouldn't
10596 be necessary, but be safe. */
add39d23 10597 tmpbuf = XNEWVEC (char, first + second + 2);
f3c180ae 10598 memcpy (tmpbuf, input_line_pointer, first);
0787a12d
AM
10599 if (second != 0 && *past_reloc != ' ')
10600 /* Replace the relocation token with ' ', so that
10601 errors like foo@GOTOFF1 will be detected. */
10602 tmpbuf[first++] = ' ';
af89796a
L
10603 else
10604 /* Increment length by 1 if the relocation token is
10605 removed. */
10606 len++;
10607 if (adjust)
10608 *adjust = len;
0787a12d
AM
10609 memcpy (tmpbuf + first, past_reloc, second);
10610 tmpbuf[first + second] = '\0';
f3c180ae
AM
10611 return tmpbuf;
10612 }
10613
4fa24527
JB
10614 as_bad (_("@%s reloc is not supported with %d-bit output format"),
10615 gotrel[j].str, 1 << (5 + object_64bit));
f3c180ae
AM
10616 return NULL;
10617 }
10618 }
10619
10620 /* Might be a symbol version string. Don't as_bad here. */
10621 return NULL;
10622}
4e4f7c87 10623#endif
f3c180ae 10624
62ebcb5c 10625bfd_reloc_code_real_type
e3bb37b5 10626x86_cons (expressionS *exp, int size)
f3c180ae 10627{
62ebcb5c
AM
10628 bfd_reloc_code_real_type got_reloc = NO_RELOC;
10629
2748c1b1
L
10630#if ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
10631 && !defined (LEX_AT)) \
10632 || defined (TE_PE)
ee86248c
JB
10633 intel_syntax = -intel_syntax;
10634
3c7b9c2c 10635 exp->X_md = 0;
4fa24527 10636 if (size == 4 || (object_64bit && size == 8))
f3c180ae
AM
10637 {
10638 /* Handle @GOTOFF and the like in an expression. */
10639 char *save;
10640 char *gotfree_input_line;
4a57f2cf 10641 int adjust = 0;
f3c180ae
AM
10642
10643 save = input_line_pointer;
d258b828 10644 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
f3c180ae
AM
10645 if (gotfree_input_line)
10646 input_line_pointer = gotfree_input_line;
10647
10648 expression (exp);
10649
10650 if (gotfree_input_line)
10651 {
10652 /* expression () has merrily parsed up to the end of line,
10653 or a comma - in the wrong buffer. Transfer how far
10654 input_line_pointer has moved to the right buffer. */
10655 input_line_pointer = (save
10656 + (input_line_pointer - gotfree_input_line)
10657 + adjust);
10658 free (gotfree_input_line);
3992d3b7
AM
10659 if (exp->X_op == O_constant
10660 || exp->X_op == O_absent
10661 || exp->X_op == O_illegal
0398aac5 10662 || exp->X_op == O_register
3992d3b7
AM
10663 || exp->X_op == O_big)
10664 {
10665 char c = *input_line_pointer;
10666 *input_line_pointer = 0;
10667 as_bad (_("missing or invalid expression `%s'"), save);
10668 *input_line_pointer = c;
10669 }
b9519cfe
L
10670 else if ((got_reloc == BFD_RELOC_386_PLT32
10671 || got_reloc == BFD_RELOC_X86_64_PLT32)
10672 && exp->X_op != O_symbol)
10673 {
10674 char c = *input_line_pointer;
10675 *input_line_pointer = 0;
10676 as_bad (_("invalid PLT expression `%s'"), save);
10677 *input_line_pointer = c;
10678 }
f3c180ae
AM
10679 }
10680 }
10681 else
10682 expression (exp);
ee86248c
JB
10683
10684 intel_syntax = -intel_syntax;
10685
10686 if (intel_syntax)
10687 i386_intel_simplify (exp);
2748c1b1
L
10688#else
10689 expression (exp);
10690#endif
62ebcb5c 10691
a442cac5
JB
10692 /* If not 64bit, massage value, to account for wraparound when !BFD64. */
10693 if (size == 4 && exp->X_op == O_constant && !object_64bit)
10694 exp->X_add_number = extend_to_32bit_address (exp->X_add_number);
10695
62ebcb5c 10696 return got_reloc;
f3c180ae 10697}
f3c180ae 10698
9f32dd5b
L
10699static void
10700signed_cons (int size)
6482c264 10701{
a442cac5 10702 if (object_64bit)
d182319b
JB
10703 cons_sign = 1;
10704 cons (size);
10705 cons_sign = -1;
6482c264
NC
10706}
10707
d182319b 10708#ifdef TE_PE
6482c264 10709static void
7016a5d5 10710pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
6482c264
NC
10711{
10712 expressionS exp;
10713
10714 do
10715 {
10716 expression (&exp);
10717 if (exp.X_op == O_symbol)
10718 exp.X_op = O_secrel;
10719
10720 emit_expr (&exp, 4);
10721 }
10722 while (*input_line_pointer++ == ',');
10723
10724 input_line_pointer--;
10725 demand_empty_rest_of_line ();
10726}
145667f8
MH
10727
10728static void
10729pe_directive_secidx (int dummy ATTRIBUTE_UNUSED)
10730{
10731 expressionS exp;
10732
10733 do
10734 {
10735 expression (&exp);
10736 if (exp.X_op == O_symbol)
10737 exp.X_op = O_secidx;
10738
10739 emit_expr (&exp, 2);
10740 }
10741 while (*input_line_pointer++ == ',');
10742
10743 input_line_pointer--;
10744 demand_empty_rest_of_line ();
10745}
6482c264
NC
10746#endif
10747
7063667e
JB
10748/* Handle Rounding Control / SAE specifiers. */
10749
10750static char *
10751RC_SAE_specifier (const char *pstr)
10752{
10753 unsigned int j;
10754
10755 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
10756 {
10757 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
10758 {
10759 if (i.rounding.type != rc_none)
10760 {
10761 as_bad (_("duplicated `{%s}'"), RC_NamesTable[j].name);
10762 return NULL;
10763 }
10764
10765 i.rounding.type = RC_NamesTable[j].type;
10766
10767 return (char *)(pstr + RC_NamesTable[j].len);
10768 }
10769 }
10770
10771 return NULL;
10772}
10773
43234a1e
L
10774/* Handle Vector operations. */
10775
10776static char *
f70c6814 10777check_VecOperations (char *op_string)
43234a1e
L
10778{
10779 const reg_entry *mask;
10780 const char *saved;
10781 char *end_op;
10782
f70c6814 10783 while (*op_string)
43234a1e
L
10784 {
10785 saved = op_string;
10786 if (*op_string == '{')
10787 {
10788 op_string++;
10789
10790 /* Check broadcasts. */
d34049e8 10791 if (startswith (op_string, "1to"))
43234a1e 10792 {
5273a3cd 10793 unsigned int bcst_type;
43234a1e 10794
5273a3cd 10795 if (i.broadcast.type)
43234a1e
L
10796 goto duplicated_vec_op;
10797
10798 op_string += 3;
10799 if (*op_string == '8')
8e6e0792 10800 bcst_type = 8;
b28d1bda 10801 else if (*op_string == '4')
8e6e0792 10802 bcst_type = 4;
b28d1bda 10803 else if (*op_string == '2')
8e6e0792 10804 bcst_type = 2;
43234a1e
L
10805 else if (*op_string == '1'
10806 && *(op_string+1) == '6')
10807 {
8e6e0792 10808 bcst_type = 16;
43234a1e
L
10809 op_string++;
10810 }
0cc78721
CL
10811 else if (*op_string == '3'
10812 && *(op_string+1) == '2')
10813 {
10814 bcst_type = 32;
10815 op_string++;
10816 }
43234a1e
L
10817 else
10818 {
10819 as_bad (_("Unsupported broadcast: `%s'"), saved);
10820 return NULL;
10821 }
10822 op_string++;
10823
5273a3cd
JB
10824 i.broadcast.type = bcst_type;
10825 i.broadcast.operand = this_operand;
43234a1e
L
10826 }
10827 /* Check masking operation. */
10828 else if ((mask = parse_register (op_string, &end_op)) != NULL)
10829 {
8a6fb3f9
JB
10830 if (mask == &bad_reg)
10831 return NULL;
10832
43234a1e 10833 /* k0 can't be used for write mask. */
f74a6307 10834 if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
43234a1e 10835 {
6d2cd6b2
JB
10836 as_bad (_("`%s%s' can't be used for write mask"),
10837 register_prefix, mask->reg_name);
43234a1e
L
10838 return NULL;
10839 }
10840
6225c532 10841 if (!i.mask.reg)
43234a1e 10842 {
6225c532
JB
10843 i.mask.reg = mask;
10844 i.mask.operand = this_operand;
43234a1e 10845 }
6225c532
JB
10846 else if (i.mask.reg->reg_num)
10847 goto duplicated_vec_op;
43234a1e
L
10848 else
10849 {
6225c532 10850 i.mask.reg = mask;
43234a1e
L
10851
10852 /* Only "{z}" is allowed here. No need to check
10853 zeroing mask explicitly. */
6225c532 10854 if (i.mask.operand != (unsigned int) this_operand)
43234a1e
L
10855 {
10856 as_bad (_("invalid write mask `%s'"), saved);
10857 return NULL;
10858 }
10859 }
10860
10861 op_string = end_op;
10862 }
10863 /* Check zeroing-flag for masking operation. */
10864 else if (*op_string == 'z')
10865 {
6225c532 10866 if (!i.mask.reg)
43234a1e 10867 {
6225c532
JB
10868 i.mask.reg = reg_k0;
10869 i.mask.zeroing = 1;
10870 i.mask.operand = this_operand;
43234a1e
L
10871 }
10872 else
10873 {
6225c532 10874 if (i.mask.zeroing)
43234a1e
L
10875 {
10876 duplicated_vec_op:
10877 as_bad (_("duplicated `%s'"), saved);
10878 return NULL;
10879 }
10880
6225c532 10881 i.mask.zeroing = 1;
43234a1e
L
10882
10883 /* Only "{%k}" is allowed here. No need to check mask
10884 register explicitly. */
6225c532 10885 if (i.mask.operand != (unsigned int) this_operand)
43234a1e
L
10886 {
10887 as_bad (_("invalid zeroing-masking `%s'"),
10888 saved);
10889 return NULL;
10890 }
10891 }
10892
10893 op_string++;
10894 }
7063667e
JB
10895 else if (intel_syntax
10896 && (op_string = RC_SAE_specifier (op_string)) != NULL)
10897 i.rounding.modifier = true;
43234a1e
L
10898 else
10899 goto unknown_vec_op;
10900
10901 if (*op_string != '}')
10902 {
10903 as_bad (_("missing `}' in `%s'"), saved);
10904 return NULL;
10905 }
10906 op_string++;
0ba3a731
L
10907
10908 /* Strip whitespace since the addition of pseudo prefixes
10909 changed how the scrubber treats '{'. */
10910 if (is_space_char (*op_string))
10911 ++op_string;
10912
43234a1e
L
10913 continue;
10914 }
10915 unknown_vec_op:
10916 /* We don't know this one. */
10917 as_bad (_("unknown vector operation: `%s'"), saved);
10918 return NULL;
10919 }
10920
6225c532 10921 if (i.mask.reg && i.mask.zeroing && !i.mask.reg->reg_num)
6d2cd6b2
JB
10922 {
10923 as_bad (_("zeroing-masking only allowed with write mask"));
10924 return NULL;
10925 }
10926
43234a1e
L
10927 return op_string;
10928}
10929
252b5132 10930static int
70e41ade 10931i386_immediate (char *imm_start)
252b5132
RH
10932{
10933 char *save_input_line_pointer;
f3c180ae 10934 char *gotfree_input_line;
252b5132 10935 segT exp_seg = 0;
47926f60 10936 expressionS *exp;
40fb9820
L
10937 i386_operand_type types;
10938
0dfbf9d7 10939 operand_type_set (&types, ~0);
252b5132
RH
10940
10941 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
10942 {
31b2323c
L
10943 as_bad (_("at most %d immediate operands are allowed"),
10944 MAX_IMMEDIATE_OPERANDS);
252b5132
RH
10945 return 0;
10946 }
10947
10948 exp = &im_expressions[i.imm_operands++];
520dc8e8 10949 i.op[this_operand].imms = exp;
252b5132
RH
10950
10951 if (is_space_char (*imm_start))
10952 ++imm_start;
10953
10954 save_input_line_pointer = input_line_pointer;
10955 input_line_pointer = imm_start;
10956
d258b828 10957 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
f3c180ae
AM
10958 if (gotfree_input_line)
10959 input_line_pointer = gotfree_input_line;
252b5132
RH
10960
10961 exp_seg = expression (exp);
10962
83183c0c 10963 SKIP_WHITESPACE ();
252b5132 10964 if (*input_line_pointer)
f3c180ae 10965 as_bad (_("junk `%s' after expression"), input_line_pointer);
252b5132
RH
10966
10967 input_line_pointer = save_input_line_pointer;
f3c180ae 10968 if (gotfree_input_line)
ee86248c
JB
10969 {
10970 free (gotfree_input_line);
10971
9aac24b1 10972 if (exp->X_op == O_constant)
ee86248c
JB
10973 exp->X_op = O_illegal;
10974 }
10975
9aac24b1
JB
10976 if (exp_seg == reg_section)
10977 {
10978 as_bad (_("illegal immediate register operand %s"), imm_start);
10979 return 0;
10980 }
10981
ee86248c
JB
10982 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
10983}
252b5132 10984
ee86248c
JB
10985static int
10986i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10987 i386_operand_type types, const char *imm_start)
10988{
10989 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
252b5132 10990 {
313c53d1
L
10991 if (imm_start)
10992 as_bad (_("missing or invalid immediate expression `%s'"),
10993 imm_start);
3992d3b7 10994 return 0;
252b5132 10995 }
3e73aa7c 10996 else if (exp->X_op == O_constant)
252b5132 10997 {
47926f60 10998 /* Size it properly later. */
40fb9820 10999 i.types[this_operand].bitfield.imm64 = 1;
a442cac5
JB
11000
11001 /* If not 64bit, sign/zero extend val, to account for wraparound
11002 when !BFD64. */
11003 if (flag_code != CODE_64BIT)
11004 exp->X_add_number = extend_to_32bit_address (exp->X_add_number);
252b5132 11005 }
4c63da97 11006#if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
f86103b7 11007 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
31312f95 11008 && exp_seg != absolute_section
47926f60 11009 && exp_seg != text_section
24eab124
AM
11010 && exp_seg != data_section
11011 && exp_seg != bss_section
11012 && exp_seg != undefined_section
f86103b7 11013 && !bfd_is_com_section (exp_seg))
252b5132 11014 {
d0b47220 11015 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
252b5132
RH
11016 return 0;
11017 }
11018#endif
11019 else
11020 {
11021 /* This is an address. The size of the address will be
24eab124 11022 determined later, depending on destination register,
3e73aa7c 11023 suffix, or the default for the section. */
40fb9820
L
11024 i.types[this_operand].bitfield.imm8 = 1;
11025 i.types[this_operand].bitfield.imm16 = 1;
11026 i.types[this_operand].bitfield.imm32 = 1;
11027 i.types[this_operand].bitfield.imm32s = 1;
11028 i.types[this_operand].bitfield.imm64 = 1;
c6fb90c8
L
11029 i.types[this_operand] = operand_type_and (i.types[this_operand],
11030 types);
252b5132
RH
11031 }
11032
11033 return 1;
11034}
11035
551c1ca1 11036static char *
e3bb37b5 11037i386_scale (char *scale)
252b5132 11038{
551c1ca1
AM
11039 offsetT val;
11040 char *save = input_line_pointer;
252b5132 11041
551c1ca1
AM
11042 input_line_pointer = scale;
11043 val = get_absolute_expression ();
11044
11045 switch (val)
252b5132 11046 {
551c1ca1 11047 case 1:
252b5132
RH
11048 i.log2_scale_factor = 0;
11049 break;
551c1ca1 11050 case 2:
252b5132
RH
11051 i.log2_scale_factor = 1;
11052 break;
551c1ca1 11053 case 4:
252b5132
RH
11054 i.log2_scale_factor = 2;
11055 break;
551c1ca1 11056 case 8:
252b5132
RH
11057 i.log2_scale_factor = 3;
11058 break;
11059 default:
a724f0f4
JB
11060 {
11061 char sep = *input_line_pointer;
11062
11063 *input_line_pointer = '\0';
11064 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
11065 scale);
11066 *input_line_pointer = sep;
11067 input_line_pointer = save;
11068 return NULL;
11069 }
252b5132 11070 }
29b0f896 11071 if (i.log2_scale_factor != 0 && i.index_reg == 0)
252b5132
RH
11072 {
11073 as_warn (_("scale factor of %d without an index register"),
24eab124 11074 1 << i.log2_scale_factor);
252b5132 11075 i.log2_scale_factor = 0;
252b5132 11076 }
551c1ca1
AM
11077 scale = input_line_pointer;
11078 input_line_pointer = save;
11079 return scale;
252b5132
RH
11080}
11081
252b5132 11082static int
e3bb37b5 11083i386_displacement (char *disp_start, char *disp_end)
252b5132 11084{
29b0f896 11085 expressionS *exp;
252b5132
RH
11086 segT exp_seg = 0;
11087 char *save_input_line_pointer;
f3c180ae 11088 char *gotfree_input_line;
40fb9820
L
11089 int override;
11090 i386_operand_type bigdisp, types = anydisp;
3992d3b7 11091 int ret;
252b5132 11092
31b2323c
L
11093 if (i.disp_operands == MAX_MEMORY_OPERANDS)
11094 {
11095 as_bad (_("at most %d displacement operands are allowed"),
11096 MAX_MEMORY_OPERANDS);
11097 return 0;
11098 }
11099
0dfbf9d7 11100 operand_type_set (&bigdisp, 0);
6f2f06be 11101 if (i.jumpabsolute
48bcea9f 11102 || i.types[this_operand].bitfield.baseindex
0cfa3eb3
JB
11103 || (current_templates->start->opcode_modifier.jump != JUMP
11104 && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
e05278af 11105 {
48bcea9f 11106 i386_addressing_mode ();
e05278af 11107 override = (i.prefix[ADDR_PREFIX] != 0);
40fb9820
L
11108 if (flag_code == CODE_64BIT)
11109 {
a775efc8 11110 bigdisp.bitfield.disp32 = 1;
40fb9820 11111 if (!override)
a775efc8 11112 bigdisp.bitfield.disp64 = 1;
40fb9820
L
11113 }
11114 else if ((flag_code == CODE_16BIT) ^ override)
40fb9820 11115 bigdisp.bitfield.disp16 = 1;
48bcea9f
JB
11116 else
11117 bigdisp.bitfield.disp32 = 1;
e05278af
JB
11118 }
11119 else
11120 {
376cd056
JB
11121 /* For PC-relative branches, the width of the displacement may be
11122 dependent upon data size, but is never dependent upon address size.
11123 Also make sure to not unintentionally match against a non-PC-relative
11124 branch template. */
11125 static templates aux_templates;
11126 const insn_template *t = current_templates->start;
5b7c81bd 11127 bool has_intel64 = false;
376cd056
JB
11128
11129 aux_templates.start = t;
11130 while (++t < current_templates->end)
11131 {
11132 if (t->opcode_modifier.jump
11133 != current_templates->start->opcode_modifier.jump)
11134 break;
4b5aaf5f 11135 if ((t->opcode_modifier.isa64 >= INTEL64))
5b7c81bd 11136 has_intel64 = true;
376cd056
JB
11137 }
11138 if (t < current_templates->end)
11139 {
11140 aux_templates.end = t;
11141 current_templates = &aux_templates;
11142 }
11143
e05278af 11144 override = (i.prefix[DATA_PREFIX] != 0);
40fb9820
L
11145 if (flag_code == CODE_64BIT)
11146 {
376cd056
JB
11147 if ((override || i.suffix == WORD_MNEM_SUFFIX)
11148 && (!intel64 || !has_intel64))
40fb9820
L
11149 bigdisp.bitfield.disp16 = 1;
11150 else
a775efc8 11151 bigdisp.bitfield.disp32 = 1;
40fb9820
L
11152 }
11153 else
e05278af
JB
11154 {
11155 if (!override)
11156 override = (i.suffix == (flag_code != CODE_16BIT
11157 ? WORD_MNEM_SUFFIX
11158 : LONG_MNEM_SUFFIX));
40fb9820
L
11159 bigdisp.bitfield.disp32 = 1;
11160 if ((flag_code == CODE_16BIT) ^ override)
11161 {
11162 bigdisp.bitfield.disp32 = 0;
11163 bigdisp.bitfield.disp16 = 1;
11164 }
e05278af 11165 }
e05278af 11166 }
c6fb90c8
L
11167 i.types[this_operand] = operand_type_or (i.types[this_operand],
11168 bigdisp);
252b5132
RH
11169
11170 exp = &disp_expressions[i.disp_operands];
520dc8e8 11171 i.op[this_operand].disps = exp;
252b5132
RH
11172 i.disp_operands++;
11173 save_input_line_pointer = input_line_pointer;
11174 input_line_pointer = disp_start;
11175 END_STRING_AND_SAVE (disp_end);
11176
11177#ifndef GCC_ASM_O_HACK
11178#define GCC_ASM_O_HACK 0
11179#endif
11180#if GCC_ASM_O_HACK
11181 END_STRING_AND_SAVE (disp_end + 1);
40fb9820 11182 if (i.types[this_operand].bitfield.baseIndex
24eab124 11183 && displacement_string_end[-1] == '+')
252b5132
RH
11184 {
11185 /* This hack is to avoid a warning when using the "o"
24eab124
AM
11186 constraint within gcc asm statements.
11187 For instance:
11188
11189 #define _set_tssldt_desc(n,addr,limit,type) \
11190 __asm__ __volatile__ ( \
11191 "movw %w2,%0\n\t" \
11192 "movw %w1,2+%0\n\t" \
11193 "rorl $16,%1\n\t" \
11194 "movb %b1,4+%0\n\t" \
11195 "movb %4,5+%0\n\t" \
11196 "movb $0,6+%0\n\t" \
11197 "movb %h1,7+%0\n\t" \
11198 "rorl $16,%1" \
11199 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
11200
11201 This works great except that the output assembler ends
11202 up looking a bit weird if it turns out that there is
11203 no offset. You end up producing code that looks like:
11204
11205 #APP
11206 movw $235,(%eax)
11207 movw %dx,2+(%eax)
11208 rorl $16,%edx
11209 movb %dl,4+(%eax)
11210 movb $137,5+(%eax)
11211 movb $0,6+(%eax)
11212 movb %dh,7+(%eax)
11213 rorl $16,%edx
11214 #NO_APP
11215
47926f60 11216 So here we provide the missing zero. */
24eab124
AM
11217
11218 *displacement_string_end = '0';
252b5132
RH
11219 }
11220#endif
d258b828 11221 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
f3c180ae
AM
11222 if (gotfree_input_line)
11223 input_line_pointer = gotfree_input_line;
252b5132 11224
24eab124 11225 exp_seg = expression (exp);
252b5132 11226
636c26b0
AM
11227 SKIP_WHITESPACE ();
11228 if (*input_line_pointer)
11229 as_bad (_("junk `%s' after expression"), input_line_pointer);
11230#if GCC_ASM_O_HACK
11231 RESTORE_END_STRING (disp_end + 1);
11232#endif
636c26b0 11233 input_line_pointer = save_input_line_pointer;
636c26b0 11234 if (gotfree_input_line)
ee86248c
JB
11235 {
11236 free (gotfree_input_line);
11237
11238 if (exp->X_op == O_constant || exp->X_op == O_register)
11239 exp->X_op = O_illegal;
11240 }
11241
11242 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
11243
11244 RESTORE_END_STRING (disp_end);
11245
11246 return ret;
11247}
11248
11249static int
11250i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
11251 i386_operand_type types, const char *disp_start)
11252{
ee86248c 11253 int ret = 1;
636c26b0 11254
24eab124
AM
11255 /* We do this to make sure that the section symbol is in
11256 the symbol table. We will ultimately change the relocation
47926f60 11257 to be relative to the beginning of the section. */
1ae12ab7 11258 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
d6ab8113
JB
11259 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
11260 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
24eab124 11261 {
636c26b0 11262 if (exp->X_op != O_symbol)
3992d3b7 11263 goto inv_disp;
636c26b0 11264
e5cb08ac 11265 if (S_IS_LOCAL (exp->X_add_symbol)
c64efb4b
L
11266 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
11267 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
24eab124 11268 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
24eab124
AM
11269 exp->X_op = O_subtract;
11270 exp->X_op_symbol = GOT_symbol;
1ae12ab7 11271 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
29b0f896 11272 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
d6ab8113
JB
11273 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
11274 i.reloc[this_operand] = BFD_RELOC_64;
23df1078 11275 else
29b0f896 11276 i.reloc[this_operand] = BFD_RELOC_32;
24eab124 11277 }
252b5132 11278
3992d3b7
AM
11279 else if (exp->X_op == O_absent
11280 || exp->X_op == O_illegal
ee86248c 11281 || exp->X_op == O_big)
2daf4fd8 11282 {
3992d3b7
AM
11283 inv_disp:
11284 as_bad (_("missing or invalid displacement expression `%s'"),
2daf4fd8 11285 disp_start);
3992d3b7 11286 ret = 0;
2daf4fd8
AM
11287 }
11288
a50187b2
JB
11289 else if (exp->X_op == O_constant)
11290 {
11291 /* Sizing gets taken care of by optimize_disp().
11292
11293 If not 64bit, sign/zero extend val, to account for wraparound
11294 when !BFD64. */
11295 if (flag_code != CODE_64BIT)
11296 exp->X_add_number = extend_to_32bit_address (exp->X_add_number);
11297 }
11298
4c63da97 11299#if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
a50187b2 11300 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
3992d3b7
AM
11301 && exp_seg != absolute_section
11302 && exp_seg != text_section
11303 && exp_seg != data_section
11304 && exp_seg != bss_section
11305 && exp_seg != undefined_section
11306 && !bfd_is_com_section (exp_seg))
24eab124 11307 {
d0b47220 11308 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
3992d3b7 11309 ret = 0;
24eab124 11310 }
252b5132 11311#endif
3956db08 11312
a50187b2 11313 else if (current_templates->start->opcode_modifier.jump == JUMP_BYTE)
48bcea9f
JB
11314 i.types[this_operand].bitfield.disp8 = 1;
11315
40fb9820 11316 /* Check if this is a displacement only operand. */
02b83698
JB
11317 if (!i.types[this_operand].bitfield.baseindex)
11318 i.types[this_operand] =
11319 operand_type_or (operand_type_and_not (i.types[this_operand], anydisp),
11320 operand_type_and (i.types[this_operand], types));
3956db08 11321
3992d3b7 11322 return ret;
252b5132
RH
11323}
11324
2abc2bec
JB
11325/* Return the active addressing mode, taking address override and
11326 registers forming the address into consideration. Update the
11327 address override prefix if necessary. */
47926f60 11328
2abc2bec
JB
11329static enum flag_code
11330i386_addressing_mode (void)
252b5132 11331{
be05d201
L
11332 enum flag_code addr_mode;
11333
11334 if (i.prefix[ADDR_PREFIX])
11335 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
a23b33b3
JB
11336 else if (flag_code == CODE_16BIT
11337 && current_templates->start->cpu_flags.bitfield.cpumpx
11338 /* Avoid replacing the "16-bit addressing not allowed" diagnostic
11339 from md_assemble() by "is not a valid base/index expression"
11340 when there is a base and/or index. */
11341 && !i.types[this_operand].bitfield.baseindex)
11342 {
11343 /* MPX insn memory operands with neither base nor index must be forced
11344 to use 32-bit addressing in 16-bit mode. */
11345 addr_mode = CODE_32BIT;
11346 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
11347 ++i.prefixes;
11348 gas_assert (!i.types[this_operand].bitfield.disp16);
11349 gas_assert (!i.types[this_operand].bitfield.disp32);
11350 }
be05d201
L
11351 else
11352 {
11353 addr_mode = flag_code;
11354
24eab124 11355#if INFER_ADDR_PREFIX
be05d201
L
11356 if (i.mem_operands == 0)
11357 {
11358 /* Infer address prefix from the first memory operand. */
11359 const reg_entry *addr_reg = i.base_reg;
11360
11361 if (addr_reg == NULL)
11362 addr_reg = i.index_reg;
eecb386c 11363
be05d201
L
11364 if (addr_reg)
11365 {
e968fc9b 11366 if (addr_reg->reg_type.bitfield.dword)
be05d201
L
11367 addr_mode = CODE_32BIT;
11368 else if (flag_code != CODE_64BIT
dc821c5f 11369 && addr_reg->reg_type.bitfield.word)
be05d201
L
11370 addr_mode = CODE_16BIT;
11371
11372 if (addr_mode != flag_code)
11373 {
11374 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
11375 i.prefixes += 1;
11376 /* Change the size of any displacement too. At most one
11377 of Disp16 or Disp32 is set.
11378 FIXME. There doesn't seem to be any real need for
11379 separate Disp16 and Disp32 flags. The same goes for
11380 Imm16 and Imm32. Removing them would probably clean
11381 up the code quite a lot. */
11382 if (flag_code != CODE_64BIT
11383 && (i.types[this_operand].bitfield.disp16
11384 || i.types[this_operand].bitfield.disp32))
05909f23
JB
11385 {
11386 static const i386_operand_type disp16_32 = {
11387 .bitfield = { .disp16 = 1, .disp32 = 1 }
11388 };
11389
11390 i.types[this_operand]
11391 = operand_type_xor (i.types[this_operand], disp16_32);
11392 }
be05d201
L
11393 }
11394 }
11395 }
24eab124 11396#endif
be05d201
L
11397 }
11398
2abc2bec
JB
11399 return addr_mode;
11400}
11401
11402/* Make sure the memory operand we've been dealt is valid.
11403 Return 1 on success, 0 on a failure. */
11404
11405static int
11406i386_index_check (const char *operand_string)
11407{
11408 const char *kind = "base/index";
11409 enum flag_code addr_mode = i386_addressing_mode ();
77a19f0e 11410 const insn_template *t = current_templates->end - 1;
2abc2bec 11411
77a19f0e 11412 if (t->opcode_modifier.isstring)
fc0763e6
JB
11413 {
11414 /* Memory operands of string insns are special in that they only allow
11415 a single register (rDI, rSI, or rBX) as their memory address. */
be05d201
L
11416 const reg_entry *expected_reg;
11417 static const char *di_si[][2] =
11418 {
11419 { "esi", "edi" },
11420 { "si", "di" },
11421 { "rsi", "rdi" }
11422 };
11423 static const char *bx[] = { "ebx", "bx", "rbx" };
fc0763e6
JB
11424
11425 kind = "string address";
11426
a152332d 11427 if (t->opcode_modifier.prefixok == PrefixRep)
fc0763e6 11428 {
77a19f0e 11429 int es_op = t->opcode_modifier.isstring - IS_STRING_ES_OP0;
51c8edf6 11430 int op = 0;
fc0763e6 11431
77a19f0e 11432 if (!t->operand_types[0].bitfield.baseindex
fc0763e6 11433 || ((!i.mem_operands != !intel_syntax)
77a19f0e 11434 && t->operand_types[1].bitfield.baseindex))
51c8edf6 11435 op = 1;
fe0e921f
AM
11436 expected_reg
11437 = (const reg_entry *) str_hash_find (reg_hash,
11438 di_si[addr_mode][op == es_op]);
fc0763e6
JB
11439 }
11440 else
fe0e921f
AM
11441 expected_reg
11442 = (const reg_entry *)str_hash_find (reg_hash, bx[addr_mode]);
fc0763e6 11443
be05d201
L
11444 if (i.base_reg != expected_reg
11445 || i.index_reg
fc0763e6 11446 || operand_type_check (i.types[this_operand], disp))
fc0763e6 11447 {
be05d201
L
11448 /* The second memory operand must have the same size as
11449 the first one. */
11450 if (i.mem_operands
11451 && i.base_reg
11452 && !((addr_mode == CODE_64BIT
dc821c5f 11453 && i.base_reg->reg_type.bitfield.qword)
be05d201 11454 || (addr_mode == CODE_32BIT
dc821c5f
JB
11455 ? i.base_reg->reg_type.bitfield.dword
11456 : i.base_reg->reg_type.bitfield.word)))
be05d201
L
11457 goto bad_address;
11458
fc0763e6
JB
11459 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
11460 operand_string,
11461 intel_syntax ? '[' : '(',
11462 register_prefix,
be05d201 11463 expected_reg->reg_name,
fc0763e6 11464 intel_syntax ? ']' : ')');
be05d201 11465 return 1;
fc0763e6 11466 }
be05d201
L
11467 else
11468 return 1;
11469
dc1e8a47 11470 bad_address:
be05d201
L
11471 as_bad (_("`%s' is not a valid %s expression"),
11472 operand_string, kind);
11473 return 0;
3e73aa7c
JH
11474 }
11475 else
11476 {
77a19f0e
JB
11477 t = current_templates->start;
11478
be05d201
L
11479 if (addr_mode != CODE_16BIT)
11480 {
11481 /* 32-bit/64-bit checks. */
41eb8e88
L
11482 if (i.disp_encoding == disp_encoding_16bit)
11483 {
11484 bad_disp:
11485 as_bad (_("invalid `%s' prefix"),
11486 addr_mode == CODE_16BIT ? "{disp32}" : "{disp16}");
11487 return 0;
11488 }
11489
be05d201 11490 if ((i.base_reg
e968fc9b
JB
11491 && ((addr_mode == CODE_64BIT
11492 ? !i.base_reg->reg_type.bitfield.qword
11493 : !i.base_reg->reg_type.bitfield.dword)
11494 || (i.index_reg && i.base_reg->reg_num == RegIP)
11495 || i.base_reg->reg_num == RegIZ))
be05d201 11496 || (i.index_reg
1b54b8d7
JB
11497 && !i.index_reg->reg_type.bitfield.xmmword
11498 && !i.index_reg->reg_type.bitfield.ymmword
11499 && !i.index_reg->reg_type.bitfield.zmmword
be05d201 11500 && ((addr_mode == CODE_64BIT
e968fc9b
JB
11501 ? !i.index_reg->reg_type.bitfield.qword
11502 : !i.index_reg->reg_type.bitfield.dword)
be05d201
L
11503 || !i.index_reg->reg_type.bitfield.baseindex)))
11504 goto bad_address;
8178be5b 11505
260cd341 11506 /* bndmk, bndldx, bndstx and mandatory non-vector SIB have special restrictions. */
7fc69528
JB
11507 if (t->mnem_off == MN_bndmk
11508 || t->mnem_off == MN_bndldx
11509 || t->mnem_off == MN_bndstx
a152332d 11510 || t->opcode_modifier.sib == SIBMEM)
8178be5b
JB
11511 {
11512 /* They cannot use RIP-relative addressing. */
e968fc9b 11513 if (i.base_reg && i.base_reg->reg_num == RegIP)
8178be5b
JB
11514 {
11515 as_bad (_("`%s' cannot be used here"), operand_string);
11516 return 0;
11517 }
11518
11519 /* bndldx and bndstx ignore their scale factor. */
7fc69528 11520 if ((t->mnem_off == MN_bndldx || t->mnem_off == MN_bndstx)
8178be5b
JB
11521 && i.log2_scale_factor)
11522 as_warn (_("register scaling is being ignored here"));
11523 }
be05d201
L
11524 }
11525 else
3e73aa7c 11526 {
be05d201 11527 /* 16-bit checks. */
41eb8e88
L
11528 if (i.disp_encoding == disp_encoding_32bit)
11529 goto bad_disp;
11530
3e73aa7c 11531 if ((i.base_reg
dc821c5f 11532 && (!i.base_reg->reg_type.bitfield.word
40fb9820 11533 || !i.base_reg->reg_type.bitfield.baseindex))
3e73aa7c 11534 || (i.index_reg
dc821c5f 11535 && (!i.index_reg->reg_type.bitfield.word
40fb9820 11536 || !i.index_reg->reg_type.bitfield.baseindex
29b0f896
AM
11537 || !(i.base_reg
11538 && i.base_reg->reg_num < 6
11539 && i.index_reg->reg_num >= 6
11540 && i.log2_scale_factor == 0))))
be05d201 11541 goto bad_address;
3e73aa7c
JH
11542 }
11543 }
be05d201 11544 return 1;
24eab124 11545}
252b5132 11546
43234a1e
L
11547/* Handle vector immediates. */
11548
11549static int
11550RC_SAE_immediate (const char *imm_start)
11551{
43234a1e 11552 const char *pstr = imm_start;
43234a1e
L
11553
11554 if (*pstr != '{')
11555 return 0;
11556
7063667e
JB
11557 pstr = RC_SAE_specifier (pstr + 1);
11558 if (pstr == NULL)
43234a1e
L
11559 return 0;
11560
11561 if (*pstr++ != '}')
11562 {
11563 as_bad (_("Missing '}': '%s'"), imm_start);
11564 return 0;
11565 }
11566 /* RC/SAE immediate string should contain nothing more. */;
11567 if (*pstr != 0)
11568 {
11569 as_bad (_("Junk after '}': '%s'"), imm_start);
11570 return 0;
11571 }
11572
cf665fee
JB
11573 /* Internally this doesn't count as an operand. */
11574 --i.operands;
43234a1e 11575
43234a1e
L
11576 return 1;
11577}
11578
9d299bea
JB
11579static INLINE bool starts_memory_operand (char c)
11580{
014fbcda 11581 return ISDIGIT (c)
9d299bea 11582 || is_identifier_char (c)
014fbcda 11583 || strchr ("([\"+-!~", c);
9d299bea
JB
11584}
11585
fc0763e6 11586/* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
47926f60 11587 on error. */
252b5132 11588
252b5132 11589static int
a7619375 11590i386_att_operand (char *operand_string)
252b5132 11591{
af6bdddf
AM
11592 const reg_entry *r;
11593 char *end_op;
24eab124 11594 char *op_string = operand_string;
252b5132 11595
24eab124 11596 if (is_space_char (*op_string))
252b5132
RH
11597 ++op_string;
11598
24eab124 11599 /* We check for an absolute prefix (differentiating,
47926f60 11600 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'. */
24eab124
AM
11601 if (*op_string == ABSOLUTE_PREFIX)
11602 {
11603 ++op_string;
11604 if (is_space_char (*op_string))
11605 ++op_string;
5b7c81bd 11606 i.jumpabsolute = true;
24eab124 11607 }
252b5132 11608
47926f60 11609 /* Check if operand is a register. */
4d1bb795 11610 if ((r = parse_register (op_string, &end_op)) != NULL)
24eab124 11611 {
40fb9820
L
11612 i386_operand_type temp;
11613
8a6fb3f9
JB
11614 if (r == &bad_reg)
11615 return 0;
11616
24eab124
AM
11617 /* Check for a segment override by searching for ':' after a
11618 segment register. */
11619 op_string = end_op;
11620 if (is_space_char (*op_string))
11621 ++op_string;
00cee14f 11622 if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
24eab124 11623 {
5e042380 11624 i.seg[i.mem_operands] = r;
252b5132 11625
24eab124 11626 /* Skip the ':' and whitespace. */
252b5132
RH
11627 ++op_string;
11628 if (is_space_char (*op_string))
24eab124 11629 ++op_string;
252b5132 11630
47926f60 11631 /* Handle case of %es:*foo. */
c8d541e2 11632 if (!i.jumpabsolute && *op_string == ABSOLUTE_PREFIX)
24eab124
AM
11633 {
11634 ++op_string;
11635 if (is_space_char (*op_string))
11636 ++op_string;
5b7c81bd 11637 i.jumpabsolute = true;
24eab124 11638 }
c8d541e2 11639
9d299bea 11640 if (!starts_memory_operand (*op_string))
c8d541e2
JB
11641 {
11642 as_bad (_("bad memory operand `%s'"), op_string);
11643 return 0;
11644 }
24eab124
AM
11645 goto do_memory_reference;
11646 }
43234a1e
L
11647
11648 /* Handle vector operations. */
11649 if (*op_string == '{')
11650 {
f70c6814 11651 op_string = check_VecOperations (op_string);
43234a1e
L
11652 if (op_string == NULL)
11653 return 0;
11654 }
11655
24eab124
AM
11656 if (*op_string)
11657 {
d0b47220 11658 as_bad (_("junk `%s' after register"), op_string);
24eab124
AM
11659 return 0;
11660 }
40fb9820
L
11661 temp = r->reg_type;
11662 temp.bitfield.baseindex = 0;
c6fb90c8
L
11663 i.types[this_operand] = operand_type_or (i.types[this_operand],
11664 temp);
7d5e4556 11665 i.types[this_operand].bitfield.unspecified = 0;
520dc8e8 11666 i.op[this_operand].regs = r;
24eab124 11667 i.reg_operands++;
cf665fee
JB
11668
11669 /* A GPR may follow an RC or SAE immediate only if a (vector) register
11670 operand was also present earlier on. */
11671 if (i.rounding.type != rc_none && temp.bitfield.class == Reg
11672 && i.reg_operands == 1)
11673 {
11674 unsigned int j;
11675
11676 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); ++j)
11677 if (i.rounding.type == RC_NamesTable[j].type)
11678 break;
11679 as_bad (_("`%s': misplaced `{%s}'"),
76d3f746 11680 insn_name (current_templates->start), RC_NamesTable[j].name);
cf665fee
JB
11681 return 0;
11682 }
24eab124 11683 }
af6bdddf
AM
11684 else if (*op_string == REGISTER_PREFIX)
11685 {
11686 as_bad (_("bad register name `%s'"), op_string);
11687 return 0;
11688 }
24eab124 11689 else if (*op_string == IMMEDIATE_PREFIX)
ce8a8b2f 11690 {
24eab124 11691 ++op_string;
6f2f06be 11692 if (i.jumpabsolute)
24eab124 11693 {
d0b47220 11694 as_bad (_("immediate operand illegal with absolute jump"));
24eab124
AM
11695 return 0;
11696 }
11697 if (!i386_immediate (op_string))
11698 return 0;
cf665fee
JB
11699 if (i.rounding.type != rc_none)
11700 {
11701 as_bad (_("`%s': RC/SAE operand must follow immediate operands"),
76d3f746 11702 insn_name (current_templates->start));
cf665fee
JB
11703 return 0;
11704 }
24eab124 11705 }
43234a1e
L
11706 else if (RC_SAE_immediate (operand_string))
11707 {
cf665fee
JB
11708 /* If it is a RC or SAE immediate, do the necessary placement check:
11709 Only another immediate or a GPR may precede it. */
11710 if (i.mem_operands || i.reg_operands + i.imm_operands > 1
11711 || (i.reg_operands == 1
11712 && i.op[0].regs->reg_type.bitfield.class != Reg))
11713 {
11714 as_bad (_("`%s': misplaced `%s'"),
76d3f746 11715 insn_name (current_templates->start), operand_string);
cf665fee
JB
11716 return 0;
11717 }
43234a1e 11718 }
9d299bea 11719 else if (starts_memory_operand (*op_string))
24eab124 11720 {
47926f60 11721 /* This is a memory reference of some sort. */
af6bdddf 11722 char *base_string;
252b5132 11723
47926f60 11724 /* Start and end of displacement string expression (if found). */
eecb386c
AM
11725 char *displacement_string_start;
11726 char *displacement_string_end;
252b5132 11727
24eab124 11728 do_memory_reference:
24eab124
AM
11729 /* Check for base index form. We detect the base index form by
11730 looking for an ')' at the end of the operand, searching
11731 for the '(' matching it, and finding a REGISTER_PREFIX or ','
11732 after the '('. */
af6bdddf 11733 base_string = op_string + strlen (op_string);
c3332e24 11734
43234a1e 11735 /* Handle vector operations. */
6b5ba0d4
JB
11736 --base_string;
11737 if (is_space_char (*base_string))
11738 --base_string;
11739
11740 if (*base_string == '}')
43234a1e 11741 {
6b5ba0d4
JB
11742 char *vop_start = NULL;
11743
11744 while (base_string-- > op_string)
11745 {
11746 if (*base_string == '"')
11747 break;
11748 if (*base_string != '{')
11749 continue;
11750
11751 vop_start = base_string;
11752
11753 --base_string;
11754 if (is_space_char (*base_string))
11755 --base_string;
11756
11757 if (*base_string != '}')
11758 break;
11759
11760 vop_start = NULL;
11761 }
11762
11763 if (!vop_start)
11764 {
11765 as_bad (_("unbalanced figure braces"));
11766 return 0;
11767 }
11768
f70c6814 11769 if (check_VecOperations (vop_start) == NULL)
43234a1e 11770 return 0;
43234a1e
L
11771 }
11772
47926f60 11773 /* If we only have a displacement, set-up for it to be parsed later. */
af6bdddf
AM
11774 displacement_string_start = op_string;
11775 displacement_string_end = base_string + 1;
252b5132 11776
24eab124
AM
11777 if (*base_string == ')')
11778 {
af6bdddf 11779 char *temp_string;
e87fb6a6
JB
11780 unsigned int parens_not_balanced = 0;
11781 bool in_quotes = false;
e68c3d59 11782
24eab124 11783 /* We've already checked that the number of left & right ()'s are
e87fb6a6
JB
11784 equal, and that there's a matching set of double quotes. */
11785 end_op = base_string;
11786 for (temp_string = op_string; temp_string < end_op; temp_string++)
24eab124 11787 {
e87fb6a6
JB
11788 if (*temp_string == '\\' && temp_string[1] == '"')
11789 ++temp_string;
11790 else if (*temp_string == '"')
11791 in_quotes = !in_quotes;
11792 else if (!in_quotes)
11793 {
11794 if (*temp_string == '(' && !parens_not_balanced++)
11795 base_string = temp_string;
11796 if (*temp_string == ')')
11797 --parens_not_balanced;
11798 }
24eab124 11799 }
c3332e24 11800
af6bdddf 11801 temp_string = base_string;
c3332e24 11802
24eab124 11803 /* Skip past '(' and whitespace. */
e87fb6a6
JB
11804 gas_assert (*base_string == '(');
11805 ++base_string;
252b5132 11806 if (is_space_char (*base_string))
24eab124 11807 ++base_string;
252b5132 11808
af6bdddf 11809 if (*base_string == ','
4eed87de
AM
11810 || ((i.base_reg = parse_register (base_string, &end_op))
11811 != NULL))
252b5132 11812 {
af6bdddf 11813 displacement_string_end = temp_string;
252b5132 11814
40fb9820 11815 i.types[this_operand].bitfield.baseindex = 1;
252b5132 11816
af6bdddf 11817 if (i.base_reg)
24eab124 11818 {
8a6fb3f9
JB
11819 if (i.base_reg == &bad_reg)
11820 return 0;
24eab124
AM
11821 base_string = end_op;
11822 if (is_space_char (*base_string))
11823 ++base_string;
af6bdddf
AM
11824 }
11825
11826 /* There may be an index reg or scale factor here. */
11827 if (*base_string == ',')
11828 {
11829 ++base_string;
11830 if (is_space_char (*base_string))
11831 ++base_string;
11832
4eed87de
AM
11833 if ((i.index_reg = parse_register (base_string, &end_op))
11834 != NULL)
24eab124 11835 {
8a6fb3f9
JB
11836 if (i.index_reg == &bad_reg)
11837 return 0;
af6bdddf 11838 base_string = end_op;
24eab124
AM
11839 if (is_space_char (*base_string))
11840 ++base_string;
af6bdddf
AM
11841 if (*base_string == ',')
11842 {
11843 ++base_string;
11844 if (is_space_char (*base_string))
11845 ++base_string;
11846 }
e5cb08ac 11847 else if (*base_string != ')')
af6bdddf 11848 {
4eed87de
AM
11849 as_bad (_("expecting `,' or `)' "
11850 "after index register in `%s'"),
af6bdddf
AM
11851 operand_string);
11852 return 0;
11853 }
24eab124 11854 }
af6bdddf 11855 else if (*base_string == REGISTER_PREFIX)
24eab124 11856 {
f76bf5e0
L
11857 end_op = strchr (base_string, ',');
11858 if (end_op)
11859 *end_op = '\0';
af6bdddf 11860 as_bad (_("bad register name `%s'"), base_string);
24eab124
AM
11861 return 0;
11862 }
252b5132 11863
47926f60 11864 /* Check for scale factor. */
551c1ca1 11865 if (*base_string != ')')
af6bdddf 11866 {
551c1ca1
AM
11867 char *end_scale = i386_scale (base_string);
11868
11869 if (!end_scale)
af6bdddf 11870 return 0;
24eab124 11871
551c1ca1 11872 base_string = end_scale;
af6bdddf
AM
11873 if (is_space_char (*base_string))
11874 ++base_string;
11875 if (*base_string != ')')
11876 {
4eed87de
AM
11877 as_bad (_("expecting `)' "
11878 "after scale factor in `%s'"),
af6bdddf
AM
11879 operand_string);
11880 return 0;
11881 }
11882 }
11883 else if (!i.index_reg)
24eab124 11884 {
4eed87de
AM
11885 as_bad (_("expecting index register or scale factor "
11886 "after `,'; got '%c'"),
af6bdddf 11887 *base_string);
24eab124
AM
11888 return 0;
11889 }
11890 }
af6bdddf 11891 else if (*base_string != ')')
24eab124 11892 {
4eed87de
AM
11893 as_bad (_("expecting `,' or `)' "
11894 "after base register in `%s'"),
af6bdddf 11895 operand_string);
24eab124
AM
11896 return 0;
11897 }
c3332e24 11898 }
af6bdddf 11899 else if (*base_string == REGISTER_PREFIX)
c3332e24 11900 {
f76bf5e0
L
11901 end_op = strchr (base_string, ',');
11902 if (end_op)
11903 *end_op = '\0';
af6bdddf 11904 as_bad (_("bad register name `%s'"), base_string);
24eab124 11905 return 0;
c3332e24 11906 }
24eab124
AM
11907 }
11908
11909 /* If there's an expression beginning the operand, parse it,
11910 assuming displacement_string_start and
11911 displacement_string_end are meaningful. */
11912 if (displacement_string_start != displacement_string_end)
11913 {
11914 if (!i386_displacement (displacement_string_start,
11915 displacement_string_end))
11916 return 0;
11917 }
11918
11919 /* Special case for (%dx) while doing input/output op. */
11920 if (i.base_reg
75e5731b
JB
11921 && i.base_reg->reg_type.bitfield.instance == RegD
11922 && i.base_reg->reg_type.bitfield.word
24eab124
AM
11923 && i.index_reg == 0
11924 && i.log2_scale_factor == 0
11925 && i.seg[i.mem_operands] == 0
40fb9820 11926 && !operand_type_check (i.types[this_operand], disp))
24eab124 11927 {
2fb5be8d 11928 i.types[this_operand] = i.base_reg->reg_type;
9373f275 11929 i.input_output_operand = true;
24eab124
AM
11930 return 1;
11931 }
11932
eecb386c
AM
11933 if (i386_index_check (operand_string) == 0)
11934 return 0;
c48dadc9 11935 i.flags[this_operand] |= Operand_Mem;
24eab124
AM
11936 i.mem_operands++;
11937 }
11938 else
ce8a8b2f
AM
11939 {
11940 /* It's not a memory operand; argh! */
24eab124
AM
11941 as_bad (_("invalid char %s beginning operand %d `%s'"),
11942 output_invalid (*op_string),
11943 this_operand + 1,
11944 op_string);
11945 return 0;
11946 }
47926f60 11947 return 1; /* Normal return. */
252b5132
RH
11948}
11949\f
fa94de6b
RM
11950/* Calculate the maximum variable size (i.e., excluding fr_fix)
11951 that an rs_machine_dependent frag may reach. */
11952
11953unsigned int
11954i386_frag_max_var (fragS *frag)
11955{
11956 /* The only relaxable frags are for jumps.
11957 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
11958 gas_assert (frag->fr_type == rs_machine_dependent);
11959 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
11960}
11961
b084df0b
L
11962#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11963static int
8dcea932 11964elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
b084df0b
L
11965{
11966 /* STT_GNU_IFUNC symbol must go through PLT. */
11967 if ((symbol_get_bfdsym (fr_symbol)->flags
11968 & BSF_GNU_INDIRECT_FUNCTION) != 0)
11969 return 0;
11970
11971 if (!S_IS_EXTERNAL (fr_symbol))
11972 /* Symbol may be weak or local. */
11973 return !S_IS_WEAK (fr_symbol);
11974
8dcea932
L
11975 /* Global symbols with non-default visibility can't be preempted. */
11976 if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
11977 return 1;
11978
11979 if (fr_var != NO_RELOC)
11980 switch ((enum bfd_reloc_code_real) fr_var)
11981 {
11982 case BFD_RELOC_386_PLT32:
11983 case BFD_RELOC_X86_64_PLT32:
33eaf5de 11984 /* Symbol with PLT relocation may be preempted. */
8dcea932
L
11985 return 0;
11986 default:
11987 abort ();
11988 }
11989
b084df0b
L
11990 /* Global symbols with default visibility in a shared library may be
11991 preempted by another definition. */
8dcea932 11992 return !shared;
b084df0b
L
11993}
11994#endif
11995
79d72f45
HL
11996/* Table 3-2. Macro-Fusible Instructions in Haswell Microarchitecture
11997 Note also work for Skylake and Cascadelake.
11998---------------------------------------------------------------------
11999| JCC | ADD/SUB/CMP | INC/DEC | TEST/AND |
12000| ------ | ----------- | ------- | -------- |
12001| Jo | N | N | Y |
12002| Jno | N | N | Y |
12003| Jc/Jb | Y | N | Y |
12004| Jae/Jnb | Y | N | Y |
12005| Je/Jz | Y | Y | Y |
12006| Jne/Jnz | Y | Y | Y |
12007| Jna/Jbe | Y | N | Y |
12008| Ja/Jnbe | Y | N | Y |
12009| Js | N | N | Y |
12010| Jns | N | N | Y |
12011| Jp/Jpe | N | N | Y |
12012| Jnp/Jpo | N | N | Y |
12013| Jl/Jnge | Y | Y | Y |
12014| Jge/Jnl | Y | Y | Y |
12015| Jle/Jng | Y | Y | Y |
12016| Jg/Jnle | Y | Y | Y |
12017--------------------------------------------------------------------- */
12018static int
12019i386_macro_fusible_p (enum mf_cmp_kind mf_cmp, enum mf_jcc_kind mf_jcc)
12020{
12021 if (mf_cmp == mf_cmp_alu_cmp)
12022 return ((mf_jcc >= mf_jcc_jc && mf_jcc <= mf_jcc_jna)
12023 || mf_jcc == mf_jcc_jl || mf_jcc == mf_jcc_jle);
12024 if (mf_cmp == mf_cmp_incdec)
12025 return (mf_jcc == mf_jcc_je || mf_jcc == mf_jcc_jl
12026 || mf_jcc == mf_jcc_jle);
12027 if (mf_cmp == mf_cmp_test_and)
12028 return 1;
12029 return 0;
12030}
12031
e379e5f3
L
12032/* Return the next non-empty frag. */
12033
12034static fragS *
12035i386_next_non_empty_frag (fragS *fragP)
12036{
12037 /* There may be a frag with a ".fill 0" when there is no room in
12038 the current frag for frag_grow in output_insn. */
12039 for (fragP = fragP->fr_next;
12040 (fragP != NULL
12041 && fragP->fr_type == rs_fill
12042 && fragP->fr_fix == 0);
12043 fragP = fragP->fr_next)
12044 ;
12045 return fragP;
12046}
12047
12048/* Return the next jcc frag after BRANCH_PADDING. */
12049
12050static fragS *
79d72f45 12051i386_next_fusible_jcc_frag (fragS *maybe_cmp_fragP, fragS *pad_fragP)
e379e5f3 12052{
79d72f45
HL
12053 fragS *branch_fragP;
12054 if (!pad_fragP)
e379e5f3
L
12055 return NULL;
12056
79d72f45
HL
12057 if (pad_fragP->fr_type == rs_machine_dependent
12058 && (TYPE_FROM_RELAX_STATE (pad_fragP->fr_subtype)
e379e5f3
L
12059 == BRANCH_PADDING))
12060 {
79d72f45
HL
12061 branch_fragP = i386_next_non_empty_frag (pad_fragP);
12062 if (branch_fragP->fr_type != rs_machine_dependent)
e379e5f3 12063 return NULL;
79d72f45
HL
12064 if (TYPE_FROM_RELAX_STATE (branch_fragP->fr_subtype) == COND_JUMP
12065 && i386_macro_fusible_p (maybe_cmp_fragP->tc_frag_data.mf_type,
12066 pad_fragP->tc_frag_data.mf_type))
12067 return branch_fragP;
e379e5f3
L
12068 }
12069
12070 return NULL;
12071}
12072
12073/* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags. */
12074
12075static void
12076i386_classify_machine_dependent_frag (fragS *fragP)
12077{
12078 fragS *cmp_fragP;
12079 fragS *pad_fragP;
12080 fragS *branch_fragP;
12081 fragS *next_fragP;
12082 unsigned int max_prefix_length;
12083
12084 if (fragP->tc_frag_data.classified)
12085 return;
12086
12087 /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING. Convert
12088 FUSED_JCC_PADDING and merge BRANCH_PADDING. */
12089 for (next_fragP = fragP;
12090 next_fragP != NULL;
12091 next_fragP = next_fragP->fr_next)
12092 {
12093 next_fragP->tc_frag_data.classified = 1;
12094 if (next_fragP->fr_type == rs_machine_dependent)
12095 switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
12096 {
12097 case BRANCH_PADDING:
12098 /* The BRANCH_PADDING frag must be followed by a branch
12099 frag. */
12100 branch_fragP = i386_next_non_empty_frag (next_fragP);
12101 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
12102 break;
12103 case FUSED_JCC_PADDING:
12104 /* Check if this is a fused jcc:
12105 FUSED_JCC_PADDING
12106 CMP like instruction
12107 BRANCH_PADDING
12108 COND_JUMP
12109 */
12110 cmp_fragP = i386_next_non_empty_frag (next_fragP);
12111 pad_fragP = i386_next_non_empty_frag (cmp_fragP);
79d72f45 12112 branch_fragP = i386_next_fusible_jcc_frag (next_fragP, pad_fragP);
e379e5f3
L
12113 if (branch_fragP)
12114 {
12115 /* The BRANCH_PADDING frag is merged with the
12116 FUSED_JCC_PADDING frag. */
12117 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
12118 /* CMP like instruction size. */
12119 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
12120 frag_wane (pad_fragP);
12121 /* Skip to branch_fragP. */
12122 next_fragP = branch_fragP;
12123 }
12124 else if (next_fragP->tc_frag_data.max_prefix_length)
12125 {
12126 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
12127 a fused jcc. */
12128 next_fragP->fr_subtype
12129 = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
12130 next_fragP->tc_frag_data.max_bytes
12131 = next_fragP->tc_frag_data.max_prefix_length;
12132 /* This will be updated in the BRANCH_PREFIX scan. */
12133 next_fragP->tc_frag_data.max_prefix_length = 0;
12134 }
12135 else
12136 frag_wane (next_fragP);
12137 break;
12138 }
12139 }
12140
12141 /* Stop if there is no BRANCH_PREFIX. */
12142 if (!align_branch_prefix_size)
12143 return;
12144
12145 /* Scan for BRANCH_PREFIX. */
12146 for (; fragP != NULL; fragP = fragP->fr_next)
12147 {
12148 if (fragP->fr_type != rs_machine_dependent
12149 || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
12150 != BRANCH_PREFIX))
12151 continue;
12152
12153 /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
12154 COND_JUMP_PREFIX. */
12155 max_prefix_length = 0;
12156 for (next_fragP = fragP;
12157 next_fragP != NULL;
12158 next_fragP = next_fragP->fr_next)
12159 {
12160 if (next_fragP->fr_type == rs_fill)
12161 /* Skip rs_fill frags. */
12162 continue;
12163 else if (next_fragP->fr_type != rs_machine_dependent)
12164 /* Stop for all other frags. */
12165 break;
12166
12167 /* rs_machine_dependent frags. */
12168 if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
12169 == BRANCH_PREFIX)
12170 {
12171 /* Count BRANCH_PREFIX frags. */
12172 if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
12173 {
12174 max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
12175 frag_wane (next_fragP);
12176 }
12177 else
12178 max_prefix_length
12179 += next_fragP->tc_frag_data.max_bytes;
12180 }
12181 else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
12182 == BRANCH_PADDING)
12183 || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
12184 == FUSED_JCC_PADDING))
12185 {
12186 /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING. */
12187 fragP->tc_frag_data.u.padding_fragP = next_fragP;
12188 break;
12189 }
12190 else
12191 /* Stop for other rs_machine_dependent frags. */
12192 break;
12193 }
12194
12195 fragP->tc_frag_data.max_prefix_length = max_prefix_length;
12196
12197 /* Skip to the next frag. */
12198 fragP = next_fragP;
12199 }
12200}
12201
12202/* Compute padding size for
12203
12204 FUSED_JCC_PADDING
12205 CMP like instruction
12206 BRANCH_PADDING
12207 COND_JUMP/UNCOND_JUMP
12208
12209 or
12210
12211 BRANCH_PADDING
12212 COND_JUMP/UNCOND_JUMP
12213 */
12214
12215static int
12216i386_branch_padding_size (fragS *fragP, offsetT address)
12217{
12218 unsigned int offset, size, padding_size;
12219 fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
12220
12221 /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag. */
12222 if (!address)
12223 address = fragP->fr_address;
12224 address += fragP->fr_fix;
12225
12226 /* CMP like instrunction size. */
12227 size = fragP->tc_frag_data.cmp_size;
12228
12229 /* The base size of the branch frag. */
12230 size += branch_fragP->fr_fix;
12231
12232 /* Add opcode and displacement bytes for the rs_machine_dependent
12233 branch frag. */
12234 if (branch_fragP->fr_type == rs_machine_dependent)
12235 size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
12236
12237 /* Check if branch is within boundary and doesn't end at the last
12238 byte. */
12239 offset = address & ((1U << align_branch_power) - 1);
12240 if ((offset + size) >= (1U << align_branch_power))
12241 /* Padding needed to avoid crossing boundary. */
12242 padding_size = (1U << align_branch_power) - offset;
12243 else
12244 /* No padding needed. */
12245 padding_size = 0;
12246
12247 /* The return value may be saved in tc_frag_data.length which is
12248 unsigned byte. */
12249 if (!fits_in_unsigned_byte (padding_size))
12250 abort ();
12251
12252 return padding_size;
12253}
12254
12255/* i386_generic_table_relax_frag()
12256
12257 Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
12258 grow/shrink padding to align branch frags. Hand others to
12259 relax_frag(). */
12260
12261long
12262i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
12263{
12264 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12265 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
12266 {
12267 long padding_size = i386_branch_padding_size (fragP, 0);
12268 long grow = padding_size - fragP->tc_frag_data.length;
12269
12270 /* When the BRANCH_PREFIX frag is used, the computed address
12271 must match the actual address and there should be no padding. */
12272 if (fragP->tc_frag_data.padding_address
12273 && (fragP->tc_frag_data.padding_address != fragP->fr_address
12274 || padding_size))
12275 abort ();
12276
12277 /* Update the padding size. */
12278 if (grow)
12279 fragP->tc_frag_data.length = padding_size;
12280
12281 return grow;
12282 }
12283 else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12284 {
12285 fragS *padding_fragP, *next_fragP;
12286 long padding_size, left_size, last_size;
12287
12288 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
12289 if (!padding_fragP)
12290 /* Use the padding set by the leading BRANCH_PREFIX frag. */
12291 return (fragP->tc_frag_data.length
12292 - fragP->tc_frag_data.last_length);
12293
12294 /* Compute the relative address of the padding frag in the very
12295 first time where the BRANCH_PREFIX frag sizes are zero. */
12296 if (!fragP->tc_frag_data.padding_address)
12297 fragP->tc_frag_data.padding_address
12298 = padding_fragP->fr_address - (fragP->fr_address - stretch);
12299
12300 /* First update the last length from the previous interation. */
12301 left_size = fragP->tc_frag_data.prefix_length;
12302 for (next_fragP = fragP;
12303 next_fragP != padding_fragP;
12304 next_fragP = next_fragP->fr_next)
12305 if (next_fragP->fr_type == rs_machine_dependent
12306 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
12307 == BRANCH_PREFIX))
12308 {
12309 if (left_size)
12310 {
12311 int max = next_fragP->tc_frag_data.max_bytes;
12312 if (max)
12313 {
12314 int size;
12315 if (max > left_size)
12316 size = left_size;
12317 else
12318 size = max;
12319 left_size -= size;
12320 next_fragP->tc_frag_data.last_length = size;
12321 }
12322 }
12323 else
12324 next_fragP->tc_frag_data.last_length = 0;
12325 }
12326
12327 /* Check the padding size for the padding frag. */
12328 padding_size = i386_branch_padding_size
12329 (padding_fragP, (fragP->fr_address
12330 + fragP->tc_frag_data.padding_address));
12331
12332 last_size = fragP->tc_frag_data.prefix_length;
12333 /* Check if there is change from the last interation. */
12334 if (padding_size == last_size)
12335 {
12336 /* Update the expected address of the padding frag. */
12337 padding_fragP->tc_frag_data.padding_address
12338 = (fragP->fr_address + padding_size
12339 + fragP->tc_frag_data.padding_address);
12340 return 0;
12341 }
12342
12343 if (padding_size > fragP->tc_frag_data.max_prefix_length)
12344 {
12345 /* No padding if there is no sufficient room. Clear the
12346 expected address of the padding frag. */
12347 padding_fragP->tc_frag_data.padding_address = 0;
12348 padding_size = 0;
12349 }
12350 else
12351 /* Store the expected address of the padding frag. */
12352 padding_fragP->tc_frag_data.padding_address
12353 = (fragP->fr_address + padding_size
12354 + fragP->tc_frag_data.padding_address);
12355
12356 fragP->tc_frag_data.prefix_length = padding_size;
12357
12358 /* Update the length for the current interation. */
12359 left_size = padding_size;
12360 for (next_fragP = fragP;
12361 next_fragP != padding_fragP;
12362 next_fragP = next_fragP->fr_next)
12363 if (next_fragP->fr_type == rs_machine_dependent
12364 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
12365 == BRANCH_PREFIX))
12366 {
12367 if (left_size)
12368 {
12369 int max = next_fragP->tc_frag_data.max_bytes;
12370 if (max)
12371 {
12372 int size;
12373 if (max > left_size)
12374 size = left_size;
12375 else
12376 size = max;
12377 left_size -= size;
12378 next_fragP->tc_frag_data.length = size;
12379 }
12380 }
12381 else
12382 next_fragP->tc_frag_data.length = 0;
12383 }
12384
12385 return (fragP->tc_frag_data.length
12386 - fragP->tc_frag_data.last_length);
12387 }
12388 return relax_frag (segment, fragP, stretch);
12389}
12390
ee7fcc42
AM
12391/* md_estimate_size_before_relax()
12392
12393 Called just before relax() for rs_machine_dependent frags. The x86
12394 assembler uses these frags to handle variable size jump
12395 instructions.
12396
12397 Any symbol that is now undefined will not become defined.
12398 Return the correct fr_subtype in the frag.
12399 Return the initial "guess for variable size of frag" to caller.
12400 The guess is actually the growth beyond the fixed part. Whatever
12401 we do to grow the fixed or variable part contributes to our
12402 returned value. */
12403
252b5132 12404int
7016a5d5 12405md_estimate_size_before_relax (fragS *fragP, segT segment)
252b5132 12406{
e379e5f3
L
12407 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12408 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
12409 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
12410 {
12411 i386_classify_machine_dependent_frag (fragP);
12412 return fragP->tc_frag_data.length;
12413 }
12414
252b5132 12415 /* We've already got fragP->fr_subtype right; all we have to do is
b98ef147
AM
12416 check for un-relaxable symbols. On an ELF system, we can't relax
12417 an externally visible symbol, because it may be overridden by a
12418 shared library. */
12419 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
6d249963 12420#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
718ddfc0 12421 || (IS_ELF
8dcea932
L
12422 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
12423 fragP->fr_var))
fbeb56a4
DK
12424#endif
12425#if defined (OBJ_COFF) && defined (TE_PE)
7ab9ffdd 12426 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
fbeb56a4 12427 && S_IS_WEAK (fragP->fr_symbol))
b98ef147
AM
12428#endif
12429 )
252b5132 12430 {
b98ef147
AM
12431 /* Symbol is undefined in this segment, or we need to keep a
12432 reloc so that weak symbols can be overridden. */
12433 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
f86103b7 12434 enum bfd_reloc_code_real reloc_type;
ee7fcc42
AM
12435 unsigned char *opcode;
12436 int old_fr_fix;
eb19308f 12437 fixS *fixP = NULL;
f6af82bd 12438
ee7fcc42 12439 if (fragP->fr_var != NO_RELOC)
1e9cc1c2 12440 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
b98ef147 12441 else if (size == 2)
f6af82bd 12442 reloc_type = BFD_RELOC_16_PCREL;
bd7ab16b 12443#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1ef3994a
JB
12444 else if (fragP->tc_frag_data.code64 && fragP->fr_offset == 0
12445 && need_plt32_p (fragP->fr_symbol))
bd7ab16b
L
12446 reloc_type = BFD_RELOC_X86_64_PLT32;
12447#endif
f6af82bd
AM
12448 else
12449 reloc_type = BFD_RELOC_32_PCREL;
252b5132 12450
ee7fcc42
AM
12451 old_fr_fix = fragP->fr_fix;
12452 opcode = (unsigned char *) fragP->fr_opcode;
12453
fddf5b5b 12454 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
252b5132 12455 {
fddf5b5b
AM
12456 case UNCOND_JUMP:
12457 /* Make jmp (0xeb) a (d)word displacement jump. */
47926f60 12458 opcode[0] = 0xe9;
252b5132 12459 fragP->fr_fix += size;
eb19308f
JB
12460 fixP = fix_new (fragP, old_fr_fix, size,
12461 fragP->fr_symbol,
12462 fragP->fr_offset, 1,
12463 reloc_type);
252b5132
RH
12464 break;
12465
fddf5b5b 12466 case COND_JUMP86:
412167cb
AM
12467 if (size == 2
12468 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
fddf5b5b
AM
12469 {
12470 /* Negate the condition, and branch past an
12471 unconditional jump. */
12472 opcode[0] ^= 1;
12473 opcode[1] = 3;
12474 /* Insert an unconditional jump. */
12475 opcode[2] = 0xe9;
12476 /* We added two extra opcode bytes, and have a two byte
12477 offset. */
12478 fragP->fr_fix += 2 + 2;
062cd5e7
AS
12479 fix_new (fragP, old_fr_fix + 2, 2,
12480 fragP->fr_symbol,
12481 fragP->fr_offset, 1,
12482 reloc_type);
fddf5b5b
AM
12483 break;
12484 }
12485 /* Fall through. */
12486
12487 case COND_JUMP:
412167cb
AM
12488 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
12489 {
12490 fragP->fr_fix += 1;
3e02c1cc
AM
12491 fixP = fix_new (fragP, old_fr_fix, 1,
12492 fragP->fr_symbol,
12493 fragP->fr_offset, 1,
12494 BFD_RELOC_8_PCREL);
12495 fixP->fx_signed = 1;
412167cb
AM
12496 break;
12497 }
93c2a809 12498
24eab124 12499 /* This changes the byte-displacement jump 0x7N
fddf5b5b 12500 to the (d)word-displacement jump 0x0f,0x8N. */
252b5132 12501 opcode[1] = opcode[0] + 0x10;
f6af82bd 12502 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
47926f60
KH
12503 /* We've added an opcode byte. */
12504 fragP->fr_fix += 1 + size;
eb19308f
JB
12505 fixP = fix_new (fragP, old_fr_fix + 1, size,
12506 fragP->fr_symbol,
12507 fragP->fr_offset, 1,
12508 reloc_type);
252b5132 12509 break;
fddf5b5b
AM
12510
12511 default:
12512 BAD_CASE (fragP->fr_subtype);
12513 break;
252b5132 12514 }
eb19308f
JB
12515
12516 /* All jumps handled here are signed, but don't unconditionally use a
12517 signed limit check for 32 and 16 bit jumps as we want to allow wrap
12518 around at 4G (outside of 64-bit mode) and 64k. */
12519 if (size == 4 && flag_code == CODE_64BIT)
12520 fixP->fx_signed = 1;
12521
252b5132 12522 frag_wane (fragP);
ee7fcc42 12523 return fragP->fr_fix - old_fr_fix;
252b5132 12524 }
93c2a809 12525
93c2a809
AM
12526 /* Guess size depending on current relax state. Initially the relax
12527 state will correspond to a short jump and we return 1, because
12528 the variable part of the frag (the branch offset) is one byte
12529 long. However, we can relax a section more than once and in that
12530 case we must either set fr_subtype back to the unrelaxed state,
12531 or return the value for the appropriate branch. */
12532 return md_relax_table[fragP->fr_subtype].rlx_length;
ee7fcc42
AM
12533}
12534
47926f60
KH
12535/* Called after relax() is finished.
12536
12537 In: Address of frag.
12538 fr_type == rs_machine_dependent.
12539 fr_subtype is what the address relaxed to.
12540
12541 Out: Any fixSs and constants are set up.
12542 Caller will turn frag into a ".space 0". */
12543
252b5132 12544void
7016a5d5
TG
12545md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
12546 fragS *fragP)
252b5132 12547{
29b0f896 12548 unsigned char *opcode;
252b5132 12549 unsigned char *where_to_put_displacement = NULL;
847f7ad4
AM
12550 offsetT target_address;
12551 offsetT opcode_address;
252b5132 12552 unsigned int extension = 0;
847f7ad4 12553 offsetT displacement_from_opcode_start;
252b5132 12554
e379e5f3
L
12555 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12556 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
12557 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12558 {
12559 /* Generate nop padding. */
12560 unsigned int size = fragP->tc_frag_data.length;
12561 if (size)
12562 {
12563 if (size > fragP->tc_frag_data.max_bytes)
12564 abort ();
12565
12566 if (flag_debug)
12567 {
12568 const char *msg;
12569 const char *branch = "branch";
12570 const char *prefix = "";
12571 fragS *padding_fragP;
12572 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
12573 == BRANCH_PREFIX)
12574 {
12575 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
12576 switch (fragP->tc_frag_data.default_prefix)
12577 {
12578 default:
12579 abort ();
12580 break;
12581 case CS_PREFIX_OPCODE:
12582 prefix = " cs";
12583 break;
12584 case DS_PREFIX_OPCODE:
12585 prefix = " ds";
12586 break;
12587 case ES_PREFIX_OPCODE:
12588 prefix = " es";
12589 break;
12590 case FS_PREFIX_OPCODE:
12591 prefix = " fs";
12592 break;
12593 case GS_PREFIX_OPCODE:
12594 prefix = " gs";
12595 break;
12596 case SS_PREFIX_OPCODE:
12597 prefix = " ss";
12598 break;
12599 }
12600 if (padding_fragP)
12601 msg = _("%s:%u: add %d%s at 0x%llx to align "
12602 "%s within %d-byte boundary\n");
12603 else
12604 msg = _("%s:%u: add additional %d%s at 0x%llx to "
12605 "align %s within %d-byte boundary\n");
12606 }
12607 else
12608 {
12609 padding_fragP = fragP;
12610 msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
12611 "%s within %d-byte boundary\n");
12612 }
12613
12614 if (padding_fragP)
12615 switch (padding_fragP->tc_frag_data.branch_type)
12616 {
12617 case align_branch_jcc:
12618 branch = "jcc";
12619 break;
12620 case align_branch_fused:
12621 branch = "fused jcc";
12622 break;
12623 case align_branch_jmp:
12624 branch = "jmp";
12625 break;
12626 case align_branch_call:
12627 branch = "call";
12628 break;
12629 case align_branch_indirect:
12630 branch = "indiret branch";
12631 break;
12632 case align_branch_ret:
12633 branch = "ret";
12634 break;
12635 default:
12636 break;
12637 }
12638
12639 fprintf (stdout, msg,
12640 fragP->fr_file, fragP->fr_line, size, prefix,
12641 (long long) fragP->fr_address, branch,
12642 1 << align_branch_power);
12643 }
12644 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12645 memset (fragP->fr_opcode,
12646 fragP->tc_frag_data.default_prefix, size);
12647 else
12648 i386_generate_nops (fragP, (char *) fragP->fr_opcode,
12649 size, 0);
12650 fragP->fr_fix += size;
12651 }
12652 return;
12653 }
12654
252b5132
RH
12655 opcode = (unsigned char *) fragP->fr_opcode;
12656
47926f60 12657 /* Address we want to reach in file space. */
252b5132 12658 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
252b5132 12659
47926f60 12660 /* Address opcode resides at in file space. */
252b5132
RH
12661 opcode_address = fragP->fr_address + fragP->fr_fix;
12662
47926f60 12663 /* Displacement from opcode start to fill into instruction. */
252b5132
RH
12664 displacement_from_opcode_start = target_address - opcode_address;
12665
fddf5b5b 12666 if ((fragP->fr_subtype & BIG) == 0)
252b5132 12667 {
47926f60
KH
12668 /* Don't have to change opcode. */
12669 extension = 1; /* 1 opcode + 1 displacement */
252b5132 12670 where_to_put_displacement = &opcode[1];
fddf5b5b
AM
12671 }
12672 else
12673 {
12674 if (no_cond_jump_promotion
12675 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
4eed87de
AM
12676 as_warn_where (fragP->fr_file, fragP->fr_line,
12677 _("long jump required"));
252b5132 12678
fddf5b5b
AM
12679 switch (fragP->fr_subtype)
12680 {
12681 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
12682 extension = 4; /* 1 opcode + 4 displacement */
12683 opcode[0] = 0xe9;
12684 where_to_put_displacement = &opcode[1];
12685 break;
252b5132 12686
fddf5b5b
AM
12687 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
12688 extension = 2; /* 1 opcode + 2 displacement */
12689 opcode[0] = 0xe9;
12690 where_to_put_displacement = &opcode[1];
12691 break;
252b5132 12692
fddf5b5b
AM
12693 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
12694 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
12695 extension = 5; /* 2 opcode + 4 displacement */
12696 opcode[1] = opcode[0] + 0x10;
12697 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12698 where_to_put_displacement = &opcode[2];
12699 break;
252b5132 12700
fddf5b5b
AM
12701 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
12702 extension = 3; /* 2 opcode + 2 displacement */
12703 opcode[1] = opcode[0] + 0x10;
12704 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12705 where_to_put_displacement = &opcode[2];
12706 break;
252b5132 12707
fddf5b5b
AM
12708 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
12709 extension = 4;
12710 opcode[0] ^= 1;
12711 opcode[1] = 3;
12712 opcode[2] = 0xe9;
12713 where_to_put_displacement = &opcode[3];
12714 break;
12715
12716 default:
12717 BAD_CASE (fragP->fr_subtype);
12718 break;
12719 }
252b5132 12720 }
fddf5b5b 12721
7b81dfbb
AJ
12722 /* If size if less then four we are sure that the operand fits,
12723 but if it's 4, then it could be that the displacement is larger
12724 then -/+ 2GB. */
12725 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
12726 && object_64bit
12727 && ((addressT) (displacement_from_opcode_start - extension
4eed87de
AM
12728 + ((addressT) 1 << 31))
12729 > (((addressT) 2 << 31) - 1)))
7b81dfbb
AJ
12730 {
12731 as_bad_where (fragP->fr_file, fragP->fr_line,
12732 _("jump target out of range"));
12733 /* Make us emit 0. */
12734 displacement_from_opcode_start = extension;
12735 }
47926f60 12736 /* Now put displacement after opcode. */
252b5132
RH
12737 md_number_to_chars ((char *) where_to_put_displacement,
12738 (valueT) (displacement_from_opcode_start - extension),
fddf5b5b 12739 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
252b5132
RH
12740 fragP->fr_fix += extension;
12741}
12742\f
7016a5d5 12743/* Apply a fixup (fixP) to segment data, once it has been determined
252b5132
RH
12744 by our caller that we have all the info we need to fix it up.
12745
7016a5d5
TG
12746 Parameter valP is the pointer to the value of the bits.
12747
252b5132
RH
12748 On the 386, immediates, displacements, and data pointers are all in
12749 the same (little-endian) format, so we don't need to care about which
12750 we are handling. */
12751
94f592af 12752void
7016a5d5 12753md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
252b5132 12754{
94f592af 12755 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
c6682705 12756 valueT value = *valP;
252b5132 12757
f86103b7 12758#if !defined (TE_Mach)
93382f6d
AM
12759 if (fixP->fx_pcrel)
12760 {
12761 switch (fixP->fx_r_type)
12762 {
5865bb77
ILT
12763 default:
12764 break;
12765
d6ab8113
JB
12766 case BFD_RELOC_64:
12767 fixP->fx_r_type = BFD_RELOC_64_PCREL;
12768 break;
93382f6d 12769 case BFD_RELOC_32:
ae8887b5 12770 case BFD_RELOC_X86_64_32S:
93382f6d
AM
12771 fixP->fx_r_type = BFD_RELOC_32_PCREL;
12772 break;
12773 case BFD_RELOC_16:
12774 fixP->fx_r_type = BFD_RELOC_16_PCREL;
12775 break;
12776 case BFD_RELOC_8:
12777 fixP->fx_r_type = BFD_RELOC_8_PCREL;
12778 break;
12779 }
12780 }
252b5132 12781
a161fe53 12782 if (fixP->fx_addsy != NULL
31312f95 12783 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
d6ab8113 12784 || fixP->fx_r_type == BFD_RELOC_64_PCREL
31312f95 12785 || fixP->fx_r_type == BFD_RELOC_16_PCREL
d258b828 12786 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
31312f95 12787 && !use_rela_relocations)
252b5132 12788 {
31312f95
AM
12789 /* This is a hack. There should be a better way to handle this.
12790 This covers for the fact that bfd_install_relocation will
12791 subtract the current location (for partial_inplace, PC relative
12792 relocations); see more below. */
252b5132 12793#ifndef OBJ_AOUT
718ddfc0 12794 if (IS_ELF
252b5132
RH
12795#ifdef TE_PE
12796 || OUTPUT_FLAVOR == bfd_target_coff_flavour
12797#endif
12798 )
12799 value += fixP->fx_where + fixP->fx_frag->fr_address;
12800#endif
12801#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
718ddfc0 12802 if (IS_ELF)
252b5132 12803 {
6539b54b 12804 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
2f66722d 12805
6539b54b 12806 if ((sym_seg == seg
2f66722d 12807 || (symbol_section_p (fixP->fx_addsy)
6539b54b 12808 && sym_seg != absolute_section))
af65af87 12809 && !generic_force_reloc (fixP))
2f66722d
AM
12810 {
12811 /* Yes, we add the values in twice. This is because
6539b54b
AM
12812 bfd_install_relocation subtracts them out again. I think
12813 bfd_install_relocation is broken, but I don't dare change
2f66722d
AM
12814 it. FIXME. */
12815 value += fixP->fx_where + fixP->fx_frag->fr_address;
12816 }
252b5132
RH
12817 }
12818#endif
12819#if defined (OBJ_COFF) && defined (TE_PE)
977cdf5a
NC
12820 /* For some reason, the PE format does not store a
12821 section address offset for a PC relative symbol. */
12822 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
7be1c489 12823 || S_IS_WEAK (fixP->fx_addsy))
252b5132
RH
12824 value += md_pcrel_from (fixP);
12825#endif
12826 }
fbeb56a4 12827#if defined (OBJ_COFF) && defined (TE_PE)
f01c1a09
NC
12828 if (fixP->fx_addsy != NULL
12829 && S_IS_WEAK (fixP->fx_addsy)
12830 /* PR 16858: Do not modify weak function references. */
12831 && ! fixP->fx_pcrel)
fbeb56a4 12832 {
296a8689
NC
12833#if !defined (TE_PEP)
12834 /* For x86 PE weak function symbols are neither PC-relative
12835 nor do they set S_IS_FUNCTION. So the only reliable way
12836 to detect them is to check the flags of their containing
12837 section. */
12838 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
12839 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
12840 ;
12841 else
12842#endif
fbeb56a4
DK
12843 value -= S_GET_VALUE (fixP->fx_addsy);
12844 }
12845#endif
252b5132
RH
12846
12847 /* Fix a few things - the dynamic linker expects certain values here,
0234cb7c 12848 and we must not disappoint it. */
252b5132 12849#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
718ddfc0 12850 if (IS_ELF && fixP->fx_addsy)
47926f60
KH
12851 switch (fixP->fx_r_type)
12852 {
12853 case BFD_RELOC_386_PLT32:
3e73aa7c 12854 case BFD_RELOC_X86_64_PLT32:
b9519cfe
L
12855 /* Make the jump instruction point to the address of the operand.
12856 At runtime we merely add the offset to the actual PLT entry.
12857 NB: Subtract the offset size only for jump instructions. */
12858 if (fixP->fx_pcrel)
12859 value = -4;
47926f60 12860 break;
31312f95 12861
13ae64f3
JJ
12862 case BFD_RELOC_386_TLS_GD:
12863 case BFD_RELOC_386_TLS_LDM:
13ae64f3 12864 case BFD_RELOC_386_TLS_IE_32:
37e55690
JJ
12865 case BFD_RELOC_386_TLS_IE:
12866 case BFD_RELOC_386_TLS_GOTIE:
67a4f2b7 12867 case BFD_RELOC_386_TLS_GOTDESC:
bffbf940
JJ
12868 case BFD_RELOC_X86_64_TLSGD:
12869 case BFD_RELOC_X86_64_TLSLD:
12870 case BFD_RELOC_X86_64_GOTTPOFF:
67a4f2b7 12871 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
00f7efb6
JJ
12872 value = 0; /* Fully resolved at runtime. No addend. */
12873 /* Fallthrough */
12874 case BFD_RELOC_386_TLS_LE:
12875 case BFD_RELOC_386_TLS_LDO_32:
12876 case BFD_RELOC_386_TLS_LE_32:
12877 case BFD_RELOC_X86_64_DTPOFF32:
d6ab8113 12878 case BFD_RELOC_X86_64_DTPOFF64:
00f7efb6 12879 case BFD_RELOC_X86_64_TPOFF32:
d6ab8113 12880 case BFD_RELOC_X86_64_TPOFF64:
00f7efb6
JJ
12881 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12882 break;
12883
67a4f2b7
AO
12884 case BFD_RELOC_386_TLS_DESC_CALL:
12885 case BFD_RELOC_X86_64_TLSDESC_CALL:
12886 value = 0; /* Fully resolved at runtime. No addend. */
12887 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12888 fixP->fx_done = 0;
12889 return;
12890
47926f60
KH
12891 case BFD_RELOC_VTABLE_INHERIT:
12892 case BFD_RELOC_VTABLE_ENTRY:
12893 fixP->fx_done = 0;
94f592af 12894 return;
47926f60
KH
12895
12896 default:
12897 break;
12898 }
12899#endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
a442cac5
JB
12900
12901 /* If not 64bit, massage value, to account for wraparound when !BFD64. */
12902 if (!object_64bit)
12903 value = extend_to_32bit_address (value);
12904
c6682705 12905 *valP = value;
f86103b7 12906#endif /* !defined (TE_Mach) */
3e73aa7c 12907
3e73aa7c 12908 /* Are we finished with this relocation now? */
c6682705 12909 if (fixP->fx_addsy == NULL)
b8188555
JB
12910 {
12911 fixP->fx_done = 1;
12912 switch (fixP->fx_r_type)
12913 {
12914 case BFD_RELOC_X86_64_32S:
12915 fixP->fx_signed = 1;
12916 break;
12917
12918 default:
12919 break;
12920 }
12921 }
fbeb56a4
DK
12922#if defined (OBJ_COFF) && defined (TE_PE)
12923 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
12924 {
12925 fixP->fx_done = 0;
12926 /* Remember value for tc_gen_reloc. */
12927 fixP->fx_addnumber = value;
12928 /* Clear out the frag for now. */
12929 value = 0;
12930 }
12931#endif
3e73aa7c
JH
12932 else if (use_rela_relocations)
12933 {
46fb6d5a
JB
12934 if (!disallow_64bit_reloc || fixP->fx_r_type == NO_RELOC)
12935 fixP->fx_no_overflow = 1;
062cd5e7
AS
12936 /* Remember value for tc_gen_reloc. */
12937 fixP->fx_addnumber = value;
3e73aa7c
JH
12938 value = 0;
12939 }
f86103b7 12940
94f592af 12941 md_number_to_chars (p, value, fixP->fx_size);
252b5132 12942}
252b5132 12943\f
6d4af3c2 12944const char *
499ac353 12945md_atof (int type, char *litP, int *sizeP)
252b5132 12946{
499ac353
NC
12947 /* This outputs the LITTLENUMs in REVERSE order;
12948 in accord with the bigendian 386. */
5b7c81bd 12949 return ieee_md_atof (type, litP, sizeP, false);
252b5132
RH
12950}
12951\f
2d545b82 12952static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
252b5132 12953
252b5132 12954static char *
e3bb37b5 12955output_invalid (int c)
252b5132 12956{
3882b010 12957 if (ISPRINT (c))
f9f21a03
L
12958 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12959 "'%c'", c);
252b5132 12960 else
f9f21a03 12961 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
2d545b82 12962 "(0x%x)", (unsigned char) c);
252b5132
RH
12963 return output_invalid_buf;
12964}
12965
8a6fb3f9
JB
12966/* Verify that @r can be used in the current context. */
12967
5b7c81bd 12968static bool check_register (const reg_entry *r)
8a6fb3f9
JB
12969{
12970 if (allow_pseudo_reg)
5b7c81bd 12971 return true;
8a6fb3f9
JB
12972
12973 if (operand_type_all_zero (&r->reg_type))
5b7c81bd 12974 return false;
8a6fb3f9
JB
12975
12976 if ((r->reg_type.bitfield.dword
12977 || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
12978 || r->reg_type.bitfield.class == RegCR
22e00a3f 12979 || r->reg_type.bitfield.class == RegDR)
8a6fb3f9 12980 && !cpu_arch_flags.bitfield.cpui386)
5b7c81bd 12981 return false;
8a6fb3f9 12982
22e00a3f
JB
12983 if (r->reg_type.bitfield.class == RegTR
12984 && (flag_code == CODE_64BIT
12985 || !cpu_arch_flags.bitfield.cpui386
12986 || cpu_arch_isa_flags.bitfield.cpui586
12987 || cpu_arch_isa_flags.bitfield.cpui686))
5b7c81bd 12988 return false;
22e00a3f 12989
8a6fb3f9 12990 if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
5b7c81bd 12991 return false;
8a6fb3f9
JB
12992
12993 if (!cpu_arch_flags.bitfield.cpuavx512f)
12994 {
12995 if (r->reg_type.bitfield.zmmword
12996 || r->reg_type.bitfield.class == RegMask)
5b7c81bd 12997 return false;
8a6fb3f9
JB
12998
12999 if (!cpu_arch_flags.bitfield.cpuavx)
13000 {
13001 if (r->reg_type.bitfield.ymmword)
5b7c81bd 13002 return false;
8a6fb3f9
JB
13003
13004 if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
5b7c81bd 13005 return false;
8a6fb3f9
JB
13006 }
13007 }
13008
260cd341
LC
13009 if (r->reg_type.bitfield.tmmword
13010 && (!cpu_arch_flags.bitfield.cpuamx_tile
13011 || flag_code != CODE_64BIT))
5b7c81bd 13012 return false;
260cd341 13013
8a6fb3f9 13014 if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
5b7c81bd 13015 return false;
8a6fb3f9
JB
13016
13017 /* Don't allow fake index register unless allow_index_reg isn't 0. */
13018 if (!allow_index_reg && r->reg_num == RegIZ)
5b7c81bd 13019 return false;
8a6fb3f9
JB
13020
13021 /* Upper 16 vector registers are only available with VREX in 64bit
13022 mode, and require EVEX encoding. */
13023 if (r->reg_flags & RegVRex)
13024 {
13025 if (!cpu_arch_flags.bitfield.cpuavx512f
13026 || flag_code != CODE_64BIT)
5b7c81bd 13027 return false;
8a6fb3f9 13028
da4977e0
JB
13029 if (i.vec_encoding == vex_encoding_default)
13030 i.vec_encoding = vex_encoding_evex;
13031 else if (i.vec_encoding != vex_encoding_evex)
13032 i.vec_encoding = vex_encoding_error;
8a6fb3f9
JB
13033 }
13034
13035 if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
13036 && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
13037 && flag_code != CODE_64BIT)
5b7c81bd 13038 return false;
8a6fb3f9
JB
13039
13040 if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
13041 && !intel_syntax)
5b7c81bd 13042 return false;
8a6fb3f9 13043
5b7c81bd 13044 return true;
8a6fb3f9
JB
13045}
13046
af6bdddf 13047/* REG_STRING starts *before* REGISTER_PREFIX. */
252b5132
RH
13048
13049static const reg_entry *
4d1bb795 13050parse_real_register (char *reg_string, char **end_op)
252b5132 13051{
af6bdddf
AM
13052 char *s = reg_string;
13053 char *p;
252b5132
RH
13054 char reg_name_given[MAX_REG_NAME_SIZE + 1];
13055 const reg_entry *r;
13056
13057 /* Skip possible REGISTER_PREFIX and possible whitespace. */
13058 if (*s == REGISTER_PREFIX)
13059 ++s;
13060
13061 if (is_space_char (*s))
13062 ++s;
13063
13064 p = reg_name_given;
af6bdddf 13065 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
252b5132
RH
13066 {
13067 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
af6bdddf
AM
13068 return (const reg_entry *) NULL;
13069 s++;
252b5132
RH
13070 }
13071
6588847e
DN
13072 /* For naked regs, make sure that we are not dealing with an identifier.
13073 This prevents confusing an identifier like `eax_var' with register
13074 `eax'. */
13075 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
13076 return (const reg_entry *) NULL;
13077
af6bdddf 13078 *end_op = s;
252b5132 13079
629310ab 13080 r = (const reg_entry *) str_hash_find (reg_hash, reg_name_given);
252b5132 13081
5f47d35b 13082 /* Handle floating point regs, allowing spaces in the (i) part. */
6288d05f 13083 if (r == reg_st0)
5f47d35b 13084 {
0e0eea78
JB
13085 if (!cpu_arch_flags.bitfield.cpu8087
13086 && !cpu_arch_flags.bitfield.cpu287
af32b722
JB
13087 && !cpu_arch_flags.bitfield.cpu387
13088 && !allow_pseudo_reg)
0e0eea78
JB
13089 return (const reg_entry *) NULL;
13090
5f47d35b
AM
13091 if (is_space_char (*s))
13092 ++s;
13093 if (*s == '(')
13094 {
af6bdddf 13095 ++s;
5f47d35b
AM
13096 if (is_space_char (*s))
13097 ++s;
13098 if (*s >= '0' && *s <= '7')
13099 {
db557034 13100 int fpr = *s - '0';
af6bdddf 13101 ++s;
5f47d35b
AM
13102 if (is_space_char (*s))
13103 ++s;
13104 if (*s == ')')
13105 {
13106 *end_op = s + 1;
6288d05f 13107 know (r[fpr].reg_num == fpr);
db557034 13108 return r + fpr;
5f47d35b 13109 }
5f47d35b 13110 }
47926f60 13111 /* We have "%st(" then garbage. */
5f47d35b
AM
13112 return (const reg_entry *) NULL;
13113 }
13114 }
13115
8a6fb3f9 13116 return r && check_register (r) ? r : NULL;
252b5132 13117}
4d1bb795
JB
13118
13119/* REG_STRING starts *before* REGISTER_PREFIX. */
13120
13121static const reg_entry *
13122parse_register (char *reg_string, char **end_op)
13123{
13124 const reg_entry *r;
13125
13126 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
13127 r = parse_real_register (reg_string, end_op);
13128 else
13129 r = NULL;
13130 if (!r)
13131 {
13132 char *save = input_line_pointer;
13133 char c;
13134 symbolS *symbolP;
13135
13136 input_line_pointer = reg_string;
d02603dc 13137 c = get_symbol_name (&reg_string);
4d1bb795 13138 symbolP = symbol_find (reg_string);
64d23078
JB
13139 while (symbolP && S_GET_SEGMENT (symbolP) != reg_section)
13140 {
13141 const expressionS *e = symbol_get_value_expression(symbolP);
13142
13143 if (e->X_op != O_symbol || e->X_add_number)
13144 break;
13145 symbolP = e->X_add_symbol;
13146 }
4d1bb795
JB
13147 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
13148 {
13149 const expressionS *e = symbol_get_value_expression (symbolP);
13150
0ccade1a
JB
13151 if (e->X_op == O_register)
13152 {
13153 know (e->X_add_number >= 0
13154 && (valueT) e->X_add_number < i386_regtab_size);
13155 r = i386_regtab + e->X_add_number;
13156 *end_op = input_line_pointer;
13157 }
13158 if (r && !check_register (r))
8a6fb3f9 13159 {
3b55a1d0
JB
13160 as_bad (_("register '%s%s' cannot be used here"),
13161 register_prefix, r->reg_name);
13162 r = &bad_reg;
8a6fb3f9 13163 }
4d1bb795
JB
13164 }
13165 *input_line_pointer = c;
13166 input_line_pointer = save;
13167 }
13168 return r;
13169}
13170
13171int
13172i386_parse_name (char *name, expressionS *e, char *nextcharP)
13173{
4faaa10f 13174 const reg_entry *r = NULL;
4d1bb795
JB
13175 char *end = input_line_pointer;
13176
13177 *end = *nextcharP;
4faaa10f
JB
13178 if (*name == REGISTER_PREFIX || allow_naked_reg)
13179 r = parse_real_register (name, &input_line_pointer);
4d1bb795
JB
13180 if (r && end <= input_line_pointer)
13181 {
13182 *nextcharP = *input_line_pointer;
13183 *input_line_pointer = 0;
8a6fb3f9
JB
13184 if (r != &bad_reg)
13185 {
13186 e->X_op = O_register;
13187 e->X_add_number = r - i386_regtab;
13188 }
13189 else
13190 e->X_op = O_illegal;
4d1bb795
JB
13191 return 1;
13192 }
13193 input_line_pointer = end;
13194 *end = 0;
ee86248c 13195 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
4d1bb795
JB
13196}
13197
13198void
13199md_operand (expressionS *e)
13200{
ee86248c
JB
13201 char *end;
13202 const reg_entry *r;
4d1bb795 13203
ee86248c
JB
13204 switch (*input_line_pointer)
13205 {
13206 case REGISTER_PREFIX:
13207 r = parse_real_register (input_line_pointer, &end);
4d1bb795
JB
13208 if (r)
13209 {
13210 e->X_op = O_register;
13211 e->X_add_number = r - i386_regtab;
13212 input_line_pointer = end;
13213 }
ee86248c
JB
13214 break;
13215
13216 case '[':
9c2799c2 13217 gas_assert (intel_syntax);
ee86248c
JB
13218 end = input_line_pointer++;
13219 expression (e);
13220 if (*input_line_pointer == ']')
13221 {
13222 ++input_line_pointer;
13223 e->X_op_symbol = make_expr_symbol (e);
13224 e->X_add_symbol = NULL;
13225 e->X_add_number = 0;
13226 e->X_op = O_index;
13227 }
13228 else
13229 {
13230 e->X_op = O_absent;
13231 input_line_pointer = end;
13232 }
13233 break;
4d1bb795
JB
13234 }
13235}
13236
252b5132 13237\f
4cc782b5 13238#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
b6f8c7c4 13239const char *md_shortopts = "kVQ:sqnO::";
252b5132 13240#else
b6f8c7c4 13241const char *md_shortopts = "qnO::";
252b5132 13242#endif
6e0b89ee 13243
3e73aa7c 13244#define OPTION_32 (OPTION_MD_BASE + 0)
b3b91714
AM
13245#define OPTION_64 (OPTION_MD_BASE + 1)
13246#define OPTION_DIVIDE (OPTION_MD_BASE + 2)
9103f4f4
L
13247#define OPTION_MARCH (OPTION_MD_BASE + 3)
13248#define OPTION_MTUNE (OPTION_MD_BASE + 4)
1efbbeb4
L
13249#define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
13250#define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
13251#define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
13252#define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
bd5dea88 13253#define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
c0f3af97 13254#define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
daf50ae7 13255#define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
7bab8ab5
JB
13256#define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
13257#define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
13258#define OPTION_X32 (OPTION_MD_BASE + 14)
7e8b059b 13259#define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
43234a1e
L
13260#define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
13261#define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
167ad85b 13262#define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
d1982f93 13263#define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
d3d3c6db 13264#define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
8dcea932 13265#define OPTION_MSHARED (OPTION_MD_BASE + 21)
5db04b09
L
13266#define OPTION_MAMD64 (OPTION_MD_BASE + 22)
13267#define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
e4e00185 13268#define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
b4a3a7b4 13269#define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
03751133 13270#define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
e379e5f3
L
13271#define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
13272#define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
13273#define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
76cf450b 13274#define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
ae531041
L
13275#define OPTION_MLFENCE_AFTER_LOAD (OPTION_MD_BASE + 31)
13276#define OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH (OPTION_MD_BASE + 32)
13277#define OPTION_MLFENCE_BEFORE_RET (OPTION_MD_BASE + 33)
c8480b58 13278#define OPTION_MUSE_UNALIGNED_VECTOR_MOVE (OPTION_MD_BASE + 34)
b3b91714 13279
99ad8390
NC
13280struct option md_longopts[] =
13281{
3e73aa7c 13282 {"32", no_argument, NULL, OPTION_32},
321098a5 13283#if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
d382c579 13284 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
3e73aa7c 13285 {"64", no_argument, NULL, OPTION_64},
351f65ca
L
13286#endif
13287#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
570561f7 13288 {"x32", no_argument, NULL, OPTION_X32},
8dcea932 13289 {"mshared", no_argument, NULL, OPTION_MSHARED},
b4a3a7b4 13290 {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
6e0b89ee 13291#endif
b3b91714 13292 {"divide", no_argument, NULL, OPTION_DIVIDE},
9103f4f4
L
13293 {"march", required_argument, NULL, OPTION_MARCH},
13294 {"mtune", required_argument, NULL, OPTION_MTUNE},
1efbbeb4
L
13295 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
13296 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
13297 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
13298 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
c0f3af97 13299 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
c8480b58 13300 {"muse-unaligned-vector-move", no_argument, NULL, OPTION_MUSE_UNALIGNED_VECTOR_MOVE},
daf50ae7 13301 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
7bab8ab5 13302 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
539f890d 13303 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
03751133 13304 {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
7e8b059b 13305 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
43234a1e
L
13306 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
13307 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
167ad85b
TG
13308# if defined (TE_PE) || defined (TE_PEP)
13309 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
13310#endif
d1982f93 13311 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
e4e00185 13312 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
0cb4071e 13313 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
d3d3c6db 13314 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
e379e5f3
L
13315 {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
13316 {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
13317 {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
76cf450b 13318 {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
ae531041
L
13319 {"mlfence-after-load", required_argument, NULL, OPTION_MLFENCE_AFTER_LOAD},
13320 {"mlfence-before-indirect-branch", required_argument, NULL,
13321 OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH},
13322 {"mlfence-before-ret", required_argument, NULL, OPTION_MLFENCE_BEFORE_RET},
5db04b09
L
13323 {"mamd64", no_argument, NULL, OPTION_MAMD64},
13324 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
252b5132
RH
13325 {NULL, no_argument, NULL, 0}
13326};
13327size_t md_longopts_size = sizeof (md_longopts);
13328
13329int
17b9d67d 13330md_parse_option (int c, const char *arg)
252b5132 13331{
91d6fa6a 13332 unsigned int j;
e379e5f3 13333 char *arch, *next, *saved, *type;
9103f4f4 13334
252b5132
RH
13335 switch (c)
13336 {
12b55ccc
L
13337 case 'n':
13338 optimize_align_code = 0;
13339 break;
13340
a38cf1db
AM
13341 case 'q':
13342 quiet_warnings = 1;
252b5132
RH
13343 break;
13344
13345#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
a38cf1db
AM
13346 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
13347 should be emitted or not. FIXME: Not implemented. */
13348 case 'Q':
d4693039
JB
13349 if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
13350 return 0;
252b5132
RH
13351 break;
13352
13353 /* -V: SVR4 argument to print version ID. */
13354 case 'V':
13355 print_version_id ();
13356 break;
13357
a38cf1db
AM
13358 /* -k: Ignore for FreeBSD compatibility. */
13359 case 'k':
252b5132 13360 break;
4cc782b5
ILT
13361
13362 case 's':
13363 /* -s: On i386 Solaris, this tells the native assembler to use
29b0f896 13364 .stab instead of .stab.excl. We always use .stab anyhow. */
4cc782b5 13365 break;
8dcea932
L
13366
13367 case OPTION_MSHARED:
13368 shared = 1;
13369 break;
b4a3a7b4
L
13370
13371 case OPTION_X86_USED_NOTE:
13372 if (strcasecmp (arg, "yes") == 0)
13373 x86_used_note = 1;
13374 else if (strcasecmp (arg, "no") == 0)
13375 x86_used_note = 0;
13376 else
13377 as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
13378 break;
13379
13380
99ad8390 13381#endif
321098a5 13382#if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
d382c579 13383 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
3e73aa7c
JH
13384 case OPTION_64:
13385 {
13386 const char **list, **l;
13387
3e73aa7c
JH
13388 list = bfd_target_list ();
13389 for (l = list; *l != NULL; l++)
08dedd66 13390 if (startswith (*l, "elf64-x86-64")
99ad8390
NC
13391 || strcmp (*l, "coff-x86-64") == 0
13392 || strcmp (*l, "pe-x86-64") == 0
d382c579
TG
13393 || strcmp (*l, "pei-x86-64") == 0
13394 || strcmp (*l, "mach-o-x86-64") == 0)
6e0b89ee
AM
13395 {
13396 default_arch = "x86_64";
13397 break;
13398 }
3e73aa7c 13399 if (*l == NULL)
2b5d6a91 13400 as_fatal (_("no compiled in support for x86_64"));
3e73aa7c
JH
13401 free (list);
13402 }
13403 break;
13404#endif
252b5132 13405
351f65ca 13406#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
570561f7 13407 case OPTION_X32:
351f65ca
L
13408 if (IS_ELF)
13409 {
13410 const char **list, **l;
13411
13412 list = bfd_target_list ();
13413 for (l = list; *l != NULL; l++)
08dedd66 13414 if (startswith (*l, "elf32-x86-64"))
351f65ca
L
13415 {
13416 default_arch = "x86_64:32";
13417 break;
13418 }
13419 if (*l == NULL)
2b5d6a91 13420 as_fatal (_("no compiled in support for 32bit x86_64"));
351f65ca
L
13421 free (list);
13422 }
13423 else
13424 as_fatal (_("32bit x86_64 is only supported for ELF"));
13425 break;
13426#endif
13427
6e0b89ee
AM
13428 case OPTION_32:
13429 default_arch = "i386";
13430 break;
13431
b3b91714
AM
13432 case OPTION_DIVIDE:
13433#ifdef SVR4_COMMENT_CHARS
13434 {
13435 char *n, *t;
13436 const char *s;
13437
add39d23 13438 n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
b3b91714
AM
13439 t = n;
13440 for (s = i386_comment_chars; *s != '\0'; s++)
13441 if (*s != '/')
13442 *t++ = *s;
13443 *t = '\0';
13444 i386_comment_chars = n;
13445 }
13446#endif
13447 break;
13448
9103f4f4 13449 case OPTION_MARCH:
293f5f65
L
13450 saved = xstrdup (arg);
13451 arch = saved;
13452 /* Allow -march=+nosse. */
13453 if (*arch == '+')
13454 arch++;
6305a203 13455 do
9103f4f4 13456 {
6305a203 13457 if (*arch == '.')
2b5d6a91 13458 as_fatal (_("invalid -march= option: `%s'"), arg);
6305a203
L
13459 next = strchr (arch, '+');
13460 if (next)
13461 *next++ = '\0';
91d6fa6a 13462 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
9103f4f4 13463 {
ae89daec
JB
13464 if (arch == saved && cpu_arch[j].type != PROCESSOR_NONE
13465 && strcmp (arch, cpu_arch[j].name) == 0)
ccc9c027 13466 {
6305a203 13467 /* Processor. */
ae89daec 13468 if (! cpu_arch[j].enable.bitfield.cpui386)
1ded5609
JB
13469 continue;
13470
91d6fa6a 13471 cpu_arch_name = cpu_arch[j].name;
d92c7521 13472 free (cpu_sub_arch_name);
6305a203 13473 cpu_sub_arch_name = NULL;
ae89daec 13474 cpu_arch_flags = cpu_arch[j].enable;
91d6fa6a 13475 cpu_arch_isa = cpu_arch[j].type;
ae89daec 13476 cpu_arch_isa_flags = cpu_arch[j].enable;
6305a203
L
13477 if (!cpu_arch_tune_set)
13478 {
13479 cpu_arch_tune = cpu_arch_isa;
13480 cpu_arch_tune_flags = cpu_arch_isa_flags;
13481 }
13482 break;
13483 }
ae89daec
JB
13484 else if (cpu_arch[j].type == PROCESSOR_NONE
13485 && strcmp (arch, cpu_arch[j].name) == 0
13486 && !cpu_flags_all_zero (&cpu_arch[j].enable))
6305a203 13487 {
33eaf5de 13488 /* ISA extension. */
6305a203 13489 i386_cpu_flags flags;
309d3373 13490
293f5f65 13491 flags = cpu_flags_or (cpu_arch_flags,
ae89daec 13492 cpu_arch[j].enable);
81486035 13493
5b64d091 13494 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
6305a203 13495 {
ae89daec 13496 extend_cpu_sub_arch_name (arch);
6305a203 13497 cpu_arch_flags = flags;
a586129e 13498 cpu_arch_isa_flags = flags;
6305a203 13499 }
0089dace
L
13500 else
13501 cpu_arch_isa_flags
13502 = cpu_flags_or (cpu_arch_isa_flags,
ae89daec 13503 cpu_arch[j].enable);
6305a203 13504 break;
ccc9c027 13505 }
9103f4f4 13506 }
6305a203 13507
ae89daec 13508 if (j >= ARRAY_SIZE (cpu_arch) && startswith (arch, "no"))
293f5f65 13509 {
33eaf5de 13510 /* Disable an ISA extension. */
ae89daec
JB
13511 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13512 if (cpu_arch[j].type == PROCESSOR_NONE
13513 && strcmp (arch + 2, cpu_arch[j].name) == 0)
293f5f65
L
13514 {
13515 i386_cpu_flags flags;
13516
13517 flags = cpu_flags_and_not (cpu_arch_flags,
ae89daec 13518 cpu_arch[j].disable);
293f5f65
L
13519 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
13520 {
8180707f 13521 extend_cpu_sub_arch_name (arch);
293f5f65
L
13522 cpu_arch_flags = flags;
13523 cpu_arch_isa_flags = flags;
13524 }
13525 break;
13526 }
293f5f65
L
13527 }
13528
91d6fa6a 13529 if (j >= ARRAY_SIZE (cpu_arch))
2b5d6a91 13530 as_fatal (_("invalid -march= option: `%s'"), arg);
6305a203
L
13531
13532 arch = next;
9103f4f4 13533 }
293f5f65
L
13534 while (next != NULL);
13535 free (saved);
9103f4f4
L
13536 break;
13537
13538 case OPTION_MTUNE:
13539 if (*arg == '.')
2b5d6a91 13540 as_fatal (_("invalid -mtune= option: `%s'"), arg);
91d6fa6a 13541 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
9103f4f4 13542 {
ae89daec
JB
13543 if (cpu_arch[j].type != PROCESSOR_NONE
13544 && strcmp (arg, cpu_arch[j].name) == 0)
9103f4f4 13545 {
ccc9c027 13546 cpu_arch_tune_set = 1;
91d6fa6a 13547 cpu_arch_tune = cpu_arch [j].type;
ae89daec 13548 cpu_arch_tune_flags = cpu_arch[j].enable;
9103f4f4
L
13549 break;
13550 }
13551 }
91d6fa6a 13552 if (j >= ARRAY_SIZE (cpu_arch))
2b5d6a91 13553 as_fatal (_("invalid -mtune= option: `%s'"), arg);
9103f4f4
L
13554 break;
13555
1efbbeb4
L
13556 case OPTION_MMNEMONIC:
13557 if (strcasecmp (arg, "att") == 0)
13558 intel_mnemonic = 0;
13559 else if (strcasecmp (arg, "intel") == 0)
13560 intel_mnemonic = 1;
13561 else
2b5d6a91 13562 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
1efbbeb4
L
13563 break;
13564
13565 case OPTION_MSYNTAX:
13566 if (strcasecmp (arg, "att") == 0)
13567 intel_syntax = 0;
13568 else if (strcasecmp (arg, "intel") == 0)
13569 intel_syntax = 1;
13570 else
2b5d6a91 13571 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
1efbbeb4
L
13572 break;
13573
13574 case OPTION_MINDEX_REG:
13575 allow_index_reg = 1;
13576 break;
13577
13578 case OPTION_MNAKED_REG:
13579 allow_naked_reg = 1;
13580 break;
13581
c0f3af97
L
13582 case OPTION_MSSE2AVX:
13583 sse2avx = 1;
13584 break;
13585
c8480b58
L
13586 case OPTION_MUSE_UNALIGNED_VECTOR_MOVE:
13587 use_unaligned_vector_move = 1;
13588 break;
13589
daf50ae7
L
13590 case OPTION_MSSE_CHECK:
13591 if (strcasecmp (arg, "error") == 0)
7bab8ab5 13592 sse_check = check_error;
daf50ae7 13593 else if (strcasecmp (arg, "warning") == 0)
7bab8ab5 13594 sse_check = check_warning;
daf50ae7 13595 else if (strcasecmp (arg, "none") == 0)
7bab8ab5 13596 sse_check = check_none;
daf50ae7 13597 else
2b5d6a91 13598 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
daf50ae7
L
13599 break;
13600
7bab8ab5
JB
13601 case OPTION_MOPERAND_CHECK:
13602 if (strcasecmp (arg, "error") == 0)
13603 operand_check = check_error;
13604 else if (strcasecmp (arg, "warning") == 0)
13605 operand_check = check_warning;
13606 else if (strcasecmp (arg, "none") == 0)
13607 operand_check = check_none;
13608 else
13609 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
13610 break;
13611
539f890d
L
13612 case OPTION_MAVXSCALAR:
13613 if (strcasecmp (arg, "128") == 0)
13614 avxscalar = vex128;
13615 else if (strcasecmp (arg, "256") == 0)
13616 avxscalar = vex256;
13617 else
2b5d6a91 13618 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
539f890d
L
13619 break;
13620
03751133
L
13621 case OPTION_MVEXWIG:
13622 if (strcmp (arg, "0") == 0)
40c9c8de 13623 vexwig = vexw0;
03751133 13624 else if (strcmp (arg, "1") == 0)
40c9c8de 13625 vexwig = vexw1;
03751133
L
13626 else
13627 as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
13628 break;
13629
7e8b059b
L
13630 case OPTION_MADD_BND_PREFIX:
13631 add_bnd_prefix = 1;
13632 break;
13633
43234a1e
L
13634 case OPTION_MEVEXLIG:
13635 if (strcmp (arg, "128") == 0)
13636 evexlig = evexl128;
13637 else if (strcmp (arg, "256") == 0)
13638 evexlig = evexl256;
13639 else if (strcmp (arg, "512") == 0)
13640 evexlig = evexl512;
13641 else
13642 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
13643 break;
13644
d3d3c6db
IT
13645 case OPTION_MEVEXRCIG:
13646 if (strcmp (arg, "rne") == 0)
13647 evexrcig = rne;
13648 else if (strcmp (arg, "rd") == 0)
13649 evexrcig = rd;
13650 else if (strcmp (arg, "ru") == 0)
13651 evexrcig = ru;
13652 else if (strcmp (arg, "rz") == 0)
13653 evexrcig = rz;
13654 else
13655 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
13656 break;
13657
43234a1e
L
13658 case OPTION_MEVEXWIG:
13659 if (strcmp (arg, "0") == 0)
13660 evexwig = evexw0;
13661 else if (strcmp (arg, "1") == 0)
13662 evexwig = evexw1;
13663 else
13664 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
13665 break;
13666
167ad85b
TG
13667# if defined (TE_PE) || defined (TE_PEP)
13668 case OPTION_MBIG_OBJ:
13669 use_big_obj = 1;
13670 break;
13671#endif
13672
d1982f93 13673 case OPTION_MOMIT_LOCK_PREFIX:
d022bddd
IT
13674 if (strcasecmp (arg, "yes") == 0)
13675 omit_lock_prefix = 1;
13676 else if (strcasecmp (arg, "no") == 0)
13677 omit_lock_prefix = 0;
13678 else
13679 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
13680 break;
13681
e4e00185
AS
13682 case OPTION_MFENCE_AS_LOCK_ADD:
13683 if (strcasecmp (arg, "yes") == 0)
13684 avoid_fence = 1;
13685 else if (strcasecmp (arg, "no") == 0)
13686 avoid_fence = 0;
13687 else
13688 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
13689 break;
13690
ae531041
L
13691 case OPTION_MLFENCE_AFTER_LOAD:
13692 if (strcasecmp (arg, "yes") == 0)
13693 lfence_after_load = 1;
13694 else if (strcasecmp (arg, "no") == 0)
13695 lfence_after_load = 0;
13696 else
13697 as_fatal (_("invalid -mlfence-after-load= option: `%s'"), arg);
13698 break;
13699
13700 case OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH:
13701 if (strcasecmp (arg, "all") == 0)
a09f656b 13702 {
13703 lfence_before_indirect_branch = lfence_branch_all;
13704 if (lfence_before_ret == lfence_before_ret_none)
13705 lfence_before_ret = lfence_before_ret_shl;
13706 }
ae531041
L
13707 else if (strcasecmp (arg, "memory") == 0)
13708 lfence_before_indirect_branch = lfence_branch_memory;
13709 else if (strcasecmp (arg, "register") == 0)
13710 lfence_before_indirect_branch = lfence_branch_register;
13711 else if (strcasecmp (arg, "none") == 0)
13712 lfence_before_indirect_branch = lfence_branch_none;
13713 else
13714 as_fatal (_("invalid -mlfence-before-indirect-branch= option: `%s'"),
13715 arg);
13716 break;
13717
13718 case OPTION_MLFENCE_BEFORE_RET:
13719 if (strcasecmp (arg, "or") == 0)
13720 lfence_before_ret = lfence_before_ret_or;
13721 else if (strcasecmp (arg, "not") == 0)
13722 lfence_before_ret = lfence_before_ret_not;
a09f656b 13723 else if (strcasecmp (arg, "shl") == 0 || strcasecmp (arg, "yes") == 0)
13724 lfence_before_ret = lfence_before_ret_shl;
ae531041
L
13725 else if (strcasecmp (arg, "none") == 0)
13726 lfence_before_ret = lfence_before_ret_none;
13727 else
13728 as_fatal (_("invalid -mlfence-before-ret= option: `%s'"),
13729 arg);
13730 break;
13731
0cb4071e
L
13732 case OPTION_MRELAX_RELOCATIONS:
13733 if (strcasecmp (arg, "yes") == 0)
13734 generate_relax_relocations = 1;
13735 else if (strcasecmp (arg, "no") == 0)
13736 generate_relax_relocations = 0;
13737 else
13738 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
13739 break;
13740
e379e5f3
L
13741 case OPTION_MALIGN_BRANCH_BOUNDARY:
13742 {
13743 char *end;
13744 long int align = strtoul (arg, &end, 0);
13745 if (*end == '\0')
13746 {
13747 if (align == 0)
13748 {
13749 align_branch_power = 0;
13750 break;
13751 }
13752 else if (align >= 16)
13753 {
13754 int align_power;
13755 for (align_power = 0;
13756 (align & 1) == 0;
13757 align >>= 1, align_power++)
13758 continue;
13759 /* Limit alignment power to 31. */
13760 if (align == 1 && align_power < 32)
13761 {
13762 align_branch_power = align_power;
13763 break;
13764 }
13765 }
13766 }
13767 as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
13768 }
13769 break;
13770
13771 case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
13772 {
13773 char *end;
13774 int align = strtoul (arg, &end, 0);
13775 /* Some processors only support 5 prefixes. */
13776 if (*end == '\0' && align >= 0 && align < 6)
13777 {
13778 align_branch_prefix_size = align;
13779 break;
13780 }
13781 as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
13782 arg);
13783 }
13784 break;
13785
13786 case OPTION_MALIGN_BRANCH:
13787 align_branch = 0;
13788 saved = xstrdup (arg);
13789 type = saved;
13790 do
13791 {
13792 next = strchr (type, '+');
13793 if (next)
13794 *next++ = '\0';
13795 if (strcasecmp (type, "jcc") == 0)
13796 align_branch |= align_branch_jcc_bit;
13797 else if (strcasecmp (type, "fused") == 0)
13798 align_branch |= align_branch_fused_bit;
13799 else if (strcasecmp (type, "jmp") == 0)
13800 align_branch |= align_branch_jmp_bit;
13801 else if (strcasecmp (type, "call") == 0)
13802 align_branch |= align_branch_call_bit;
13803 else if (strcasecmp (type, "ret") == 0)
13804 align_branch |= align_branch_ret_bit;
13805 else if (strcasecmp (type, "indirect") == 0)
13806 align_branch |= align_branch_indirect_bit;
13807 else
13808 as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
13809 type = next;
13810 }
13811 while (next != NULL);
13812 free (saved);
13813 break;
13814
76cf450b
L
13815 case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
13816 align_branch_power = 5;
13817 align_branch_prefix_size = 5;
13818 align_branch = (align_branch_jcc_bit
13819 | align_branch_fused_bit
13820 | align_branch_jmp_bit);
13821 break;
13822
5db04b09 13823 case OPTION_MAMD64:
4b5aaf5f 13824 isa64 = amd64;
5db04b09
L
13825 break;
13826
13827 case OPTION_MINTEL64:
4b5aaf5f 13828 isa64 = intel64;
5db04b09
L
13829 break;
13830
b6f8c7c4
L
13831 case 'O':
13832 if (arg == NULL)
13833 {
13834 optimize = 1;
13835 /* Turn off -Os. */
13836 optimize_for_space = 0;
13837 }
13838 else if (*arg == 's')
13839 {
13840 optimize_for_space = 1;
13841 /* Turn on all encoding optimizations. */
41fd2579 13842 optimize = INT_MAX;
b6f8c7c4
L
13843 }
13844 else
13845 {
13846 optimize = atoi (arg);
13847 /* Turn off -Os. */
13848 optimize_for_space = 0;
13849 }
13850 break;
13851
252b5132
RH
13852 default:
13853 return 0;
13854 }
13855 return 1;
13856}
13857
8a2c8fef
L
13858#define MESSAGE_TEMPLATE \
13859" "
13860
293f5f65
L
13861static char *
13862output_message (FILE *stream, char *p, char *message, char *start,
13863 int *left_p, const char *name, int len)
13864{
13865 int size = sizeof (MESSAGE_TEMPLATE);
13866 int left = *left_p;
13867
13868 /* Reserve 2 spaces for ", " or ",\0" */
13869 left -= len + 2;
13870
13871 /* Check if there is any room. */
13872 if (left >= 0)
13873 {
13874 if (p != start)
13875 {
13876 *p++ = ',';
13877 *p++ = ' ';
13878 }
13879 p = mempcpy (p, name, len);
13880 }
13881 else
13882 {
13883 /* Output the current message now and start a new one. */
13884 *p++ = ',';
13885 *p = '\0';
13886 fprintf (stream, "%s\n", message);
13887 p = start;
13888 left = size - (start - message) - len - 2;
13889
13890 gas_assert (left >= 0);
13891
13892 p = mempcpy (p, name, len);
13893 }
13894
13895 *left_p = left;
13896 return p;
13897}
13898
8a2c8fef 13899static void
1ded5609 13900show_arch (FILE *stream, int ext, int check)
8a2c8fef
L
13901{
13902 static char message[] = MESSAGE_TEMPLATE;
13903 char *start = message + 27;
13904 char *p;
13905 int size = sizeof (MESSAGE_TEMPLATE);
13906 int left;
13907 const char *name;
13908 int len;
13909 unsigned int j;
13910
13911 p = start;
13912 left = size - (start - message);
3ce2ebcf
JB
13913
13914 if (!ext && check)
13915 {
13916 p = output_message (stream, p, message, start, &left,
13917 STRING_COMMA_LEN ("default"));
f68697e8
JB
13918 p = output_message (stream, p, message, start, &left,
13919 STRING_COMMA_LEN ("push"));
13920 p = output_message (stream, p, message, start, &left,
13921 STRING_COMMA_LEN ("pop"));
3ce2ebcf
JB
13922 }
13923
8a2c8fef
L
13924 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13925 {
13926 /* Should it be skipped? */
13927 if (cpu_arch [j].skip)
13928 continue;
13929
13930 name = cpu_arch [j].name;
13931 len = cpu_arch [j].len;
ae89daec 13932 if (cpu_arch[j].type == PROCESSOR_NONE)
8a2c8fef
L
13933 {
13934 /* It is an extension. Skip if we aren't asked to show it. */
ae89daec 13935 if (!ext || cpu_flags_all_zero (&cpu_arch[j].enable))
8a2c8fef
L
13936 continue;
13937 }
13938 else if (ext)
13939 {
13940 /* It is an processor. Skip if we show only extension. */
13941 continue;
13942 }
ae89daec 13943 else if (check && ! cpu_arch[j].enable.bitfield.cpui386)
1ded5609
JB
13944 {
13945 /* It is an impossible processor - skip. */
13946 continue;
13947 }
8a2c8fef 13948
293f5f65 13949 p = output_message (stream, p, message, start, &left, name, len);
8a2c8fef
L
13950 }
13951
293f5f65
L
13952 /* Display disabled extensions. */
13953 if (ext)
ae89daec 13954 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
293f5f65 13955 {
ae89daec
JB
13956 char *str;
13957
13958 if (cpu_arch[j].type != PROCESSOR_NONE
13959 || !cpu_flags_all_zero (&cpu_arch[j].enable))
13960 continue;
13961 str = xasprintf ("no%s", cpu_arch[j].name);
13962 p = output_message (stream, p, message, start, &left, str,
13963 strlen (str));
13964 free (str);
293f5f65
L
13965 }
13966
8a2c8fef
L
13967 *p = '\0';
13968 fprintf (stream, "%s\n", message);
13969}
13970
252b5132 13971void
8a2c8fef 13972md_show_usage (FILE *stream)
252b5132 13973{
4cc782b5
ILT
13974#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13975 fprintf (stream, _("\
d4693039 13976 -Qy, -Qn ignored\n\
a38cf1db 13977 -V print assembler version number\n\
b3b91714
AM
13978 -k ignored\n"));
13979#endif
13980 fprintf (stream, _("\
7ebd68d1
NC
13981 -n do not optimize code alignment\n\
13982 -O{012s} attempt some code optimizations\n\
b3b91714
AM
13983 -q quieten some warnings\n"));
13984#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13985 fprintf (stream, _("\
a38cf1db 13986 -s ignored\n"));
b3b91714 13987#endif
b00af7c8
JB
13988#ifdef BFD64
13989# if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13990 fprintf (stream, _("\
13991 --32/--64/--x32 generate 32bit/64bit/x32 object\n"));
13992# elif defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O)
751d281c 13993 fprintf (stream, _("\
b00af7c8
JB
13994 --32/--64 generate 32bit/64bit object\n"));
13995# endif
751d281c 13996#endif
b3b91714
AM
13997#ifdef SVR4_COMMENT_CHARS
13998 fprintf (stream, _("\
13999 --divide do not treat `/' as a comment character\n"));
a38cf1db
AM
14000#else
14001 fprintf (stream, _("\
b3b91714 14002 --divide ignored\n"));
4cc782b5 14003#endif
9103f4f4 14004 fprintf (stream, _("\
6305a203 14005 -march=CPU[,+EXTENSION...]\n\
8a2c8fef 14006 generate code for CPU and EXTENSION, CPU is one of:\n"));
1ded5609 14007 show_arch (stream, 0, 1);
8a2c8fef 14008 fprintf (stream, _("\
ae89daec 14009 EXTENSION is combination of (possibly \"no\"-prefixed):\n"));
1ded5609 14010 show_arch (stream, 1, 0);
6305a203 14011 fprintf (stream, _("\
8a2c8fef 14012 -mtune=CPU optimize for CPU, CPU is one of:\n"));
1ded5609 14013 show_arch (stream, 0, 0);
ba104c83 14014 fprintf (stream, _("\
c0f3af97
L
14015 -msse2avx encode SSE instructions with VEX prefix\n"));
14016 fprintf (stream, _("\
c8480b58
L
14017 -muse-unaligned-vector-move\n\
14018 encode aligned vector move as unaligned vector move\n"));
14019 fprintf (stream, _("\
7c5c05ef 14020 -msse-check=[none|error|warning] (default: warning)\n\
daf50ae7
L
14021 check SSE instructions\n"));
14022 fprintf (stream, _("\
7c5c05ef 14023 -moperand-check=[none|error|warning] (default: warning)\n\
7bab8ab5
JB
14024 check operand combinations for validity\n"));
14025 fprintf (stream, _("\
7c5c05ef
L
14026 -mavxscalar=[128|256] (default: 128)\n\
14027 encode scalar AVX instructions with specific vector\n\
539f890d
L
14028 length\n"));
14029 fprintf (stream, _("\
03751133
L
14030 -mvexwig=[0|1] (default: 0)\n\
14031 encode VEX instructions with specific VEX.W value\n\
14032 for VEX.W bit ignored instructions\n"));
14033 fprintf (stream, _("\
7c5c05ef
L
14034 -mevexlig=[128|256|512] (default: 128)\n\
14035 encode scalar EVEX instructions with specific vector\n\
43234a1e
L
14036 length\n"));
14037 fprintf (stream, _("\
7c5c05ef
L
14038 -mevexwig=[0|1] (default: 0)\n\
14039 encode EVEX instructions with specific EVEX.W value\n\
43234a1e
L
14040 for EVEX.W bit ignored instructions\n"));
14041 fprintf (stream, _("\
7c5c05ef 14042 -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
d3d3c6db
IT
14043 encode EVEX instructions with specific EVEX.RC value\n\
14044 for SAE-only ignored instructions\n"));
14045 fprintf (stream, _("\
7c5c05ef
L
14046 -mmnemonic=[att|intel] "));
14047 if (SYSV386_COMPAT)
14048 fprintf (stream, _("(default: att)\n"));
14049 else
14050 fprintf (stream, _("(default: intel)\n"));
14051 fprintf (stream, _("\
14052 use AT&T/Intel mnemonic\n"));
ba104c83 14053 fprintf (stream, _("\
7c5c05ef
L
14054 -msyntax=[att|intel] (default: att)\n\
14055 use AT&T/Intel syntax\n"));
ba104c83
L
14056 fprintf (stream, _("\
14057 -mindex-reg support pseudo index registers\n"));
14058 fprintf (stream, _("\
14059 -mnaked-reg don't require `%%' prefix for registers\n"));
14060 fprintf (stream, _("\
7e8b059b 14061 -madd-bnd-prefix add BND prefix for all valid branches\n"));
b4a3a7b4 14062#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8dcea932
L
14063 fprintf (stream, _("\
14064 -mshared disable branch optimization for shared code\n"));
b4a3a7b4
L
14065 fprintf (stream, _("\
14066 -mx86-used-note=[no|yes] "));
14067 if (DEFAULT_X86_USED_NOTE)
14068 fprintf (stream, _("(default: yes)\n"));
14069 else
14070 fprintf (stream, _("(default: no)\n"));
14071 fprintf (stream, _("\
14072 generate x86 used ISA and feature properties\n"));
14073#endif
14074#if defined (TE_PE) || defined (TE_PEP)
167ad85b
TG
14075 fprintf (stream, _("\
14076 -mbig-obj generate big object files\n"));
14077#endif
d022bddd 14078 fprintf (stream, _("\
7c5c05ef 14079 -momit-lock-prefix=[no|yes] (default: no)\n\
d022bddd 14080 strip all lock prefixes\n"));
5db04b09 14081 fprintf (stream, _("\
7c5c05ef 14082 -mfence-as-lock-add=[no|yes] (default: no)\n\
e4e00185
AS
14083 encode lfence, mfence and sfence as\n\
14084 lock addl $0x0, (%%{re}sp)\n"));
14085 fprintf (stream, _("\
7c5c05ef
L
14086 -mrelax-relocations=[no|yes] "));
14087 if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
14088 fprintf (stream, _("(default: yes)\n"));
14089 else
14090 fprintf (stream, _("(default: no)\n"));
14091 fprintf (stream, _("\
0cb4071e
L
14092 generate relax relocations\n"));
14093 fprintf (stream, _("\
e379e5f3
L
14094 -malign-branch-boundary=NUM (default: 0)\n\
14095 align branches within NUM byte boundary\n"));
14096 fprintf (stream, _("\
14097 -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
14098 TYPE is combination of jcc, fused, jmp, call, ret,\n\
14099 indirect\n\
14100 specify types of branches to align\n"));
14101 fprintf (stream, _("\
14102 -malign-branch-prefix-size=NUM (default: 5)\n\
14103 align branches with NUM prefixes per instruction\n"));
14104 fprintf (stream, _("\
76cf450b
L
14105 -mbranches-within-32B-boundaries\n\
14106 align branches within 32 byte boundary\n"));
14107 fprintf (stream, _("\
ae531041
L
14108 -mlfence-after-load=[no|yes] (default: no)\n\
14109 generate lfence after load\n"));
14110 fprintf (stream, _("\
14111 -mlfence-before-indirect-branch=[none|all|register|memory] (default: none)\n\
14112 generate lfence before indirect near branch\n"));
14113 fprintf (stream, _("\
a09f656b 14114 -mlfence-before-ret=[none|or|not|shl|yes] (default: none)\n\
ae531041
L
14115 generate lfence before ret\n"));
14116 fprintf (stream, _("\
7c5c05ef 14117 -mamd64 accept only AMD64 ISA [default]\n"));
5db04b09
L
14118 fprintf (stream, _("\
14119 -mintel64 accept only Intel64 ISA\n"));
252b5132
RH
14120}
14121
3e73aa7c 14122#if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
321098a5 14123 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
e57f8c65 14124 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
252b5132
RH
14125
14126/* Pick the target format to use. */
14127
47926f60 14128const char *
e3bb37b5 14129i386_target_format (void)
252b5132 14130{
d34049e8 14131 if (startswith (default_arch, "x86_64"))
351f65ca
L
14132 {
14133 update_code_flag (CODE_64BIT, 1);
14134 if (default_arch[6] == '\0')
7f56bc95 14135 x86_elf_abi = X86_64_ABI;
351f65ca 14136 else
7f56bc95 14137 x86_elf_abi = X86_64_X32_ABI;
351f65ca 14138 }
3e73aa7c 14139 else if (!strcmp (default_arch, "i386"))
78f12dd3 14140 update_code_flag (CODE_32BIT, 1);
5197d474
L
14141 else if (!strcmp (default_arch, "iamcu"))
14142 {
14143 update_code_flag (CODE_32BIT, 1);
14144 if (cpu_arch_isa == PROCESSOR_UNKNOWN)
14145 {
14146 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
14147 cpu_arch_name = "iamcu";
d92c7521 14148 free (cpu_sub_arch_name);
5197d474
L
14149 cpu_sub_arch_name = NULL;
14150 cpu_arch_flags = iamcu_flags;
14151 cpu_arch_isa = PROCESSOR_IAMCU;
14152 cpu_arch_isa_flags = iamcu_flags;
14153 if (!cpu_arch_tune_set)
14154 {
14155 cpu_arch_tune = cpu_arch_isa;
14156 cpu_arch_tune_flags = cpu_arch_isa_flags;
14157 }
14158 }
8d471ec1 14159 else if (cpu_arch_isa != PROCESSOR_IAMCU)
5197d474
L
14160 as_fatal (_("Intel MCU doesn't support `%s' architecture"),
14161 cpu_arch_name);
14162 }
3e73aa7c 14163 else
2b5d6a91 14164 as_fatal (_("unknown architecture"));
89507696
JB
14165
14166 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
ae89daec 14167 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].enable;
89507696 14168 if (cpu_flags_all_zero (&cpu_arch_tune_flags))
ae89daec 14169 cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].enable;
89507696 14170
252b5132
RH
14171 switch (OUTPUT_FLAVOR)
14172 {
9384f2ff 14173#if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
4c63da97 14174 case bfd_target_aout_flavour:
47926f60 14175 return AOUT_TARGET_FORMAT;
4c63da97 14176#endif
9384f2ff
AM
14177#if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
14178# if defined (TE_PE) || defined (TE_PEP)
14179 case bfd_target_coff_flavour:
167ad85b 14180 if (flag_code == CODE_64BIT)
eb19308f
JB
14181 {
14182 object_64bit = 1;
14183 return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
14184 }
14185 return use_big_obj ? "pe-bigobj-i386" : "pe-i386";
9384f2ff 14186# elif defined (TE_GO32)
0561d57c
JK
14187 case bfd_target_coff_flavour:
14188 return "coff-go32";
9384f2ff 14189# else
252b5132
RH
14190 case bfd_target_coff_flavour:
14191 return "coff-i386";
9384f2ff 14192# endif
4c63da97 14193#endif
3e73aa7c 14194#if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
252b5132 14195 case bfd_target_elf_flavour:
3e73aa7c 14196 {
351f65ca
L
14197 const char *format;
14198
14199 switch (x86_elf_abi)
4fa24527 14200 {
351f65ca
L
14201 default:
14202 format = ELF_TARGET_FORMAT;
e379e5f3
L
14203#ifndef TE_SOLARIS
14204 tls_get_addr = "___tls_get_addr";
14205#endif
351f65ca 14206 break;
7f56bc95 14207 case X86_64_ABI:
351f65ca 14208 use_rela_relocations = 1;
4fa24527 14209 object_64bit = 1;
e379e5f3
L
14210#ifndef TE_SOLARIS
14211 tls_get_addr = "__tls_get_addr";
14212#endif
351f65ca
L
14213 format = ELF_TARGET_FORMAT64;
14214 break;
7f56bc95 14215 case X86_64_X32_ABI:
4fa24527 14216 use_rela_relocations = 1;
351f65ca 14217 object_64bit = 1;
e379e5f3
L
14218#ifndef TE_SOLARIS
14219 tls_get_addr = "__tls_get_addr";
14220#endif
862be3fb 14221 disallow_64bit_reloc = 1;
351f65ca
L
14222 format = ELF_TARGET_FORMAT32;
14223 break;
4fa24527 14224 }
c085ab00 14225 if (cpu_arch_isa == PROCESSOR_IAMCU)
81486035
L
14226 {
14227 if (x86_elf_abi != I386_ABI)
14228 as_fatal (_("Intel MCU is 32bit only"));
14229 return ELF_TARGET_IAMCU_FORMAT;
14230 }
8a9036a4 14231 else
351f65ca 14232 return format;
3e73aa7c 14233 }
e57f8c65
TG
14234#endif
14235#if defined (OBJ_MACH_O)
14236 case bfd_target_mach_o_flavour:
d382c579
TG
14237 if (flag_code == CODE_64BIT)
14238 {
14239 use_rela_relocations = 1;
14240 object_64bit = 1;
14241 return "mach-o-x86-64";
14242 }
14243 else
14244 return "mach-o-i386";
4c63da97 14245#endif
252b5132
RH
14246 default:
14247 abort ();
14248 return NULL;
14249 }
14250}
14251
47926f60 14252#endif /* OBJ_MAYBE_ more than one */
252b5132 14253\f
252b5132 14254symbolS *
7016a5d5 14255md_undefined_symbol (char *name)
252b5132 14256{
18dc2407
ILT
14257 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
14258 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
14259 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
14260 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
24eab124
AM
14261 {
14262 if (!GOT_symbol)
14263 {
14264 if (symbol_find (name))
14265 as_bad (_("GOT already in symbol table"));
14266 GOT_symbol = symbol_new (name, undefined_section,
e01e1cee 14267 &zero_address_frag, 0);
24eab124
AM
14268 };
14269 return GOT_symbol;
14270 }
252b5132
RH
14271 return 0;
14272}
14273
14274/* Round up a section size to the appropriate boundary. */
47926f60 14275
252b5132 14276valueT
7016a5d5 14277md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
252b5132 14278{
4c63da97
AM
14279#if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
14280 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
14281 {
14282 /* For a.out, force the section size to be aligned. If we don't do
14283 this, BFD will align it for us, but it will not write out the
14284 final bytes of the section. This may be a bug in BFD, but it is
14285 easier to fix it here since that is how the other a.out targets
14286 work. */
14287 int align;
14288
fd361982 14289 align = bfd_section_alignment (segment);
8d3842cd 14290 size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
4c63da97 14291 }
252b5132
RH
14292#endif
14293
14294 return size;
14295}
14296
14297/* On the i386, PC-relative offsets are relative to the start of the
14298 next instruction. That is, the address of the offset, plus its
14299 size, since the offset is always the last part of the insn. */
14300
14301long
e3bb37b5 14302md_pcrel_from (fixS *fixP)
252b5132
RH
14303{
14304 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
14305}
14306
14307#ifndef I386COFF
14308
14309static void
e3bb37b5 14310s_bss (int ignore ATTRIBUTE_UNUSED)
252b5132 14311{
29b0f896 14312 int temp;
252b5132 14313
8a75718c
JB
14314#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14315 if (IS_ELF)
14316 obj_elf_section_change_hook ();
14317#endif
252b5132
RH
14318 temp = get_absolute_expression ();
14319 subseg_set (bss_section, (subsegT) temp);
14320 demand_empty_rest_of_line ();
14321}
14322
14323#endif
14324
e379e5f3
L
14325/* Remember constant directive. */
14326
14327void
14328i386_cons_align (int ignore ATTRIBUTE_UNUSED)
14329{
14330 if (last_insn.kind != last_insn_directive
14331 && (bfd_section_flags (now_seg) & SEC_CODE))
14332 {
14333 last_insn.seg = now_seg;
14334 last_insn.kind = last_insn_directive;
14335 last_insn.name = "constant directive";
14336 last_insn.file = as_where (&last_insn.line);
ae531041
L
14337 if (lfence_before_ret != lfence_before_ret_none)
14338 {
14339 if (lfence_before_indirect_branch != lfence_branch_none)
14340 as_warn (_("constant directive skips -mlfence-before-ret "
14341 "and -mlfence-before-indirect-branch"));
14342 else
14343 as_warn (_("constant directive skips -mlfence-before-ret"));
14344 }
14345 else if (lfence_before_indirect_branch != lfence_branch_none)
14346 as_warn (_("constant directive skips -mlfence-before-indirect-branch"));
e379e5f3
L
14347 }
14348}
14349
3abbafc2 14350int
e3bb37b5 14351i386_validate_fix (fixS *fixp)
252b5132 14352{
e52a16f2
JB
14353 if (fixp->fx_addsy && S_GET_SEGMENT(fixp->fx_addsy) == reg_section)
14354 {
14355 reloc_howto_type *howto;
14356
14357 howto = bfd_reloc_type_lookup (stdoutput, fixp->fx_r_type);
14358 as_bad_where (fixp->fx_file, fixp->fx_line,
14359 _("invalid %s relocation against register"),
14360 howto ? howto->name : "<unknown>");
14361 return 0;
14362 }
14363
3abbafc2
JB
14364#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14365 if (fixp->fx_r_type == BFD_RELOC_SIZE32
14366 || fixp->fx_r_type == BFD_RELOC_SIZE64)
14367 return IS_ELF && fixp->fx_addsy
14368 && (!S_IS_DEFINED (fixp->fx_addsy)
14369 || S_IS_EXTERNAL (fixp->fx_addsy));
14370#endif
14371
02a86693 14372 if (fixp->fx_subsy)
252b5132 14373 {
02a86693 14374 if (fixp->fx_subsy == GOT_symbol)
23df1078 14375 {
02a86693
L
14376 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
14377 {
14378 if (!object_64bit)
14379 abort ();
14380#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14381 if (fixp->fx_tcbit2)
56ceb5b5
L
14382 fixp->fx_r_type = (fixp->fx_tcbit
14383 ? BFD_RELOC_X86_64_REX_GOTPCRELX
14384 : BFD_RELOC_X86_64_GOTPCRELX);
02a86693
L
14385 else
14386#endif
14387 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
14388 }
d6ab8113 14389 else
02a86693
L
14390 {
14391 if (!object_64bit)
14392 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
14393 else
14394 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
14395 }
14396 fixp->fx_subsy = 0;
23df1078 14397 }
252b5132 14398 }
02a86693 14399#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2585b7a5 14400 else
02a86693 14401 {
2585b7a5
L
14402 /* NB: Commit 292676c1 resolved PLT32 reloc aganst local symbol
14403 to section. Since PLT32 relocation must be against symbols,
14404 turn such PLT32 relocation into PC32 relocation. */
14405 if (fixp->fx_addsy
14406 && (fixp->fx_r_type == BFD_RELOC_386_PLT32
14407 || fixp->fx_r_type == BFD_RELOC_X86_64_PLT32)
14408 && symbol_section_p (fixp->fx_addsy))
14409 fixp->fx_r_type = BFD_RELOC_32_PCREL;
14410 if (!object_64bit)
14411 {
14412 if (fixp->fx_r_type == BFD_RELOC_386_GOT32
14413 && fixp->fx_tcbit2)
14414 fixp->fx_r_type = BFD_RELOC_386_GOT32X;
14415 }
02a86693
L
14416 }
14417#endif
3abbafc2
JB
14418
14419 return 1;
252b5132
RH
14420}
14421
252b5132 14422arelent *
7016a5d5 14423tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
252b5132
RH
14424{
14425 arelent *rel;
14426 bfd_reloc_code_real_type code;
14427
14428 switch (fixp->fx_r_type)
14429 {
8ce3d284 14430#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3abbafc2
JB
14431 symbolS *sym;
14432
8fd4256d
L
14433 case BFD_RELOC_SIZE32:
14434 case BFD_RELOC_SIZE64:
3abbafc2
JB
14435 if (fixp->fx_addsy
14436 && !bfd_is_abs_section (S_GET_SEGMENT (fixp->fx_addsy))
14437 && (!fixp->fx_subsy
14438 || bfd_is_abs_section (S_GET_SEGMENT (fixp->fx_subsy))))
14439 sym = fixp->fx_addsy;
14440 else if (fixp->fx_subsy
14441 && !bfd_is_abs_section (S_GET_SEGMENT (fixp->fx_subsy))
14442 && (!fixp->fx_addsy
14443 || bfd_is_abs_section (S_GET_SEGMENT (fixp->fx_addsy))))
14444 sym = fixp->fx_subsy;
14445 else
14446 sym = NULL;
14447 if (IS_ELF && sym && S_IS_DEFINED (sym) && !S_IS_EXTERNAL (sym))
8fd4256d
L
14448 {
14449 /* Resolve size relocation against local symbol to size of
14450 the symbol plus addend. */
3abbafc2 14451 valueT value = S_GET_SIZE (sym);
44f87162 14452
3abbafc2
JB
14453 if (symbol_get_bfdsym (sym)->flags & BSF_SECTION_SYM)
14454 value = bfd_section_size (S_GET_SEGMENT (sym));
14455 if (sym == fixp->fx_subsy)
14456 {
14457 value = -value;
14458 if (fixp->fx_addsy)
14459 value += S_GET_VALUE (fixp->fx_addsy);
14460 }
14461 else if (fixp->fx_subsy)
14462 value -= S_GET_VALUE (fixp->fx_subsy);
44f87162 14463 value += fixp->fx_offset;
8fd4256d 14464 if (fixp->fx_r_type == BFD_RELOC_SIZE32
d965814f 14465 && object_64bit
8fd4256d
L
14466 && !fits_in_unsigned_long (value))
14467 as_bad_where (fixp->fx_file, fixp->fx_line,
14468 _("symbol size computation overflow"));
14469 fixp->fx_addsy = NULL;
14470 fixp->fx_subsy = NULL;
14471 md_apply_fix (fixp, (valueT *) &value, NULL);
14472 return NULL;
14473 }
3abbafc2
JB
14474 if (!fixp->fx_addsy || fixp->fx_subsy)
14475 {
14476 as_bad_where (fixp->fx_file, fixp->fx_line,
14477 "unsupported expression involving @size");
14478 return NULL;
14479 }
8ce3d284 14480#endif
1a0670f3 14481 /* Fall through. */
8fd4256d 14482
3e73aa7c
JH
14483 case BFD_RELOC_X86_64_PLT32:
14484 case BFD_RELOC_X86_64_GOT32:
14485 case BFD_RELOC_X86_64_GOTPCREL:
56ceb5b5
L
14486 case BFD_RELOC_X86_64_GOTPCRELX:
14487 case BFD_RELOC_X86_64_REX_GOTPCRELX:
252b5132
RH
14488 case BFD_RELOC_386_PLT32:
14489 case BFD_RELOC_386_GOT32:
02a86693 14490 case BFD_RELOC_386_GOT32X:
252b5132
RH
14491 case BFD_RELOC_386_GOTOFF:
14492 case BFD_RELOC_386_GOTPC:
13ae64f3
JJ
14493 case BFD_RELOC_386_TLS_GD:
14494 case BFD_RELOC_386_TLS_LDM:
14495 case BFD_RELOC_386_TLS_LDO_32:
14496 case BFD_RELOC_386_TLS_IE_32:
37e55690
JJ
14497 case BFD_RELOC_386_TLS_IE:
14498 case BFD_RELOC_386_TLS_GOTIE:
13ae64f3
JJ
14499 case BFD_RELOC_386_TLS_LE_32:
14500 case BFD_RELOC_386_TLS_LE:
67a4f2b7
AO
14501 case BFD_RELOC_386_TLS_GOTDESC:
14502 case BFD_RELOC_386_TLS_DESC_CALL:
bffbf940
JJ
14503 case BFD_RELOC_X86_64_TLSGD:
14504 case BFD_RELOC_X86_64_TLSLD:
14505 case BFD_RELOC_X86_64_DTPOFF32:
d6ab8113 14506 case BFD_RELOC_X86_64_DTPOFF64:
bffbf940
JJ
14507 case BFD_RELOC_X86_64_GOTTPOFF:
14508 case BFD_RELOC_X86_64_TPOFF32:
d6ab8113
JB
14509 case BFD_RELOC_X86_64_TPOFF64:
14510 case BFD_RELOC_X86_64_GOTOFF64:
14511 case BFD_RELOC_X86_64_GOTPC32:
7b81dfbb
AJ
14512 case BFD_RELOC_X86_64_GOT64:
14513 case BFD_RELOC_X86_64_GOTPCREL64:
14514 case BFD_RELOC_X86_64_GOTPC64:
14515 case BFD_RELOC_X86_64_GOTPLT64:
14516 case BFD_RELOC_X86_64_PLTOFF64:
67a4f2b7
AO
14517 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
14518 case BFD_RELOC_X86_64_TLSDESC_CALL:
252b5132
RH
14519 case BFD_RELOC_RVA:
14520 case BFD_RELOC_VTABLE_ENTRY:
14521 case BFD_RELOC_VTABLE_INHERIT:
6482c264
NC
14522#ifdef TE_PE
14523 case BFD_RELOC_32_SECREL:
145667f8 14524 case BFD_RELOC_16_SECIDX:
6482c264 14525#endif
252b5132
RH
14526 code = fixp->fx_r_type;
14527 break;
dbbaec26
L
14528 case BFD_RELOC_X86_64_32S:
14529 if (!fixp->fx_pcrel)
14530 {
14531 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
14532 code = fixp->fx_r_type;
14533 break;
14534 }
1a0670f3 14535 /* Fall through. */
252b5132 14536 default:
93382f6d 14537 if (fixp->fx_pcrel)
252b5132 14538 {
93382f6d
AM
14539 switch (fixp->fx_size)
14540 {
14541 default:
b091f402
AM
14542 as_bad_where (fixp->fx_file, fixp->fx_line,
14543 _("can not do %d byte pc-relative relocation"),
14544 fixp->fx_size);
93382f6d
AM
14545 code = BFD_RELOC_32_PCREL;
14546 break;
14547 case 1: code = BFD_RELOC_8_PCREL; break;
14548 case 2: code = BFD_RELOC_16_PCREL; break;
d258b828 14549 case 4: code = BFD_RELOC_32_PCREL; break;
d6ab8113
JB
14550#ifdef BFD64
14551 case 8: code = BFD_RELOC_64_PCREL; break;
14552#endif
93382f6d
AM
14553 }
14554 }
14555 else
14556 {
14557 switch (fixp->fx_size)
14558 {
14559 default:
b091f402
AM
14560 as_bad_where (fixp->fx_file, fixp->fx_line,
14561 _("can not do %d byte relocation"),
14562 fixp->fx_size);
93382f6d
AM
14563 code = BFD_RELOC_32;
14564 break;
14565 case 1: code = BFD_RELOC_8; break;
14566 case 2: code = BFD_RELOC_16; break;
14567 case 4: code = BFD_RELOC_32; break;
937149dd 14568#ifdef BFD64
3e73aa7c 14569 case 8: code = BFD_RELOC_64; break;
937149dd 14570#endif
93382f6d 14571 }
252b5132
RH
14572 }
14573 break;
14574 }
252b5132 14575
d182319b
JB
14576 if ((code == BFD_RELOC_32
14577 || code == BFD_RELOC_32_PCREL
14578 || code == BFD_RELOC_X86_64_32S)
252b5132
RH
14579 && GOT_symbol
14580 && fixp->fx_addsy == GOT_symbol)
3e73aa7c 14581 {
4fa24527 14582 if (!object_64bit)
d6ab8113
JB
14583 code = BFD_RELOC_386_GOTPC;
14584 else
14585 code = BFD_RELOC_X86_64_GOTPC32;
3e73aa7c 14586 }
7b81dfbb
AJ
14587 if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
14588 && GOT_symbol
14589 && fixp->fx_addsy == GOT_symbol)
14590 {
14591 code = BFD_RELOC_X86_64_GOTPC64;
14592 }
252b5132 14593
add39d23
TS
14594 rel = XNEW (arelent);
14595 rel->sym_ptr_ptr = XNEW (asymbol *);
49309057 14596 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
252b5132
RH
14597
14598 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
c87db184 14599
3e73aa7c
JH
14600 if (!use_rela_relocations)
14601 {
14602 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
14603 vtable entry to be used in the relocation's section offset. */
14604 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
14605 rel->address = fixp->fx_offset;
fbeb56a4
DK
14606#if defined (OBJ_COFF) && defined (TE_PE)
14607 else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
14608 rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
14609 else
14610#endif
c6682705 14611 rel->addend = 0;
3e73aa7c
JH
14612 }
14613 /* Use the rela in 64bit mode. */
252b5132 14614 else
3e73aa7c 14615 {
862be3fb
L
14616 if (disallow_64bit_reloc)
14617 switch (code)
14618 {
862be3fb
L
14619 case BFD_RELOC_X86_64_DTPOFF64:
14620 case BFD_RELOC_X86_64_TPOFF64:
14621 case BFD_RELOC_64_PCREL:
14622 case BFD_RELOC_X86_64_GOTOFF64:
14623 case BFD_RELOC_X86_64_GOT64:
14624 case BFD_RELOC_X86_64_GOTPCREL64:
14625 case BFD_RELOC_X86_64_GOTPC64:
14626 case BFD_RELOC_X86_64_GOTPLT64:
14627 case BFD_RELOC_X86_64_PLTOFF64:
14628 as_bad_where (fixp->fx_file, fixp->fx_line,
14629 _("cannot represent relocation type %s in x32 mode"),
14630 bfd_get_reloc_code_name (code));
14631 break;
14632 default:
14633 break;
14634 }
14635
062cd5e7
AS
14636 if (!fixp->fx_pcrel)
14637 rel->addend = fixp->fx_offset;
14638 else
14639 switch (code)
14640 {
14641 case BFD_RELOC_X86_64_PLT32:
14642 case BFD_RELOC_X86_64_GOT32:
14643 case BFD_RELOC_X86_64_GOTPCREL:
56ceb5b5
L
14644 case BFD_RELOC_X86_64_GOTPCRELX:
14645 case BFD_RELOC_X86_64_REX_GOTPCRELX:
bffbf940
JJ
14646 case BFD_RELOC_X86_64_TLSGD:
14647 case BFD_RELOC_X86_64_TLSLD:
14648 case BFD_RELOC_X86_64_GOTTPOFF:
67a4f2b7
AO
14649 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
14650 case BFD_RELOC_X86_64_TLSDESC_CALL:
062cd5e7
AS
14651 rel->addend = fixp->fx_offset - fixp->fx_size;
14652 break;
14653 default:
14654 rel->addend = (section->vma
14655 - fixp->fx_size
14656 + fixp->fx_addnumber
14657 + md_pcrel_from (fixp));
14658 break;
14659 }
3e73aa7c
JH
14660 }
14661
252b5132
RH
14662 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
14663 if (rel->howto == NULL)
14664 {
14665 as_bad_where (fixp->fx_file, fixp->fx_line,
d0b47220 14666 _("cannot represent relocation type %s"),
252b5132
RH
14667 bfd_get_reloc_code_name (code));
14668 /* Set howto to a garbage value so that we can keep going. */
14669 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
9c2799c2 14670 gas_assert (rel->howto != NULL);
252b5132
RH
14671 }
14672
14673 return rel;
14674}
14675
ee86248c 14676#include "tc-i386-intel.c"
54cfded0 14677
a60de03c
JB
14678void
14679tc_x86_parse_to_dw2regnum (expressionS *exp)
54cfded0 14680{
a60de03c
JB
14681 int saved_naked_reg;
14682 char saved_register_dot;
54cfded0 14683
a60de03c
JB
14684 saved_naked_reg = allow_naked_reg;
14685 allow_naked_reg = 1;
14686 saved_register_dot = register_chars['.'];
14687 register_chars['.'] = '.';
14688 allow_pseudo_reg = 1;
14689 expression_and_evaluate (exp);
14690 allow_pseudo_reg = 0;
14691 register_chars['.'] = saved_register_dot;
14692 allow_naked_reg = saved_naked_reg;
14693
e96d56a1 14694 if (exp->X_op == O_register && exp->X_add_number >= 0)
54cfded0 14695 {
a60de03c
JB
14696 if ((addressT) exp->X_add_number < i386_regtab_size)
14697 {
14698 exp->X_op = O_constant;
14699 exp->X_add_number = i386_regtab[exp->X_add_number]
14700 .dw2_regnum[flag_code >> 1];
14701 }
14702 else
14703 exp->X_op = O_illegal;
54cfded0 14704 }
54cfded0
AM
14705}
14706
14707void
14708tc_x86_frame_initial_instructions (void)
14709{
a60de03c
JB
14710 static unsigned int sp_regno[2];
14711
14712 if (!sp_regno[flag_code >> 1])
14713 {
14714 char *saved_input = input_line_pointer;
14715 char sp[][4] = {"esp", "rsp"};
14716 expressionS exp;
a4447b93 14717
a60de03c
JB
14718 input_line_pointer = sp[flag_code >> 1];
14719 tc_x86_parse_to_dw2regnum (&exp);
9c2799c2 14720 gas_assert (exp.X_op == O_constant);
a60de03c
JB
14721 sp_regno[flag_code >> 1] = exp.X_add_number;
14722 input_line_pointer = saved_input;
14723 }
a4447b93 14724
61ff971f
L
14725 cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
14726 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
54cfded0 14727}
d2b2c203 14728
d7921315
L
14729int
14730x86_dwarf2_addr_size (void)
14731{
14732#if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
14733 if (x86_elf_abi == X86_64_X32_ABI)
14734 return 4;
14735#endif
14736 return bfd_arch_bits_per_address (stdoutput) / 8;
14737}
14738
d2b2c203
DJ
14739int
14740i386_elf_section_type (const char *str, size_t len)
14741{
14742 if (flag_code == CODE_64BIT
14743 && len == sizeof ("unwind") - 1
d34049e8 14744 && startswith (str, "unwind"))
d2b2c203
DJ
14745 return SHT_X86_64_UNWIND;
14746
14747 return -1;
14748}
bb41ade5 14749
ad5fec3b
EB
14750#ifdef TE_SOLARIS
14751void
14752i386_solaris_fix_up_eh_frame (segT sec)
14753{
14754 if (flag_code == CODE_64BIT)
14755 elf_section_type (sec) = SHT_X86_64_UNWIND;
14756}
14757#endif
14758
bb41ade5
AM
14759#ifdef TE_PE
14760void
14761tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
14762{
91d6fa6a 14763 expressionS exp;
bb41ade5 14764
91d6fa6a
NC
14765 exp.X_op = O_secrel;
14766 exp.X_add_symbol = symbol;
14767 exp.X_add_number = 0;
14768 emit_expr (&exp, size);
bb41ade5
AM
14769}
14770#endif
3b22753a
L
14771
14772#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14773/* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
14774
01e1a5bc 14775bfd_vma
6d4af3c2 14776x86_64_section_letter (int letter, const char **ptr_msg)
3b22753a
L
14777{
14778 if (flag_code == CODE_64BIT)
14779 {
14780 if (letter == 'l')
14781 return SHF_X86_64_LARGE;
14782
8f3bae45 14783 *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
64e74474 14784 }
3b22753a 14785 else
8f3bae45 14786 *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
3b22753a
L
14787 return -1;
14788}
14789
01e1a5bc 14790bfd_vma
3b22753a
L
14791x86_64_section_word (char *str, size_t len)
14792{
08dedd66 14793 if (len == 5 && flag_code == CODE_64BIT && startswith (str, "large"))
3b22753a
L
14794 return SHF_X86_64_LARGE;
14795
14796 return -1;
14797}
14798
14799static void
14800handle_large_common (int small ATTRIBUTE_UNUSED)
14801{
14802 if (flag_code != CODE_64BIT)
14803 {
14804 s_comm_internal (0, elf_common_parse);
14805 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
14806 }
14807 else
14808 {
14809 static segT lbss_section;
14810 asection *saved_com_section_ptr = elf_com_section_ptr;
14811 asection *saved_bss_section = bss_section;
14812
14813 if (lbss_section == NULL)
14814 {
14815 flagword applicable;
14816 segT seg = now_seg;
14817 subsegT subseg = now_subseg;
14818
14819 /* The .lbss section is for local .largecomm symbols. */
14820 lbss_section = subseg_new (".lbss", 0);
14821 applicable = bfd_applicable_section_flags (stdoutput);
fd361982 14822 bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
3b22753a
L
14823 seg_info (lbss_section)->bss = 1;
14824
14825 subseg_set (seg, subseg);
14826 }
14827
14828 elf_com_section_ptr = &_bfd_elf_large_com_section;
14829 bss_section = lbss_section;
14830
14831 s_comm_internal (0, elf_common_parse);
14832
14833 elf_com_section_ptr = saved_com_section_ptr;
14834 bss_section = saved_bss_section;
14835 }
14836}
14837#endif /* OBJ_ELF || OBJ_MAYBE_ELF */