/* tc-i386.c -- Assemble code for the Intel 80386
   Copyright (C) 1989-2021 Free Software Foundation, Inc.

   This file is part of GAS, the GNU Assembler.

   GAS is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 3, or (at your option)
   any later version.

   GAS is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with GAS; see the file COPYING.  If not, write to the Free
   Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
   02110-1301, USA.  */

/* Intel 80386 machine specific gas.
   Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
   x86_64 support by Jan Hubicka (jh@suse.cz)
   VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
   Bugs & suggestions are completely welcome.  This is free software.
   Please help us make it better.  */

#include "as.h"
#include "safe-ctype.h"
#include "subsegs.h"
#include "dwarf2dbg.h"
#include "dw2gencfi.h"
#include "elf/x86-64.h"
#include "opcodes/i386-init.h"

#ifdef HAVE_LIMITS_H
#include <limits.h>
#else
#ifdef HAVE_SYS_PARAM_H
#include <sys/param.h>
#endif
#ifndef INT_MAX
#define INT_MAX (int) (((unsigned) (-1)) >> 1)
#endif
#endif

#ifndef INFER_ADDR_PREFIX
#define INFER_ADDR_PREFIX 1
#endif

#ifndef DEFAULT_ARCH
#define DEFAULT_ARCH "i386"
#endif

#ifndef INLINE
#if __GNUC__ >= 2
#define INLINE __inline__
#else
#define INLINE
#endif
#endif

/* Prefixes will be emitted in the order defined below.
   WAIT_PREFIX must be the first prefix since FWAIT is really an
   instruction, and so must come before any prefixes.
   The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
   REP_PREFIX/HLE_PREFIX, LOCK_PREFIX.  */
#define WAIT_PREFIX	0
#define SEG_PREFIX	1
#define ADDR_PREFIX	2
#define DATA_PREFIX	3
#define REP_PREFIX	4
#define HLE_PREFIX	REP_PREFIX
#define BND_PREFIX	REP_PREFIX
#define LOCK_PREFIX	5
#define REX_PREFIX	6	/* must come last.  */
#define MAX_PREFIXES	7	/* max prefixes per opcode */
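
/* Illustrative sketch (not from the original source): for
   "lock addw %ax, %fs:(%eax)" assembled as 64-bit code, the prefix
   slots would hold roughly prefix[SEG_PREFIX] = 0x64 (%fs),
   prefix[ADDR_PREFIX] = 0x67, prefix[DATA_PREFIX] = 0x66 and
   prefix[LOCK_PREFIX] = 0xf0, and the bytes are then emitted in the
   slot order defined above.  */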

/* we define the syntax here (modulo base,index,scale syntax) */
#define REGISTER_PREFIX '%'
#define IMMEDIATE_PREFIX '$'
#define ABSOLUTE_PREFIX '*'

/* these are the instruction mnemonic suffixes in AT&T syntax or
   memory operand size in Intel syntax.  */
#define WORD_MNEM_SUFFIX  'w'
#define BYTE_MNEM_SUFFIX  'b'
#define SHORT_MNEM_SUFFIX 's'
#define LONG_MNEM_SUFFIX  'l'
#define QWORD_MNEM_SUFFIX 'q'
/* Intel Syntax.  Use a non-ascii letter since it never appears
   in instructions.  */
#define LONG_DOUBLE_MNEM_SUFFIX '\1'

#define END_OF_INSN '\0'

/* This matches the C -> StaticRounding alias in the opcode table.  */
#define commutative staticrounding

/*
  'templates' is for grouping together 'template' structures for opcodes
  of the same name.  This is only used for storing the insns in the grand
  ole hash table of insns.
  The templates themselves start at START and range up to (but not including)
  END.
  */
typedef struct
{
  const insn_template *start;
  const insn_template *end;
}
templates;

/* 386 operand encoding bytes:  see 386 book for details of this.  */
typedef struct
{
  unsigned int regmem;	/* codes register or memory operand */
  unsigned int reg;	/* codes register operand (or extended opcode) */
  unsigned int mode;	/* how to interpret regmem & reg */
}
modrm_byte;

/* x86-64 extension prefix.  */
typedef int rex_byte;

/* 386 opcode byte to code indirect addressing.  */
typedef struct
{
  unsigned base;
  unsigned index;
  unsigned scale;
}
sib_byte;

/* x86 arch names, types and features */
typedef struct
{
  const char *name;		/* arch name */
  unsigned int len;		/* arch string length */
  enum processor_type type;	/* arch type */
  i386_cpu_flags flags;		/* cpu feature flags */
  unsigned int skip;		/* show_arch should skip this. */
}
arch_entry;

/* Used to turn off indicated flags.  */
typedef struct
{
  const char *name;		/* arch name */
  unsigned int len;		/* arch string length */
  i386_cpu_flags flags;		/* cpu feature flags */
}
noarch_entry;

static void update_code_flag (int, int);
static void set_code_flag (int);
static void set_16bit_gcc_code_flag (int);
static void set_intel_syntax (int);
static void set_intel_mnemonic (int);
static void set_allow_index_reg (int);
static void set_check (int);
static void set_cpu_arch (int);
#ifdef TE_PE
static void pe_directive_secrel (int);
#endif
static void signed_cons (int);
static char *output_invalid (int c);
static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
				    const char *);
static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
				       const char *);
static int i386_att_operand (char *);
static int i386_intel_operand (char *, int);
static int i386_intel_simplify (expressionS *);
static int i386_intel_parse_name (const char *, expressionS *);
static const reg_entry *parse_register (char *, char **);
static char *parse_insn (char *, char *);
static char *parse_operands (char *, const char *);
static void swap_operands (void);
static void swap_2_operands (int, int);
static enum flag_code i386_addressing_mode (void);
static void optimize_imm (void);
static void optimize_disp (void);
static const insn_template *match_template (char);
static int check_string (void);
static int process_suffix (void);
static int check_byte_reg (void);
static int check_long_reg (void);
static int check_qword_reg (void);
static int check_word_reg (void);
static int finalize_imm (void);
static int process_operands (void);
static const seg_entry *build_modrm_byte (void);
static void output_insn (void);
static void output_imm (fragS *, offsetT);
static void output_disp (fragS *, offsetT);
#ifndef I386COFF
static void s_bss (int);
#endif
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
static void handle_large_common (int small ATTRIBUTE_UNUSED);

/* GNU_PROPERTY_X86_ISA_1_USED.  */
static unsigned int x86_isa_1_used;
/* GNU_PROPERTY_X86_FEATURE_2_USED.  */
static unsigned int x86_feature_2_used;
/* Generate x86 used ISA and feature properties.  */
static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
#endif

static const char *default_arch = DEFAULT_ARCH;

/* parse_register() returns this when a register alias cannot be used.  */
static const reg_entry bad_reg = { "<bad>", OPERAND_TYPE_NONE, 0, 0,
				   { Dw2Inval, Dw2Inval } };

/* This struct describes rounding control and SAE in the instruction.  */
struct RC_Operation
{
  enum rc_type
    {
      rne = 0,
      rd,
      ru,
      rz,
      saeonly
    } type;
  int operand;
};

static struct RC_Operation rc_op;

/* The struct describes masking, applied to OPERAND in the instruction.
   MASK is a pointer to the corresponding mask register.  ZEROING tells
   whether merging or zeroing mask is used.  */
struct Mask_Operation
{
  const reg_entry *mask;
  unsigned int zeroing;
  /* The operand where this operation is associated.  */
  int operand;
};

static struct Mask_Operation mask_op;

/* The struct describes broadcasting, applied to OPERAND.  TYPE encodes
   the broadcast factor.  */
struct Broadcast_Operation
{
  /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}.  */
  int type;

  /* Index of broadcasted operand.  */
  int operand;

  /* Number of bytes to broadcast.  */
  int bytes;
};
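
/* For instance (sketch, not from the original source): for the AT&T
   operand "(%rax){1to16}" of a vaddps to a ZMM register, the parser
   would record the {1to16} factor in TYPE, the memory operand's index
   in OPERAND, and the 4-byte element size in BYTES.  */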

static struct Broadcast_Operation broadcast_op;

/* VEX prefix.  */
typedef struct
{
  /* VEX prefix is either 2 byte or 3 byte.  EVEX is 4 byte.  */
  unsigned char bytes[4];
  unsigned int length;
  /* Destination or source register specifier.  */
  const reg_entry *register_specifier;
} vex_prefix;

/* 'md_assemble ()' gathers together information and puts it into an
   i386_insn.  */

union i386_op
{
  expressionS *disps;
  expressionS *imms;
  const reg_entry *regs;
};

enum i386_error
{
  operand_size_mismatch,
  operand_type_mismatch,
  register_type_mismatch,
  number_of_operands_mismatch,
  invalid_instruction_suffix,
  bad_imm4,
  unsupported_with_intel_mnemonic,
  unsupported_syntax,
  unsupported,
  invalid_sib_address,
  invalid_vsib_address,
  invalid_vector_register_set,
  invalid_tmm_register_set,
  unsupported_vector_index_register,
  unsupported_broadcast,
  broadcast_needed,
  unsupported_masking,
  mask_not_on_destination,
  no_default_mask,
  unsupported_rc_sae,
  rc_sae_operand_not_last_imm,
  invalid_register_operand,
};

struct _i386_insn
{
  /* TM holds the template for the insn we're currently assembling.  */
  insn_template tm;

  /* SUFFIX holds the instruction size suffix for byte, word, dword
     or qword, if given.  */
  char suffix;

  /* OPERANDS gives the number of given operands.  */
  unsigned int operands;

  /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
     of given register, displacement, memory operands and immediate
     operands.  */
  unsigned int reg_operands, disp_operands, mem_operands, imm_operands;

  /* TYPES [i] is the type (see above #defines) which tells us how to
     use OP[i] for the corresponding operand.  */
  i386_operand_type types[MAX_OPERANDS];

  /* Displacement expression, immediate expression, or register for each
     operand.  */
  union i386_op op[MAX_OPERANDS];

  /* Flags for operands.  */
  unsigned int flags[MAX_OPERANDS];
#define Operand_PCrel 1
#define Operand_Mem   2

  /* Relocation type for operand */
  enum bfd_reloc_code_real reloc[MAX_OPERANDS];

  /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
     the base index byte below.  */
  const reg_entry *base_reg;
  const reg_entry *index_reg;
  unsigned int log2_scale_factor;

  /* SEG gives the seg_entries of this insn.  They are zero unless
     explicit segment overrides are given.  */
  const seg_entry *seg[2];

  /* Copied first memory operand string, for re-checking.  */
  char *memop1_string;

  /* PREFIX holds all the given prefix opcodes (usually null).
     PREFIXES is the number of prefix opcodes.  */
  unsigned int prefixes;
  unsigned char prefix[MAX_PREFIXES];

  /* Register is in low 3 bits of opcode.  */
  bfd_boolean short_form;

  /* The operand to a branch insn indicates an absolute branch.  */
  bfd_boolean jumpabsolute;

  /* Extended states.  */
  enum
    {
      /* Use MMX state.  */
      xstate_mmx = 1 << 0,
      /* Use XMM state.  */
      xstate_xmm = 1 << 1,
      /* Use YMM state.  */
      xstate_ymm = 1 << 2 | xstate_xmm,
      /* Use ZMM state.  */
      xstate_zmm = 1 << 3 | xstate_ymm,
      /* Use TMM state.  */
      xstate_tmm = 1 << 4,
      /* Use MASK state.  */
      xstate_mask = 1 << 5
    } xstate;

  /* Has GOTPC or TLS relocation.  */
  bfd_boolean has_gotpc_tls_reloc;

  /* RM and SIB are the modrm byte and the sib byte where the
     addressing modes of this insn are encoded.  */
  modrm_byte rm;
  rex_byte rex;
  rex_byte vrex;
  sib_byte sib;
  vex_prefix vex;

  /* Masking attributes.  */
  struct Mask_Operation *mask;

  /* Rounding control and SAE attributes.  */
  struct RC_Operation *rounding;

  /* Broadcasting attributes.  */
  struct Broadcast_Operation *broadcast;

  /* Compressed disp8*N attribute.  */
  unsigned int memshift;

  /* Prefer load or store in encoding.  */
  enum
    {
      dir_encoding_default = 0,
      dir_encoding_load,
      dir_encoding_store,
      dir_encoding_swap
    } dir_encoding;

  /* Prefer 8bit, 16bit, 32bit displacement in encoding.  */
  enum
    {
      disp_encoding_default = 0,
      disp_encoding_8bit,
      disp_encoding_16bit,
      disp_encoding_32bit
    } disp_encoding;

  /* Prefer the REX byte in encoding.  */
  bfd_boolean rex_encoding;

  /* Disable instruction size optimization.  */
  bfd_boolean no_optimize;

  /* How to encode vector instructions.  */
  enum
    {
      vex_encoding_default = 0,
      vex_encoding_vex,
      vex_encoding_vex3,
      vex_encoding_evex,
      vex_encoding_error
    } vec_encoding;

  /* REP prefix.  */
  const char *rep_prefix;

  /* HLE prefix.  */
  const char *hle_prefix;

  /* Have BND prefix.  */
  const char *bnd_prefix;

  /* Have NOTRACK prefix.  */
  const char *notrack_prefix;

  /* Error message.  */
  enum i386_error error;
};

typedef struct _i386_insn i386_insn;

/* Link an RC type with its corresponding string, which will be looked
   for in the assembly input.  */
struct RC_name
{
  enum rc_type type;
  const char *name;
  unsigned int len;
};

static const struct RC_name RC_NamesTable[] =
{
  { rne, STRING_COMMA_LEN ("rn-sae") },
  { rd, STRING_COMMA_LEN ("rd-sae") },
  { ru, STRING_COMMA_LEN ("ru-sae") },
  { rz, STRING_COMMA_LEN ("rz-sae") },
  { saeonly, STRING_COMMA_LEN ("sae") },
};

/* List of chars besides those in app.c:symbol_chars that can start an
   operand.  Used to prevent the scrubber eating vital white-space.  */
const char extra_symbol_chars[] = "*%-([{}"
#ifdef LEX_AT
	"@"
#endif
#ifdef LEX_QM
	"?"
#endif
	;

#if ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
     && !defined (TE_GNU) \
     && !defined (TE_LINUX) \
     && !defined (TE_FreeBSD) \
     && !defined (TE_DragonFly) \
     && !defined (TE_NetBSD))
/* This array holds the chars that always start a comment.  If the
   pre-processor is disabled, these aren't very useful.  The option
   --divide will remove '/' from this list.  */
const char *i386_comment_chars = "#/";
#define SVR4_COMMENT_CHARS 1
#define PREFIX_SEPARATOR '\\'

#else
const char *i386_comment_chars = "#";
#define PREFIX_SEPARATOR '/'
#endif

/* This array holds the chars that only start a comment at the beginning of
   a line.  If the line seems to have the form '# 123 filename'
   .line and .file directives will appear in the pre-processed output.
   Note that input_file.c hand checks for '#' at the beginning of the
   first line of the input file.  This is because the compiler outputs
   #NO_APP at the beginning of its output.
   Also note that comments started like this one will always work if
   '/' isn't otherwise defined.  */
const char line_comment_chars[] = "#/";

const char line_separator_chars[] = ";";

/* Chars that can be used to separate mant from exp in floating point
   nums.  */
const char EXP_CHARS[] = "eE";

/* Chars that mean this number is a floating point constant
   As in 0f12.456
   or 0d1.2345e12.  */
const char FLT_CHARS[] = "fFdDxX";

/* Tables for lexical analysis.  */
static char mnemonic_chars[256];
static char register_chars[256];
static char operand_chars[256];
static char identifier_chars[256];
static char digit_chars[256];

/* Lexical macros.  */
#define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
#define is_operand_char(x) (operand_chars[(unsigned char) x])
#define is_register_char(x) (register_chars[(unsigned char) x])
#define is_space_char(x) ((x) == ' ')
#define is_identifier_char(x) (identifier_chars[(unsigned char) x])
#define is_digit_char(x) (digit_chars[(unsigned char) x])

/* All non-digit non-letter characters that may occur in an operand.  */
static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";

/* md_assemble() always leaves the strings it's passed unaltered.  To
   effect this we maintain a stack of saved characters that we've smashed
   with '\0's (indicating end of strings for various sub-fields of the
   assembler instruction).  */
static char save_stack[32];
static char *save_stack_p;
#define END_STRING_AND_SAVE(s) \
	do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
#define RESTORE_END_STRING(s) \
	do { *(s) = *--save_stack_p; } while (0)
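
/* Usage sketch (END_OF_FIELD is a hypothetical pointer into the insn
   string, not a name from this file):

     END_STRING_AND_SAVE (end_of_field);    saves *end_of_field, writes '\0'
     ...parse the now NUL-terminated sub-field...
     RESTORE_END_STRING (end_of_field);     puts the saved byte back

   Calls must nest properly, since save_stack is used as a LIFO stack
   of at most 32 saved characters.  */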

/* The instruction we're assembling.  */
static i386_insn i;

/* Possible templates for current insn.  */
static const templates *current_templates;

/* Per instruction expressionS buffers: max displacements & immediates.  */
static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];

/* Current operand we are working on.  */
static int this_operand = -1;

/* We support three different modes.  The FLAG_CODE variable is used to
   distinguish these.  */

enum flag_code {
	CODE_32BIT,
	CODE_16BIT,
	CODE_64BIT };

static enum flag_code flag_code;
static unsigned int object_64bit;
static unsigned int disallow_64bit_reloc;
static int use_rela_relocations = 0;
/* __tls_get_addr/___tls_get_addr symbol for TLS.  */
static const char *tls_get_addr;

#if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
     || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
     || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))

/* The ELF ABI to use.  */
enum x86_elf_abi
{
  I386_ABI,
  X86_64_ABI,
  X86_64_X32_ABI
};

static enum x86_elf_abi x86_elf_abi = I386_ABI;
#endif

#if defined (TE_PE) || defined (TE_PEP)
/* Use big object file format.  */
static int use_big_obj = 0;
#endif

#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
/* 1 if generating code for a shared library.  */
static int shared = 0;
#endif

/* 1 for intel syntax,
   0 if att syntax.  */
static int intel_syntax = 0;

static enum x86_64_isa
{
  amd64 = 1,	/* AMD64 ISA.  */
  intel64	/* Intel64 ISA.  */
} isa64;

/* 1 for intel mnemonic,
   0 if att mnemonic.  */
static int intel_mnemonic = !SYSV386_COMPAT;

/* 1 if pseudo registers are permitted.  */
static int allow_pseudo_reg = 0;

/* 1 if register prefix % not required.  */
static int allow_naked_reg = 0;

/* 1 if the assembler should add BND prefix for all control-transferring
   instructions supporting it, even if this prefix wasn't specified
   explicitly.  */
static int add_bnd_prefix = 0;

/* 1 if pseudo index register, eiz/riz, is allowed.  */
static int allow_index_reg = 0;

/* 1 if the assembler should ignore LOCK prefix, even if it was
   specified explicitly.  */
static int omit_lock_prefix = 0;

/* 1 if the assembler should encode lfence, mfence, and sfence as
   "lock addl $0, (%{re}sp)".  */
static int avoid_fence = 0;

/* 1 if lfence should be inserted after every load.  */
static int lfence_after_load = 0;

/* Non-zero if lfence should be inserted before indirect branch.  */
static enum lfence_before_indirect_branch_kind
  {
    lfence_branch_none = 0,
    lfence_branch_register,
    lfence_branch_memory,
    lfence_branch_all
  }
lfence_before_indirect_branch;

/* Non-zero if lfence should be inserted before ret.  */
static enum lfence_before_ret_kind
  {
    lfence_before_ret_none = 0,
    lfence_before_ret_not,
    lfence_before_ret_or,
    lfence_before_ret_shl
  }
lfence_before_ret;

/* Records whether the previous "instruction" was a .byte directive or
   a prefix.  */
static struct
  {
    segT seg;
    const char *file;
    const char *name;
    unsigned int line;
    enum last_insn_kind
      {
	last_insn_other = 0,
	last_insn_directive,
	last_insn_prefix
      } kind;
  } last_insn;

/* 1 if the assembler should generate relax relocations.  */

static int generate_relax_relocations
  = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;

static enum check_kind
  {
    check_none = 0,
    check_warning,
    check_error
  }
sse_check, operand_check = check_warning;

/* Non-zero if branches should be aligned within a power-of-2 boundary.  */
static int align_branch_power = 0;

/* Types of branches to align.  */
enum align_branch_kind
  {
    align_branch_none = 0,
    align_branch_jcc = 1,
    align_branch_fused = 2,
    align_branch_jmp = 3,
    align_branch_call = 4,
    align_branch_indirect = 5,
    align_branch_ret = 6
  };

/* Type bits of branches to align.  */
enum align_branch_bit
  {
    align_branch_jcc_bit = 1 << align_branch_jcc,
    align_branch_fused_bit = 1 << align_branch_fused,
    align_branch_jmp_bit = 1 << align_branch_jmp,
    align_branch_call_bit = 1 << align_branch_call,
    align_branch_indirect_bit = 1 << align_branch_indirect,
    align_branch_ret_bit = 1 << align_branch_ret
  };

static unsigned int align_branch = (align_branch_jcc_bit
				    | align_branch_fused_bit
				    | align_branch_jmp_bit);

/* Types of conditional jump used by macro-fusion.  */
enum mf_jcc_kind
  {
    mf_jcc_jo = 0,  /* base opcode 0x70  */
    mf_jcc_jc,      /* base opcode 0x72  */
    mf_jcc_je,      /* base opcode 0x74  */
    mf_jcc_jna,     /* base opcode 0x76  */
    mf_jcc_js,      /* base opcode 0x78  */
    mf_jcc_jp,      /* base opcode 0x7a  */
    mf_jcc_jl,      /* base opcode 0x7c  */
    mf_jcc_jle,     /* base opcode 0x7e  */
  };

/* Types of compare flag-modifying instructions used by macro-fusion.  */
enum mf_cmp_kind
  {
    mf_cmp_test_and,  /* test/cmp */
    mf_cmp_alu_cmp,   /* add/sub/cmp */
    mf_cmp_incdec     /* inc/dec */
  };

/* The maximum padding size for fused jcc.  A CMP-like instruction can
   be 9 bytes and a jcc can be 6 bytes.  Leave room just in case for
   prefixes.  */
#define MAX_FUSED_JCC_PADDING_SIZE 20

/* The maximum number of prefixes added for an instruction.  */
static unsigned int align_branch_prefix_size = 5;

/* Optimization:
   1. Clear the REX_W bit with register operand if possible.
   2. Above plus use 128bit vector instruction to clear the full vector
      register.
 */
static int optimize = 0;

/* Optimization:
   1. Clear the REX_W bit with register operand if possible.
   2. Above plus use 128bit vector instruction to clear the full vector
      register.
   3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
      "testb $imm7,%r8".
 */
static int optimize_for_space = 0;

/* Register prefix used for error message.  */
static const char *register_prefix = "%";

/* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
   leave, push, and pop instructions so that gcc has the same stack
   frame as in 32 bit mode.  */
static char stackop_size = '\0';

/* Non-zero to optimize code alignment.  */
int optimize_align_code = 1;

/* Non-zero to quieten some warnings.  */
static int quiet_warnings = 0;

/* CPU name.  */
static const char *cpu_arch_name = NULL;
static char *cpu_sub_arch_name = NULL;

/* CPU feature flags.  */
static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;

/* If we have selected a cpu we are generating instructions for.  */
static int cpu_arch_tune_set = 0;

/* Cpu we are generating instructions for.  */
enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;

/* CPU feature flags of cpu we are generating instructions for.  */
static i386_cpu_flags cpu_arch_tune_flags;

/* CPU instruction set architecture used.  */
enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;

/* CPU feature flags of instruction set architecture used.  */
i386_cpu_flags cpu_arch_isa_flags;

/* If set, conditional jumps are not automatically promoted to handle
   larger than a byte offset.  */
static unsigned int no_cond_jump_promotion = 0;

/* Encode SSE instructions with VEX prefix.  */
static unsigned int sse2avx;

/* Encode scalar AVX instructions with specific vector length.  */
static enum
  {
    vex128 = 0,
    vex256
  } avxscalar;

/* Encode VEX WIG instructions with specific vex.w.  */
static enum
  {
    vexw0 = 0,
    vexw1
  } vexwig;

/* Encode scalar EVEX LIG instructions with specific vector length.  */
static enum
  {
    evexl128 = 0,
    evexl256,
    evexl512
  } evexlig;

/* Encode EVEX WIG instructions with specific evex.w.  */
static enum
  {
    evexw0 = 0,
    evexw1
  } evexwig;

/* Value to encode in EVEX RC bits, for SAE-only instructions.  */
static enum rc_type evexrcig = rne;

/* Pre-defined "_GLOBAL_OFFSET_TABLE_".  */
static symbolS *GOT_symbol;

/* The dwarf2 return column, adjusted for 32 or 64 bit.  */
unsigned int x86_dwarf2_return_column;

/* The dwarf2 data alignment, adjusted for 32 or 64 bit.  */
int x86_cie_data_alignment;

/* Interface to relax_segment.
   There are 3 major relax states for 386 jump insns because the
   different types of jumps add different sizes to frags when we're
   figuring out what sort of jump to choose to reach a given label.

   BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
   branches which are handled by md_estimate_size_before_relax() and
   i386_generic_table_relax_frag().  */

/* Types.  */
#define UNCOND_JUMP 0
#define COND_JUMP 1
#define COND_JUMP86 2
#define BRANCH_PADDING 3
#define BRANCH_PREFIX 4
#define FUSED_JCC_PADDING 5

/* Sizes.  */
#define CODE16	1
#define SMALL	0
#define SMALL16 (SMALL | CODE16)
#define BIG	2
#define BIG16	(BIG | CODE16)

#ifndef INLINE
#ifdef __GNUC__
#define INLINE __inline__
#else
#define INLINE
#endif
#endif

#define ENCODE_RELAX_STATE(type, size) \
  ((relax_substateT) (((type) << 2) | (size)))
#define TYPE_FROM_RELAX_STATE(s) \
  ((s) >> 2)
#define DISP_SIZE_FROM_RELAX_STATE(s) \
    ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
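
/* Worked example (sketch): ENCODE_RELAX_STATE (COND_JUMP, BIG) yields
   (1 << 2) | 2 == 6, from which TYPE_FROM_RELAX_STATE recovers
   6 >> 2 == COND_JUMP and DISP_SIZE_FROM_RELAX_STATE recovers a 4-byte
   displacement, since (6 & 3) == BIG.  */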

/* This table is used by relax_frag to promote short jumps to long
   ones where necessary.  SMALL (short) jumps may be promoted to BIG
   (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long).  We
   don't allow a short jump in a 32 bit code segment to be promoted to
   a 16 bit offset jump because it's slower (requires data size
   prefix), and doesn't work, unless the destination is in the bottom
   64k of the code segment (The top 16 bits of eip are zeroed).  */

const relax_typeS md_relax_table[] =
{
  /* The fields are:
     1) most positive reach of this state,
     2) most negative reach of this state,
     3) how many bytes this mode will have in the variable part of the frag
     4) which index into the table to try if we can't fit into this one.  */

  /* UNCOND_JUMP states.  */
  {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
  {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
  /* dword jmp adds 4 bytes to frag:
     0 extra opcode bytes, 4 displacement bytes.  */
  {0, 0, 4, 0},
  /* word jmp adds 2 bytes to frag:
     0 extra opcode bytes, 2 displacement bytes.  */
  {0, 0, 2, 0},

  /* COND_JUMP states.  */
  {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
  {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
  /* dword conditionals add 5 bytes to frag:
     1 extra opcode byte, 4 displacement bytes.  */
  {0, 0, 5, 0},
  /* word conditionals add 3 bytes to frag:
     1 extra opcode byte, 2 displacement bytes.  */
  {0, 0, 3, 0},

  /* COND_JUMP86 states.  */
  {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
  {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
  /* dword conditionals add 5 bytes to frag:
     1 extra opcode byte, 4 displacement bytes.  */
  {0, 0, 5, 0},
  /* word conditionals add 4 bytes to frag:
     1 displacement byte and a 3 byte long branch insn.  */
  {0, 0, 4, 0}
};
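
/* Reading the table (illustrative sketch): a conditional jump starts
   in state ENCODE_RELAX_STATE (COND_JUMP, SMALL) == 4; that entry says
   a 1-byte displacement reaches at most +128/-127 bytes.  If the
   target is out of range, relax_frag follows field 4) to
   ENCODE_RELAX_STATE (COND_JUMP, BIG) == 6, the {0, 0, 5, 0} entry,
   growing the frag by the 5 bytes of the dword form.  */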

static const arch_entry cpu_arch[] =
{
  /* Do not replace the first two entries - i386_target_format()
     relies on them being there in this order.  */
  { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
    CPU_GENERIC32_FLAGS, 0 },
  { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
    CPU_GENERIC64_FLAGS, 0 },
  { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
    CPU_NONE_FLAGS, 0 },
  { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
    CPU_I186_FLAGS, 0 },
  { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
    CPU_I286_FLAGS, 0 },
  { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
    CPU_I386_FLAGS, 0 },
  { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
    CPU_I486_FLAGS, 0 },
  { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
    CPU_I586_FLAGS, 0 },
  { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
    CPU_I686_FLAGS, 0 },
  { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
    CPU_I586_FLAGS, 0 },
  { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
    CPU_PENTIUMPRO_FLAGS, 0 },
  { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
    CPU_P2_FLAGS, 0 },
  { STRING_COMMA_LEN ("pentiumiii"), PROCESSOR_PENTIUMPRO,
    CPU_P3_FLAGS, 0 },
  { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
    CPU_P4_FLAGS, 0 },
  { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
    CPU_CORE_FLAGS, 0 },
  { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
    CPU_NOCONA_FLAGS, 0 },
  { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
    CPU_CORE_FLAGS, 1 },
  { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
    CPU_CORE_FLAGS, 0 },
  { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
    CPU_CORE2_FLAGS, 1 },
  { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
    CPU_CORE2_FLAGS, 0 },
  { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
    CPU_COREI7_FLAGS, 0 },
  { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
    CPU_L1OM_FLAGS, 0 },
  { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
    CPU_K1OM_FLAGS, 0 },
  { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
    CPU_IAMCU_FLAGS, 0 },
  { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
    CPU_K6_FLAGS, 0 },
  { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
    CPU_K6_2_FLAGS, 0 },
  { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
    CPU_ATHLON_FLAGS, 0 },
  { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
    CPU_K8_FLAGS, 1 },
  { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
    CPU_K8_FLAGS, 0 },
  { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
    CPU_K8_FLAGS, 0 },
  { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
    CPU_AMDFAM10_FLAGS, 0 },
  { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
    CPU_BDVER1_FLAGS, 0 },
  { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
    CPU_BDVER2_FLAGS, 0 },
  { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
    CPU_BDVER3_FLAGS, 0 },
  { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
    CPU_BDVER4_FLAGS, 0 },
  { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
    CPU_ZNVER1_FLAGS, 0 },
  { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
    CPU_ZNVER2_FLAGS, 0 },
  { STRING_COMMA_LEN ("znver3"), PROCESSOR_ZNVER,
    CPU_ZNVER3_FLAGS, 0 },
  { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
    CPU_BTVER1_FLAGS, 0 },
  { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
    CPU_BTVER2_FLAGS, 0 },
  { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
    CPU_8087_FLAGS, 0 },
  { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
    CPU_287_FLAGS, 0 },
  { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
    CPU_387_FLAGS, 0 },
  { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
    CPU_687_FLAGS, 0 },
  { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
    CPU_CMOV_FLAGS, 0 },
  { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
    CPU_FXSR_FLAGS, 0 },
  { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
    CPU_MMX_FLAGS, 0 },
  { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
    CPU_SSE_FLAGS, 0 },
  { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
    CPU_SSE2_FLAGS, 0 },
  { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
    CPU_SSE3_FLAGS, 0 },
  { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
    CPU_SSE4A_FLAGS, 0 },
  { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
    CPU_SSSE3_FLAGS, 0 },
  { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
    CPU_SSE4_1_FLAGS, 0 },
  { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
    CPU_SSE4_2_FLAGS, 0 },
  { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
    CPU_SSE4_2_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
    CPU_AVX_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
    CPU_AVX2_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
    CPU_AVX512F_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
    CPU_AVX512CD_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
    CPU_AVX512ER_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
    CPU_AVX512PF_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
    CPU_AVX512DQ_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
    CPU_AVX512BW_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
    CPU_AVX512VL_FLAGS, 0 },
  { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
    CPU_VMX_FLAGS, 0 },
  { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
    CPU_VMFUNC_FLAGS, 0 },
  { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
    CPU_SMX_FLAGS, 0 },
  { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
    CPU_XSAVE_FLAGS, 0 },
  { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
    CPU_XSAVEOPT_FLAGS, 0 },
  { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
    CPU_XSAVEC_FLAGS, 0 },
  { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
    CPU_XSAVES_FLAGS, 0 },
  { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
    CPU_AES_FLAGS, 0 },
  { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
    CPU_PCLMUL_FLAGS, 0 },
  { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
    CPU_PCLMUL_FLAGS, 1 },
  { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
    CPU_FSGSBASE_FLAGS, 0 },
  { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
    CPU_RDRND_FLAGS, 0 },
  { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
    CPU_F16C_FLAGS, 0 },
  { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
    CPU_BMI2_FLAGS, 0 },
  { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
    CPU_FMA_FLAGS, 0 },
  { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
    CPU_FMA4_FLAGS, 0 },
  { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
    CPU_XOP_FLAGS, 0 },
  { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
    CPU_LWP_FLAGS, 0 },
  { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
    CPU_MOVBE_FLAGS, 0 },
  { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
    CPU_CX16_FLAGS, 0 },
  { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
    CPU_EPT_FLAGS, 0 },
  { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
    CPU_LZCNT_FLAGS, 0 },
  { STRING_COMMA_LEN (".popcnt"), PROCESSOR_UNKNOWN,
    CPU_POPCNT_FLAGS, 0 },
  { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
    CPU_HLE_FLAGS, 0 },
  { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
    CPU_RTM_FLAGS, 0 },
  { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
    CPU_INVPCID_FLAGS, 0 },
  { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
    CPU_CLFLUSH_FLAGS, 0 },
  { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
    CPU_NOP_FLAGS, 0 },
  { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
    CPU_SYSCALL_FLAGS, 0 },
  { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
    CPU_RDTSCP_FLAGS, 0 },
  { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
    CPU_3DNOW_FLAGS, 0 },
  { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
    CPU_3DNOWA_FLAGS, 0 },
  { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
    CPU_PADLOCK_FLAGS, 0 },
  { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
    CPU_SVME_FLAGS, 1 },
  { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
    CPU_SVME_FLAGS, 0 },
  { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
    CPU_SSE4A_FLAGS, 0 },
  { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
    CPU_ABM_FLAGS, 0 },
  { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
    CPU_BMI_FLAGS, 0 },
  { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
    CPU_TBM_FLAGS, 0 },
  { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
    CPU_ADX_FLAGS, 0 },
  { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
    CPU_RDSEED_FLAGS, 0 },
  { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
    CPU_PRFCHW_FLAGS, 0 },
  { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
    CPU_SMAP_FLAGS, 0 },
  { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
    CPU_MPX_FLAGS, 0 },
  { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
    CPU_SHA_FLAGS, 0 },
  { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
    CPU_CLFLUSHOPT_FLAGS, 0 },
  { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
    CPU_PREFETCHWT1_FLAGS, 0 },
  { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
    CPU_SE1_FLAGS, 0 },
  { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
    CPU_CLWB_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
    CPU_AVX512IFMA_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
    CPU_AVX512VBMI_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
    CPU_AVX512_4FMAPS_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
    CPU_AVX512_4VNNIW_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
    CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
    CPU_AVX512_VBMI2_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
    CPU_AVX512_VNNI_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
    CPU_AVX512_BITALG_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx_vnni"), PROCESSOR_UNKNOWN,
    CPU_AVX_VNNI_FLAGS, 0 },
  { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
    CPU_CLZERO_FLAGS, 0 },
  { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
    CPU_MWAITX_FLAGS, 0 },
  { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
    CPU_OSPKE_FLAGS, 0 },
  { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
    CPU_RDPID_FLAGS, 0 },
  { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
    CPU_PTWRITE_FLAGS, 0 },
  { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
    CPU_IBT_FLAGS, 0 },
  { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
    CPU_SHSTK_FLAGS, 0 },
  { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
    CPU_GFNI_FLAGS, 0 },
  { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
    CPU_VAES_FLAGS, 0 },
  { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
    CPU_VPCLMULQDQ_FLAGS, 0 },
  { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
    CPU_WBNOINVD_FLAGS, 0 },
  { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
    CPU_PCONFIG_FLAGS, 0 },
  { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
    CPU_WAITPKG_FLAGS, 0 },
  { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
    CPU_CLDEMOTE_FLAGS, 0 },
  { STRING_COMMA_LEN (".amx_int8"), PROCESSOR_UNKNOWN,
    CPU_AMX_INT8_FLAGS, 0 },
  { STRING_COMMA_LEN (".amx_bf16"), PROCESSOR_UNKNOWN,
    CPU_AMX_BF16_FLAGS, 0 },
  { STRING_COMMA_LEN (".amx_tile"), PROCESSOR_UNKNOWN,
    CPU_AMX_TILE_FLAGS, 0 },
  { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
    CPU_MOVDIRI_FLAGS, 0 },
  { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
    CPU_MOVDIR64B_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
    CPU_AVX512_BF16_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
    CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
  { STRING_COMMA_LEN (".tdx"), PROCESSOR_UNKNOWN,
    CPU_TDX_FLAGS, 0 },
  { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
    CPU_ENQCMD_FLAGS, 0 },
  { STRING_COMMA_LEN (".serialize"), PROCESSOR_UNKNOWN,
    CPU_SERIALIZE_FLAGS, 0 },
  { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
    CPU_RDPRU_FLAGS, 0 },
  { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
    CPU_MCOMMIT_FLAGS, 0 },
  { STRING_COMMA_LEN (".sev_es"), PROCESSOR_UNKNOWN,
    CPU_SEV_ES_FLAGS, 0 },
  { STRING_COMMA_LEN (".tsxldtrk"), PROCESSOR_UNKNOWN,
    CPU_TSXLDTRK_FLAGS, 0 },
  { STRING_COMMA_LEN (".kl"), PROCESSOR_UNKNOWN,
    CPU_KL_FLAGS, 0 },
  { STRING_COMMA_LEN (".widekl"), PROCESSOR_UNKNOWN,
    CPU_WIDEKL_FLAGS, 0 },
  { STRING_COMMA_LEN (".uintr"), PROCESSOR_UNKNOWN,
    CPU_UINTR_FLAGS, 0 },
  { STRING_COMMA_LEN (".hreset"), PROCESSOR_UNKNOWN,
    CPU_HRESET_FLAGS, 0 },
};

static const noarch_entry cpu_noarch[] =
{
  { STRING_COMMA_LEN ("no87"), CPU_ANY_X87_FLAGS },
  { STRING_COMMA_LEN ("no287"), CPU_ANY_287_FLAGS },
  { STRING_COMMA_LEN ("no387"), CPU_ANY_387_FLAGS },
  { STRING_COMMA_LEN ("no687"), CPU_ANY_687_FLAGS },
  { STRING_COMMA_LEN ("nocmov"), CPU_ANY_CMOV_FLAGS },
  { STRING_COMMA_LEN ("nofxsr"), CPU_ANY_FXSR_FLAGS },
  { STRING_COMMA_LEN ("nommx"), CPU_ANY_MMX_FLAGS },
  { STRING_COMMA_LEN ("nosse"), CPU_ANY_SSE_FLAGS },
  { STRING_COMMA_LEN ("nosse2"), CPU_ANY_SSE2_FLAGS },
  { STRING_COMMA_LEN ("nosse3"), CPU_ANY_SSE3_FLAGS },
  { STRING_COMMA_LEN ("nosse4a"), CPU_ANY_SSE4A_FLAGS },
  { STRING_COMMA_LEN ("nossse3"), CPU_ANY_SSSE3_FLAGS },
  { STRING_COMMA_LEN ("nosse4.1"), CPU_ANY_SSE4_1_FLAGS },
  { STRING_COMMA_LEN ("nosse4.2"), CPU_ANY_SSE4_2_FLAGS },
  { STRING_COMMA_LEN ("nosse4"), CPU_ANY_SSE4_1_FLAGS },
  { STRING_COMMA_LEN ("noavx"), CPU_ANY_AVX_FLAGS },
  { STRING_COMMA_LEN ("noavx2"), CPU_ANY_AVX2_FLAGS },
  { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
  { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
  { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
  { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
  { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
  { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
  { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
  { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
  { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
  { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
  { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
  { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
  { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
  { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
  { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
  { STRING_COMMA_LEN ("noavx_vnni"), CPU_ANY_AVX_VNNI_FLAGS },
  { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
  { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
  { STRING_COMMA_LEN ("noamx_int8"), CPU_ANY_AMX_INT8_FLAGS },
  { STRING_COMMA_LEN ("noamx_bf16"), CPU_ANY_AMX_BF16_FLAGS },
  { STRING_COMMA_LEN ("noamx_tile"), CPU_ANY_AMX_TILE_FLAGS },
  { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
  { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
  { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
  { STRING_COMMA_LEN ("noavx512_vp2intersect"),
    CPU_ANY_AVX512_VP2INTERSECT_FLAGS },
  { STRING_COMMA_LEN ("notdx"), CPU_ANY_TDX_FLAGS },
  { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
  { STRING_COMMA_LEN ("noserialize"), CPU_ANY_SERIALIZE_FLAGS },
  { STRING_COMMA_LEN ("notsxldtrk"), CPU_ANY_TSXLDTRK_FLAGS },
  { STRING_COMMA_LEN ("nokl"), CPU_ANY_KL_FLAGS },
  { STRING_COMMA_LEN ("nowidekl"), CPU_ANY_WIDEKL_FLAGS },
  { STRING_COMMA_LEN ("nouintr"), CPU_ANY_UINTR_FLAGS },
  { STRING_COMMA_LEN ("nohreset"), CPU_ANY_HRESET_FLAGS },
};

#ifdef I386COFF
/* Like s_lcomm_internal in gas/read.c but the alignment string
   is allowed to be optional.  */

static symbolS *
pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
{
  addressT align = 0;

  SKIP_WHITESPACE ();

  if (needs_align
      && *input_line_pointer == ',')
    {
      align = parse_align (needs_align - 1);

      if (align == (addressT) -1)
	return NULL;
    }
  else
    {
      if (size >= 8)
	align = 3;
      else if (size >= 4)
	align = 2;
      else if (size >= 2)
	align = 1;
      else
	align = 0;
    }

  bss_alloc (symbolP, size, align);
  return symbolP;
}

static void
pe_lcomm (int needs_align)
{
  s_comm_internal (needs_align * 2, pe_lcomm_internal);
}
#endif

const pseudo_typeS md_pseudo_table[] =
{
#if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
  {"align", s_align_bytes, 0},
#else
  {"align", s_align_ptwo, 0},
#endif
  {"arch", set_cpu_arch, 0},
#ifndef I386COFF
  {"bss", s_bss, 0},
#else
  {"lcomm", pe_lcomm, 1},
#endif
  {"ffloat", float_cons, 'f'},
  {"dfloat", float_cons, 'd'},
  {"tfloat", float_cons, 'x'},
  {"value", cons, 2},
  {"slong", signed_cons, 4},
  {"noopt", s_ignore, 0},
  {"optim", s_ignore, 0},
  {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
  {"code16", set_code_flag, CODE_16BIT},
  {"code32", set_code_flag, CODE_32BIT},
#ifdef BFD64
  {"code64", set_code_flag, CODE_64BIT},
#endif
  {"intel_syntax", set_intel_syntax, 1},
  {"att_syntax", set_intel_syntax, 0},
  {"intel_mnemonic", set_intel_mnemonic, 1},
  {"att_mnemonic", set_intel_mnemonic, 0},
  {"allow_index_reg", set_allow_index_reg, 1},
  {"disallow_index_reg", set_allow_index_reg, 0},
  {"sse_check", set_check, 0},
  {"operand_check", set_check, 1},
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
  {"largecomm", handle_large_common, 0},
#else
  {"file", dwarf2_directive_file, 0},
  {"loc", dwarf2_directive_loc, 0},
  {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
#endif
#ifdef TE_PE
  {"secrel32", pe_directive_secrel, 0},
#endif
  {0, 0, 0}
};

/* For interface with expression ().  */
extern char *input_line_pointer;

/* Hash table for instruction mnemonic lookup.  */
static htab_t op_hash;

/* Hash table for register lookup.  */
static htab_t reg_hash;
\f
/* Various efficient no-op patterns for aligning code labels.
   Note: Don't try to assemble the instructions in the comments.
   0L and 0w are not legal.  */
static const unsigned char f32_1[] =
  {0x90};				/* nop			*/
static const unsigned char f32_2[] =
  {0x66,0x90};				/* xchg %ax,%ax		*/
static const unsigned char f32_3[] =
  {0x8d,0x76,0x00};			/* leal 0(%esi),%esi	*/
static const unsigned char f32_4[] =
  {0x8d,0x74,0x26,0x00};		/* leal 0(%esi,1),%esi	*/
static const unsigned char f32_6[] =
  {0x8d,0xb6,0x00,0x00,0x00,0x00};	/* leal 0L(%esi),%esi	*/
static const unsigned char f32_7[] =
  {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00};	/* leal 0L(%esi,1),%esi	*/
static const unsigned char f16_3[] =
  {0x8d,0x74,0x00};			/* lea 0(%si),%si	*/
static const unsigned char f16_4[] =
  {0x8d,0xb4,0x00,0x00};		/* lea 0W(%si),%si	*/
static const unsigned char jump_disp8[] =
  {0xeb};				/* jmp disp8		*/
static const unsigned char jump32_disp32[] =
  {0xe9};				/* jmp disp32		*/
static const unsigned char jump16_disp32[] =
  {0x66,0xe9};				/* jmp disp32		*/
/* 32-bit NOPs patterns.  */
static const unsigned char *const f32_patt[] = {
  f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
};
/* 16-bit NOPs patterns.  */
static const unsigned char *const f16_patt[] = {
  f32_1, f32_2, f16_3, f16_4
};
/* nopl (%[re]ax) */
static const unsigned char alt_3[] =
  {0x0f,0x1f,0x00};
/* nopl 0(%[re]ax) */
static const unsigned char alt_4[] =
  {0x0f,0x1f,0x40,0x00};
/* nopl 0(%[re]ax,%[re]ax,1) */
static const unsigned char alt_5[] =
  {0x0f,0x1f,0x44,0x00,0x00};
/* nopw 0(%[re]ax,%[re]ax,1) */
static const unsigned char alt_6[] =
  {0x66,0x0f,0x1f,0x44,0x00,0x00};
/* nopl 0L(%[re]ax) */
static const unsigned char alt_7[] =
  {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
/* nopl 0L(%[re]ax,%[re]ax,1) */
static const unsigned char alt_8[] =
  {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
/* nopw 0L(%[re]ax,%[re]ax,1) */
static const unsigned char alt_9[] =
  {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
/* nopw %cs:0L(%[re]ax,%[re]ax,1) */
static const unsigned char alt_10[] =
  {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
/* data16 nopw %cs:0L(%eax,%eax,1) */
static const unsigned char alt_11[] =
  {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
/* 32-bit and 64-bit NOPs patterns.  */
static const unsigned char *const alt_patt[] = {
  f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
  alt_9, alt_10, alt_11
};
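
/* Example (sketch): a 4-byte fill taken from alt_patt ends up using
   alt_patt[4 - 1], i.e. the single 4-byte instruction "nopl 0(%[re]ax)"
   (0f 1f 40 00), rather than four 1-byte 0x90 NOPs.  */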

/* Generate COUNT bytes of NOPs to WHERE from PATT with the maximum
   size of a single NOP instruction MAX_SINGLE_NOP_SIZE.  */

static void
i386_output_nops (char *where, const unsigned char *const *patt,
		  int count, int max_single_nop_size)

{
  /* Place the longer NOP first.  */
  int last;
  int offset;
  const unsigned char *nops;

  if (max_single_nop_size < 1)
    {
      as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
		max_single_nop_size);
      return;
    }

  nops = patt[max_single_nop_size - 1];

  /* Use the smaller one if the requested one isn't available.  */
  if (nops == NULL)
    {
      max_single_nop_size--;
      nops = patt[max_single_nop_size - 1];
    }

  last = count % max_single_nop_size;

  count -= last;
  for (offset = 0; offset < count; offset += max_single_nop_size)
    memcpy (where + offset, nops, max_single_nop_size);

  if (last)
    {
      nops = patt[last - 1];
      if (nops == NULL)
	{
	  /* Use the smaller one plus one-byte NOP if the needed one
	     isn't available.  */
	  last--;
	  nops = patt[last - 1];
	  memcpy (where + offset, nops, last);
	  where[offset + last] = *patt[0];
	}
      else
	memcpy (where + offset, nops, last);
    }
}
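
/* Worked example (sketch): with f32_patt and count == 9,
   max_single_nop_size == 7, the loop emits one 7-byte NOP (f32_7) and
   the remainder of 2 bytes is covered by f32_patt[2 - 1], the 2-byte
   "xchg %ax,%ax"; a remainder of 5 would instead fall back to
   f32_patt[4 - 1] plus a single 0x90, since f32_patt[5 - 1] is NULL.  */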

static INLINE int
fits_in_imm7 (offsetT num)
{
  return (num & 0x7f) == num;
}

static INLINE int
fits_in_imm31 (offsetT num)
{
  return (num & 0x7fffffff) == num;
}
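
/* Note (illustrative): these are non-negative range checks, e.g.
   fits_in_imm7 (127) is true but fits_in_imm7 (-1) is false, since
   masking a negative offsetT clears its sign bits and the equality
   comparison then fails.  */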
1535
1536 /* Genenerate COUNT bytes of NOPs to WHERE with the maximum size of a
1537 single NOP instruction LIMIT. */
1538
1539 void
1540 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1541 {
1542 const unsigned char *const *patt = NULL;
1543 int max_single_nop_size;
1544 /* Maximum number of NOPs before switching to jump over NOPs. */
1545 int max_number_of_nops;
1546
1547 switch (fragP->fr_type)
1548 {
1549 case rs_fill_nop:
1550 case rs_align_code:
1551 break;
1552 case rs_machine_dependent:
1553 /* Allow NOP padding for jumps and calls. */
1554 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
1555 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
1556 break;
1557 /* Fall through. */
1558 default:
1559 return;
1560 }
1561
1562 /* We need to decide which NOP sequence to use for 32bit and
1563 64bit. When -mtune= is used:
1564
1565 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1566 PROCESSOR_GENERIC32, f32_patt will be used.
1567 2. For the rest, alt_patt will be used.
1568
1569 When -mtune= isn't used, alt_patt will be used if
1570 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
1571 be used.
1572
1573 When -march= or .arch is used, we can't use anything beyond
1574 cpu_arch_isa_flags. */
1575
1576 if (flag_code == CODE_16BIT)
1577 {
1578 patt = f16_patt;
1579 max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1580 /* Limit number of NOPs to 2 in 16-bit mode. */
1581 max_number_of_nops = 2;
1582 }
1583 else
1584 {
1585 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1586 {
1587 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1588 switch (cpu_arch_tune)
1589 {
1590 case PROCESSOR_UNKNOWN:
1591 /* We use cpu_arch_isa_flags to check if we SHOULD
1592 optimize with nops. */
1593 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1594 patt = alt_patt;
1595 else
1596 patt = f32_patt;
1597 break;
1598 case PROCESSOR_PENTIUM4:
1599 case PROCESSOR_NOCONA:
1600 case PROCESSOR_CORE:
1601 case PROCESSOR_CORE2:
1602 case PROCESSOR_COREI7:
1603 case PROCESSOR_L1OM:
1604 case PROCESSOR_K1OM:
1605 case PROCESSOR_GENERIC64:
1606 case PROCESSOR_K6:
1607 case PROCESSOR_ATHLON:
1608 case PROCESSOR_K8:
1609 case PROCESSOR_AMDFAM10:
1610 case PROCESSOR_BD:
1611 case PROCESSOR_ZNVER:
1612 case PROCESSOR_BT:
1613 patt = alt_patt;
1614 break;
1615 case PROCESSOR_I386:
1616 case PROCESSOR_I486:
1617 case PROCESSOR_PENTIUM:
1618 case PROCESSOR_PENTIUMPRO:
1619 case PROCESSOR_IAMCU:
1620 case PROCESSOR_GENERIC32:
1621 patt = f32_patt;
1622 break;
1623 }
1624 }
1625 else
1626 {
1627 switch (fragP->tc_frag_data.tune)
1628 {
1629 case PROCESSOR_UNKNOWN:
1630 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1631 PROCESSOR_UNKNOWN. */
1632 abort ();
1633 break;
1634
1635 case PROCESSOR_I386:
1636 case PROCESSOR_I486:
1637 case PROCESSOR_PENTIUM:
1638 case PROCESSOR_IAMCU:
1639 case PROCESSOR_K6:
1640 case PROCESSOR_ATHLON:
1641 case PROCESSOR_K8:
1642 case PROCESSOR_AMDFAM10:
1643 case PROCESSOR_BD:
1644 case PROCESSOR_ZNVER:
1645 case PROCESSOR_BT:
1646 case PROCESSOR_GENERIC32:
1647 /* We use cpu_arch_isa_flags to check if we CAN optimize
1648 with nops. */
1649 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1650 patt = alt_patt;
1651 else
1652 patt = f32_patt;
1653 break;
1654 case PROCESSOR_PENTIUMPRO:
1655 case PROCESSOR_PENTIUM4:
1656 case PROCESSOR_NOCONA:
1657 case PROCESSOR_CORE:
1658 case PROCESSOR_CORE2:
1659 case PROCESSOR_COREI7:
1660 case PROCESSOR_L1OM:
1661 case PROCESSOR_K1OM:
1662 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1663 patt = alt_patt;
1664 else
1665 patt = f32_patt;
1666 break;
1667 case PROCESSOR_GENERIC64:
1668 patt = alt_patt;
1669 break;
1670 }
1671 }
1672
1673 if (patt == f32_patt)
1674 {
1675 max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1676 /* Limit number of NOPs to 2 for older processors. */
1677 max_number_of_nops = 2;
1678 }
1679 else
1680 {
1681 max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1682 /* Limit number of NOPs to 7 for newer processors. */
1683 max_number_of_nops = 7;
1684 }
1685 }
1686
1687 if (limit == 0)
1688 limit = max_single_nop_size;
1689
1690 if (fragP->fr_type == rs_fill_nop)
1691 {
1692 /* Output NOPs for .nop directive. */
1693 if (limit > max_single_nop_size)
1694 {
1695 as_bad_where (fragP->fr_file, fragP->fr_line,
1696 _("invalid single nop size: %d "
1697 "(expect within [0, %d])"),
1698 limit, max_single_nop_size);
1699 return;
1700 }
1701 }
1702 else if (fragP->fr_type != rs_machine_dependent)
1703 fragP->fr_var = count;
1704
1705 if ((count / max_single_nop_size) > max_number_of_nops)
1706 {
1707 /* Generate jump over NOPs. */
1708 offsetT disp = count - 2;
1709 if (fits_in_imm7 (disp))
1710 {
1711 /* Use "jmp disp8" if possible. */
1712 count = disp;
1713 where[0] = jump_disp8[0];
1714 where[1] = count;
1715 where += 2;
1716 }
1717 else
1718 {
1719 unsigned int size_of_jump;
1720
1721 if (flag_code == CODE_16BIT)
1722 {
1723 where[0] = jump16_disp32[0];
1724 where[1] = jump16_disp32[1];
1725 size_of_jump = 2;
1726 }
1727 else
1728 {
1729 where[0] = jump32_disp32[0];
1730 size_of_jump = 1;
1731 }
1732
1733 count -= size_of_jump + 4;
1734 if (!fits_in_imm31 (count))
1735 {
1736 as_bad_where (fragP->fr_file, fragP->fr_line,
1737 _("jump over nop padding out of range"));
1738 return;
1739 }
1740
1741 md_number_to_chars (where + size_of_jump, count, 4);
1742 where += size_of_jump + 4;
1743 }
1744 }
1745
1746 /* Generate multiple NOPs. */
1747 i386_output_nops (where, patt, count, limit);
1748 }
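/* Worked example of the jump-over-NOPs path above, assuming 32-bit code
   and a requested padding of 100 bytes that exceeds max_number_of_nops
   single NOPs: disp = 100 - 2 = 98 fits in imm7, so a short jump (the
   jump_disp8 opcode, 0xEB) is emitted first:

       EB 62                    jmp  .+0x62  (over the padding)
       <98 bytes of NOPs>

   Execution skips the padding with one cheap branch instead of stepping
   through dozens of NOPs; displacements beyond 127 fall back to the
   rel32 jump form handled in the else branch.  */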
1749
1750 static INLINE int
1751 operand_type_all_zero (const union i386_operand_type *x)
1752 {
1753 switch (ARRAY_SIZE(x->array))
1754 {
1755 case 3:
1756 if (x->array[2])
1757 return 0;
1758 /* Fall through. */
1759 case 2:
1760 if (x->array[1])
1761 return 0;
1762 /* Fall through. */
1763 case 1:
1764 return !x->array[0];
1765 default:
1766 abort ();
1767 }
1768 }
1769
1770 static INLINE void
1771 operand_type_set (union i386_operand_type *x, unsigned int v)
1772 {
1773 switch (ARRAY_SIZE(x->array))
1774 {
1775 case 3:
1776 x->array[2] = v;
1777 /* Fall through. */
1778 case 2:
1779 x->array[1] = v;
1780 /* Fall through. */
1781 case 1:
1782 x->array[0] = v;
1784 break;
1785 default:
1786 abort ();
1787 }
1788
1789 x->bitfield.class = ClassNone;
1790 x->bitfield.instance = InstanceNone;
1791 }
1792
1793 static INLINE int
1794 operand_type_equal (const union i386_operand_type *x,
1795 const union i386_operand_type *y)
1796 {
1797 switch (ARRAY_SIZE(x->array))
1798 {
1799 case 3:
1800 if (x->array[2] != y->array[2])
1801 return 0;
1802 /* Fall through. */
1803 case 2:
1804 if (x->array[1] != y->array[1])
1805 return 0;
1806 /* Fall through. */
1807 case 1:
1808 return x->array[0] == y->array[0];
1810 default:
1811 abort ();
1812 }
1813 }
1814
1815 static INLINE int
1816 cpu_flags_all_zero (const union i386_cpu_flags *x)
1817 {
1818 switch (ARRAY_SIZE(x->array))
1819 {
1820 case 4:
1821 if (x->array[3])
1822 return 0;
1823 /* Fall through. */
1824 case 3:
1825 if (x->array[2])
1826 return 0;
1827 /* Fall through. */
1828 case 2:
1829 if (x->array[1])
1830 return 0;
1831 /* Fall through. */
1832 case 1:
1833 return !x->array[0];
1834 default:
1835 abort ();
1836 }
1837 }
1838
1839 static INLINE int
1840 cpu_flags_equal (const union i386_cpu_flags *x,
1841 const union i386_cpu_flags *y)
1842 {
1843 switch (ARRAY_SIZE(x->array))
1844 {
1845 case 4:
1846 if (x->array[3] != y->array[3])
1847 return 0;
1848 /* Fall through. */
1849 case 3:
1850 if (x->array[2] != y->array[2])
1851 return 0;
1852 /* Fall through. */
1853 case 2:
1854 if (x->array[1] != y->array[1])
1855 return 0;
1856 /* Fall through. */
1857 case 1:
1858 return x->array[0] == y->array[0];
1860 default:
1861 abort ();
1862 }
1863 }
1864
1865 static INLINE int
1866 cpu_flags_check_cpu64 (i386_cpu_flags f)
1867 {
1868 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1869 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1870 }
1871
1872 static INLINE i386_cpu_flags
1873 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1874 {
1875 switch (ARRAY_SIZE (x.array))
1876 {
1877 case 4:
1878 x.array [3] &= y.array [3];
1879 /* Fall through. */
1880 case 3:
1881 x.array [2] &= y.array [2];
1882 /* Fall through. */
1883 case 2:
1884 x.array [1] &= y.array [1];
1885 /* Fall through. */
1886 case 1:
1887 x.array [0] &= y.array [0];
1888 break;
1889 default:
1890 abort ();
1891 }
1892 return x;
1893 }
1894
1895 static INLINE i386_cpu_flags
1896 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1897 {
1898 switch (ARRAY_SIZE (x.array))
1899 {
1900 case 4:
1901 x.array [3] |= y.array [3];
1902 /* Fall through. */
1903 case 3:
1904 x.array [2] |= y.array [2];
1905 /* Fall through. */
1906 case 2:
1907 x.array [1] |= y.array [1];
1908 /* Fall through. */
1909 case 1:
1910 x.array [0] |= y.array [0];
1911 break;
1912 default:
1913 abort ();
1914 }
1915 return x;
1916 }
1917
1918 static INLINE i386_cpu_flags
1919 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1920 {
1921 switch (ARRAY_SIZE (x.array))
1922 {
1923 case 4:
1924 x.array [3] &= ~y.array [3];
1925 /* Fall through. */
1926 case 3:
1927 x.array [2] &= ~y.array [2];
1928 /* Fall through. */
1929 case 2:
1930 x.array [1] &= ~y.array [1];
1931 /* Fall through. */
1932 case 1:
1933 x.array [0] &= ~y.array [0];
1934 break;
1935 default:
1936 abort ();
1937 }
1938 return x;
1939 }
1940
1941 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
1942
1943 #define CPU_FLAGS_ARCH_MATCH 0x1
1944 #define CPU_FLAGS_64BIT_MATCH 0x2
1945
1946 #define CPU_FLAGS_PERFECT_MATCH \
1947 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1948
1949 /* Return CPU flags match bits. */
1950
1951 static int
1952 cpu_flags_match (const insn_template *t)
1953 {
1954 i386_cpu_flags x = t->cpu_flags;
1955 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1956
1957 x.bitfield.cpu64 = 0;
1958 x.bitfield.cpuno64 = 0;
1959
1960 if (cpu_flags_all_zero (&x))
1961 {
1962 /* This instruction is available on all archs. */
1963 match |= CPU_FLAGS_ARCH_MATCH;
1964 }
1965 else
1966 {
1967 /* This instruction is available only on some archs. */
1968 i386_cpu_flags cpu = cpu_arch_flags;
1969
1970 /* AVX512VL is not a standalone feature - match it and then strip it. */
1971 if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1972 return match;
1973 x.bitfield.cpuavx512vl = 0;
1974
1975 cpu = cpu_flags_and (x, cpu);
1976 if (!cpu_flags_all_zero (&cpu))
1977 {
1978 if (x.bitfield.cpuavx)
1979 {
1980 /* We need to check a few extra flags with AVX. */
1981 if (cpu.bitfield.cpuavx
1982 && (!t->opcode_modifier.sse2avx
1983 || (sse2avx && !i.prefix[DATA_PREFIX]))
1984 && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1985 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1986 && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1987 match |= CPU_FLAGS_ARCH_MATCH;
1988 }
1989 else if (x.bitfield.cpuavx512f)
1990 {
1991 /* We need to check a few extra flags with AVX512F. */
1992 if (cpu.bitfield.cpuavx512f
1993 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1994 && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1995 && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1996 match |= CPU_FLAGS_ARCH_MATCH;
1997 }
1998 else
1999 match |= CPU_FLAGS_ARCH_MATCH;
2000 }
2001 }
2002 return match;
2003 }
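/* Example of the match bits, assuming a template whose only CPU flag
   requirement is CpuNo64 (a 32-bit-only instruction): in 64-bit mode
   cpu_flags_check_cpu64 fails, so CPU_FLAGS_64BIT_MATCH stays clear,
   while stripping cpu64/cpuno64 leaves no further requirements and
   CPU_FLAGS_ARCH_MATCH is still set.  Only a template yielding
   CPU_FLAGS_PERFECT_MATCH (both bits) is usable as-is.  */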
2004
2005 static INLINE i386_operand_type
2006 operand_type_and (i386_operand_type x, i386_operand_type y)
2007 {
2008 if (x.bitfield.class != y.bitfield.class)
2009 x.bitfield.class = ClassNone;
2010 if (x.bitfield.instance != y.bitfield.instance)
2011 x.bitfield.instance = InstanceNone;
2012
2013 switch (ARRAY_SIZE (x.array))
2014 {
2015 case 3:
2016 x.array [2] &= y.array [2];
2017 /* Fall through. */
2018 case 2:
2019 x.array [1] &= y.array [1];
2020 /* Fall through. */
2021 case 1:
2022 x.array [0] &= y.array [0];
2023 break;
2024 default:
2025 abort ();
2026 }
2027 return x;
2028 }
2029
2030 static INLINE i386_operand_type
2031 operand_type_and_not (i386_operand_type x, i386_operand_type y)
2032 {
2033 gas_assert (y.bitfield.class == ClassNone);
2034 gas_assert (y.bitfield.instance == InstanceNone);
2035
2036 switch (ARRAY_SIZE (x.array))
2037 {
2038 case 3:
2039 x.array [2] &= ~y.array [2];
2040 /* Fall through. */
2041 case 2:
2042 x.array [1] &= ~y.array [1];
2043 /* Fall through. */
2044 case 1:
2045 x.array [0] &= ~y.array [0];
2046 break;
2047 default:
2048 abort ();
2049 }
2050 return x;
2051 }
2052
2053 static INLINE i386_operand_type
2054 operand_type_or (i386_operand_type x, i386_operand_type y)
2055 {
2056 gas_assert (x.bitfield.class == ClassNone ||
2057 y.bitfield.class == ClassNone ||
2058 x.bitfield.class == y.bitfield.class);
2059 gas_assert (x.bitfield.instance == InstanceNone ||
2060 y.bitfield.instance == InstanceNone ||
2061 x.bitfield.instance == y.bitfield.instance);
2062
2063 switch (ARRAY_SIZE (x.array))
2064 {
2065 case 3:
2066 x.array [2] |= y.array [2];
2067 /* Fall through. */
2068 case 2:
2069 x.array [1] |= y.array [1];
2070 /* Fall through. */
2071 case 1:
2072 x.array [0] |= y.array [0];
2073 break;
2074 default:
2075 abort ();
2076 }
2077 return x;
2078 }
2079
2080 static INLINE i386_operand_type
2081 operand_type_xor (i386_operand_type x, i386_operand_type y)
2082 {
2083 gas_assert (y.bitfield.class == ClassNone);
2084 gas_assert (y.bitfield.instance == InstanceNone);
2085
2086 switch (ARRAY_SIZE (x.array))
2087 {
2088 case 3:
2089 x.array [2] ^= y.array [2];
2090 /* Fall through. */
2091 case 2:
2092 x.array [1] ^= y.array [1];
2093 /* Fall through. */
2094 case 1:
2095 x.array [0] ^= y.array [0];
2096 break;
2097 default:
2098 abort ();
2099 }
2100 return x;
2101 }
2102
2103 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
2104 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
2105 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
2106 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
2107 static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
2108 static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
2109 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
2110 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
2111 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
2112 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
2113 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
2114 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
2115 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
2116 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
2117 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
2118 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
2119 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
2120
2121 enum operand_type
2122 {
2123 reg,
2124 imm,
2125 disp,
2126 anymem
2127 };
2128
2129 static INLINE int
2130 operand_type_check (i386_operand_type t, enum operand_type c)
2131 {
2132 switch (c)
2133 {
2134 case reg:
2135 return t.bitfield.class == Reg;
2136
2137 case imm:
2138 return (t.bitfield.imm8
2139 || t.bitfield.imm8s
2140 || t.bitfield.imm16
2141 || t.bitfield.imm32
2142 || t.bitfield.imm32s
2143 || t.bitfield.imm64);
2144
2145 case disp:
2146 return (t.bitfield.disp8
2147 || t.bitfield.disp16
2148 || t.bitfield.disp32
2149 || t.bitfield.disp32s
2150 || t.bitfield.disp64);
2151
2152 case anymem:
2153 return (t.bitfield.disp8
2154 || t.bitfield.disp16
2155 || t.bitfield.disp32
2156 || t.bitfield.disp32s
2157 || t.bitfield.disp64
2158 || t.bitfield.baseindex);
2159
2160 default:
2161 abort ();
2162 }
2163
2164 return 0;
2165 }
2166
2167 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2168 between operand GIVEN and operand WANTED for instruction template T. */
2169
2170 static INLINE int
2171 match_operand_size (const insn_template *t, unsigned int wanted,
2172 unsigned int given)
2173 {
2174 return !((i.types[given].bitfield.byte
2175 && !t->operand_types[wanted].bitfield.byte)
2176 || (i.types[given].bitfield.word
2177 && !t->operand_types[wanted].bitfield.word)
2178 || (i.types[given].bitfield.dword
2179 && !t->operand_types[wanted].bitfield.dword)
2180 || (i.types[given].bitfield.qword
2181 && !t->operand_types[wanted].bitfield.qword)
2182 || (i.types[given].bitfield.tbyte
2183 && !t->operand_types[wanted].bitfield.tbyte));
2184 }
2185
2186 /* Return 1 if there is no conflict in SIMD register between operand
2187 GIVEN and operand WANTED for instruction template T. */
2188
2189 static INLINE int
2190 match_simd_size (const insn_template *t, unsigned int wanted,
2191 unsigned int given)
2192 {
2193 return !((i.types[given].bitfield.xmmword
2194 && !t->operand_types[wanted].bitfield.xmmword)
2195 || (i.types[given].bitfield.ymmword
2196 && !t->operand_types[wanted].bitfield.ymmword)
2197 || (i.types[given].bitfield.zmmword
2198 && !t->operand_types[wanted].bitfield.zmmword)
2199 || (i.types[given].bitfield.tmmword
2200 && !t->operand_types[wanted].bitfield.tmmword));
2201 }
2202
2203 /* Return 1 if there is no conflict in any size between operand GIVEN
2204 and operand WANTED for instruction template T. */
2205
2206 static INLINE int
2207 match_mem_size (const insn_template *t, unsigned int wanted,
2208 unsigned int given)
2209 {
2210 return (match_operand_size (t, wanted, given)
2211 && !((i.types[given].bitfield.unspecified
2212 && !i.broadcast
2213 && !t->operand_types[wanted].bitfield.unspecified)
2214 || (i.types[given].bitfield.fword
2215 && !t->operand_types[wanted].bitfield.fword)
2216 /* For scalar opcode templates to allow register and memory
2217 operands at the same time, some special casing is needed
2218 here. Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2219 down-conversion vpmov*. */
2220 || ((t->operand_types[wanted].bitfield.class == RegSIMD
2221 && t->operand_types[wanted].bitfield.byte
2222 + t->operand_types[wanted].bitfield.word
2223 + t->operand_types[wanted].bitfield.dword
2224 + t->operand_types[wanted].bitfield.qword
2225 > !!t->opcode_modifier.broadcast)
2226 ? (i.types[given].bitfield.xmmword
2227 || i.types[given].bitfield.ymmword
2228 || i.types[given].bitfield.zmmword)
2229 : !match_simd_size (t, wanted, given))));
2230 }
2231
2232 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2233 operands for instruction template T, and it has MATCH_REVERSE set if there
2234 is no size conflict on any operands for the template with operands reversed
2235 (and the template allows for reversing in the first place). */
2236
2237 #define MATCH_STRAIGHT 1
2238 #define MATCH_REVERSE 2
2239
2240 static INLINE unsigned int
2241 operand_size_match (const insn_template *t)
2242 {
2243 unsigned int j, match = MATCH_STRAIGHT;
2244
2245 /* Don't check non-absolute jump instructions. */
2246 if (t->opcode_modifier.jump
2247 && t->opcode_modifier.jump != JUMP_ABSOLUTE)
2248 return match;
2249
2250 /* Check memory and accumulator operand size. */
2251 for (j = 0; j < i.operands; j++)
2252 {
2253 if (i.types[j].bitfield.class != Reg
2254 && i.types[j].bitfield.class != RegSIMD
2255 && t->opcode_modifier.anysize)
2256 continue;
2257
2258 if (t->operand_types[j].bitfield.class == Reg
2259 && !match_operand_size (t, j, j))
2260 {
2261 match = 0;
2262 break;
2263 }
2264
2265 if (t->operand_types[j].bitfield.class == RegSIMD
2266 && !match_simd_size (t, j, j))
2267 {
2268 match = 0;
2269 break;
2270 }
2271
2272 if (t->operand_types[j].bitfield.instance == Accum
2273 && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2274 {
2275 match = 0;
2276 break;
2277 }
2278
2279 if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2280 {
2281 match = 0;
2282 break;
2283 }
2284 }
2285
2286 if (!t->opcode_modifier.d)
2287 {
2288 mismatch:
2289 if (!match)
2290 i.error = operand_size_mismatch;
2291 return match;
2292 }
2293
2294 /* Check reverse. */
2295 gas_assert (i.operands >= 2 && i.operands <= 3);
2296
2297 for (j = 0; j < i.operands; j++)
2298 {
2299 unsigned int given = i.operands - j - 1;
2300
2301 if (t->operand_types[j].bitfield.class == Reg
2302 && !match_operand_size (t, j, given))
2303 goto mismatch;
2304
2305 if (t->operand_types[j].bitfield.class == RegSIMD
2306 && !match_simd_size (t, j, given))
2307 goto mismatch;
2308
2309 if (t->operand_types[j].bitfield.instance == Accum
2310 && (!match_operand_size (t, j, given)
2311 || !match_simd_size (t, j, given)))
2312 goto mismatch;
2313
2314 if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2315 goto mismatch;
2316 }
2317
2318 return match | MATCH_REVERSE;
2319 }
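/* Example return values: a straight size match on all operands gives
   MATCH_STRAIGHT (1); if the template additionally has the D modifier
   and the operands also fit with the GIVEN indices reversed, the result
   is MATCH_STRAIGHT | MATCH_REVERSE (3), letting the caller pick the
   direction that encodes.  */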
2320
2321 static INLINE int
2322 operand_type_match (i386_operand_type overlap,
2323 i386_operand_type given)
2324 {
2325 i386_operand_type temp = overlap;
2326
2327 temp.bitfield.unspecified = 0;
2328 temp.bitfield.byte = 0;
2329 temp.bitfield.word = 0;
2330 temp.bitfield.dword = 0;
2331 temp.bitfield.fword = 0;
2332 temp.bitfield.qword = 0;
2333 temp.bitfield.tbyte = 0;
2334 temp.bitfield.xmmword = 0;
2335 temp.bitfield.ymmword = 0;
2336 temp.bitfield.zmmword = 0;
2337 temp.bitfield.tmmword = 0;
2338 if (operand_type_all_zero (&temp))
2339 goto mismatch;
2340
2341 if (given.bitfield.baseindex == overlap.bitfield.baseindex)
2342 return 1;
2343
2344 mismatch:
2345 i.error = operand_type_mismatch;
2346 return 0;
2347 }
2348
2349 /* If the given types G0 and G1 are registers, they must be of the same
2350 type unless the expected operand-type register overlap is null.
2351 Some Intel-syntax memory operand size checking also happens here. */
2352
2353 static INLINE int
2354 operand_type_register_match (i386_operand_type g0,
2355 i386_operand_type t0,
2356 i386_operand_type g1,
2357 i386_operand_type t1)
2358 {
2359 if (g0.bitfield.class != Reg
2360 && g0.bitfield.class != RegSIMD
2361 && (!operand_type_check (g0, anymem)
2362 || g0.bitfield.unspecified
2363 || (t0.bitfield.class != Reg
2364 && t0.bitfield.class != RegSIMD)))
2365 return 1;
2366
2367 if (g1.bitfield.class != Reg
2368 && g1.bitfield.class != RegSIMD
2369 && (!operand_type_check (g1, anymem)
2370 || g1.bitfield.unspecified
2371 || (t1.bitfield.class != Reg
2372 && t1.bitfield.class != RegSIMD)))
2373 return 1;
2374
2375 if (g0.bitfield.byte == g1.bitfield.byte
2376 && g0.bitfield.word == g1.bitfield.word
2377 && g0.bitfield.dword == g1.bitfield.dword
2378 && g0.bitfield.qword == g1.bitfield.qword
2379 && g0.bitfield.xmmword == g1.bitfield.xmmword
2380 && g0.bitfield.ymmword == g1.bitfield.ymmword
2381 && g0.bitfield.zmmword == g1.bitfield.zmmword)
2382 return 1;
2383
2384 if (!(t0.bitfield.byte & t1.bitfield.byte)
2385 && !(t0.bitfield.word & t1.bitfield.word)
2386 && !(t0.bitfield.dword & t1.bitfield.dword)
2387 && !(t0.bitfield.qword & t1.bitfield.qword)
2388 && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2389 && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2390 && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2391 return 1;
2392
2393 i.error = register_type_mismatch;
2394
2395 return 0;
2396 }
2397
2398 static INLINE unsigned int
2399 register_number (const reg_entry *r)
2400 {
2401 unsigned int nr = r->reg_num;
2402
2403 if (r->reg_flags & RegRex)
2404 nr += 8;
2405
2406 if (r->reg_flags & RegVRex)
2407 nr += 16;
2408
2409 return nr;
2410 }
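/* Example, assuming the usual register table layout: %r9 is entry 1
   with RegRex set, so register_number () yields 1 + 8 = 9; %xmm20 is
   entry 4 with RegVRex set, yielding 4 + 16 = 20.  */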
2411
2412 static INLINE unsigned int
2413 mode_from_disp_size (i386_operand_type t)
2414 {
2415 if (t.bitfield.disp8)
2416 return 1;
2417 else if (t.bitfield.disp16
2418 || t.bitfield.disp32
2419 || t.bitfield.disp32s)
2420 return 2;
2421 else
2422 return 0;
2423 }
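/* The values returned above correspond directly to the ModRM.mod field
   for memory operands: 1 selects the disp8 form (mod == 01b) and 2 the
   disp16/disp32 form (mod == 10b); 0 means no displacement byte.  */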
2424
2425 static INLINE int
2426 fits_in_signed_byte (addressT num)
2427 {
2428 return num + 0x80 <= 0xff;
2429 }
2430
2431 static INLINE int
2432 fits_in_unsigned_byte (addressT num)
2433 {
2434 return num <= 0xff;
2435 }
2436
2437 static INLINE int
2438 fits_in_unsigned_word (addressT num)
2439 {
2440 return num <= 0xffff;
2441 }
2442
2443 static INLINE int
2444 fits_in_signed_word (addressT num)
2445 {
2446 return num + 0x8000 <= 0xffff;
2447 }
2448
2449 static INLINE int
2450 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2451 {
2452 #ifndef BFD64
2453 return 1;
2454 #else
2455 return num + 0x80000000 <= 0xffffffff;
2456 #endif
2457 } /* fits_in_signed_long() */
2458
2459 static INLINE int
2460 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2461 {
2462 #ifndef BFD64
2463 return 1;
2464 #else
2465 return num <= 0xffffffff;
2466 #endif
2467 } /* fits_in_unsigned_long() */
2468
2469 static INLINE int
2470 fits_in_disp8 (offsetT num)
2471 {
2472 int shift = i.memshift;
2473 unsigned int mask;
2474
2475 if (shift == -1)
2476 abort ();
2477
2478 mask = (1 << shift) - 1;
2479
2480 /* Return 0 if NUM isn't properly aligned. */
2481 if ((num & mask))
2482 return 0;
2483
2484 /* Check if NUM will fit in 8bit after shift. */
2485 return fits_in_signed_byte (num >> shift);
2486 }
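/* Worked EVEX disp8*N example: i.memshift is 6 for a full 64-byte (zmm)
   memory operand, so a displacement of 256 is aligned (256 & 63 == 0)
   and 256 >> 6 == 4 fits in a signed byte -- the instruction can use a
   one-byte displacement of 4 instead of a four-byte displacement of
   256.  A displacement of 260 fails the alignment test and must use
   the disp32 form.  */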
2487
2488 static INLINE int
2489 fits_in_imm4 (offsetT num)
2490 {
2491 return (num & 0xf) == num;
2492 }
2493
2494 static i386_operand_type
2495 smallest_imm_type (offsetT num)
2496 {
2497 i386_operand_type t;
2498
2499 operand_type_set (&t, 0);
2500 t.bitfield.imm64 = 1;
2501
2502 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2503 {
2504 /* This code is disabled on the 486 because all the Imm1 forms
2505 in the opcode table are slower on the i486. They're the
2506 versions with the implicitly specified single-position
2507 displacement, which has another syntax if you really want to
2508 use that form. */
2509 t.bitfield.imm1 = 1;
2510 t.bitfield.imm8 = 1;
2511 t.bitfield.imm8s = 1;
2512 t.bitfield.imm16 = 1;
2513 t.bitfield.imm32 = 1;
2514 t.bitfield.imm32s = 1;
2515 }
2516 else if (fits_in_signed_byte (num))
2517 {
2518 t.bitfield.imm8 = 1;
2519 t.bitfield.imm8s = 1;
2520 t.bitfield.imm16 = 1;
2521 t.bitfield.imm32 = 1;
2522 t.bitfield.imm32s = 1;
2523 }
2524 else if (fits_in_unsigned_byte (num))
2525 {
2526 t.bitfield.imm8 = 1;
2527 t.bitfield.imm16 = 1;
2528 t.bitfield.imm32 = 1;
2529 t.bitfield.imm32s = 1;
2530 }
2531 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2532 {
2533 t.bitfield.imm16 = 1;
2534 t.bitfield.imm32 = 1;
2535 t.bitfield.imm32s = 1;
2536 }
2537 else if (fits_in_signed_long (num))
2538 {
2539 t.bitfield.imm32 = 1;
2540 t.bitfield.imm32s = 1;
2541 }
2542 else if (fits_in_unsigned_long (num))
2543 t.bitfield.imm32 = 1;
2544
2545 return t;
2546 }
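/* Example: for num == 0x90 only fits_in_unsigned_byte () holds among
   the byte checks, so the result allows imm8/imm16/imm32/imm32s but not
   imm8s; for num == 1 (when not tuning for the i486) imm1 is allowed as
   well, enabling the shorter shift-by-one encodings.  */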
2547
2548 static offsetT
2549 offset_in_range (offsetT val, int size)
2550 {
2551 addressT mask;
2552
2553 switch (size)
2554 {
2555 case 1: mask = ((addressT) 1 << 8) - 1; break;
2556 case 2: mask = ((addressT) 1 << 16) - 1; break;
2557 case 4: mask = ((addressT) 2 << 31) - 1; break;
2558 #ifdef BFD64
2559 case 8: mask = ((addressT) 2 << 63) - 1; break;
2560 #endif
2561 default: abort ();
2562 }
2563
2564 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2565 {
2566 char buf1[40], buf2[40];
2567
2568 sprint_value (buf1, val);
2569 sprint_value (buf2, val & mask);
2570 as_warn (_("%s shortened to %s"), buf1, buf2);
2571 }
2572 return val & mask;
2573 }
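/* Example, assuming a 64-bit (BFD64) build: offset_in_range
   (0x123456789, 4) masks with 0xffffffff, and since the discarded bits
   are neither all zero nor all one it warns that the value was
   shortened, returning 0x23456789.  Negative values such as -1 pass
   unflagged because the discarded bits are all one.  */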
2574
2575 enum PREFIX_GROUP
2576 {
2577 PREFIX_EXIST = 0,
2578 PREFIX_LOCK,
2579 PREFIX_REP,
2580 PREFIX_DS,
2581 PREFIX_OTHER
2582 };
2583
2584 /* Returns
2585 a. PREFIX_EXIST if attempting to add a prefix where one from the
2586 same class already exists.
2587 b. PREFIX_LOCK if lock prefix is added.
2588 c. PREFIX_REP if rep/repne prefix is added.
2589 d. PREFIX_DS if ds prefix is added.
2590 e. PREFIX_OTHER if other prefix is added.
2591 */
2592
2593 static enum PREFIX_GROUP
2594 add_prefix (unsigned int prefix)
2595 {
2596 enum PREFIX_GROUP ret = PREFIX_OTHER;
2597 unsigned int q;
2598
2599 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2600 && flag_code == CODE_64BIT)
2601 {
2602 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2603 || (i.prefix[REX_PREFIX] & prefix & REX_R)
2604 || (i.prefix[REX_PREFIX] & prefix & REX_X)
2605 || (i.prefix[REX_PREFIX] & prefix & REX_B))
2606 ret = PREFIX_EXIST;
2607 q = REX_PREFIX;
2608 }
2609 else
2610 {
2611 switch (prefix)
2612 {
2613 default:
2614 abort ();
2615
2616 case DS_PREFIX_OPCODE:
2617 ret = PREFIX_DS;
2618 /* Fall through. */
2619 case CS_PREFIX_OPCODE:
2620 case ES_PREFIX_OPCODE:
2621 case FS_PREFIX_OPCODE:
2622 case GS_PREFIX_OPCODE:
2623 case SS_PREFIX_OPCODE:
2624 q = SEG_PREFIX;
2625 break;
2626
2627 case REPNE_PREFIX_OPCODE:
2628 case REPE_PREFIX_OPCODE:
2629 q = REP_PREFIX;
2630 ret = PREFIX_REP;
2631 break;
2632
2633 case LOCK_PREFIX_OPCODE:
2634 q = LOCK_PREFIX;
2635 ret = PREFIX_LOCK;
2636 break;
2637
2638 case FWAIT_OPCODE:
2639 q = WAIT_PREFIX;
2640 break;
2641
2642 case ADDR_PREFIX_OPCODE:
2643 q = ADDR_PREFIX;
2644 break;
2645
2646 case DATA_PREFIX_OPCODE:
2647 q = DATA_PREFIX;
2648 break;
2649 }
2650 if (i.prefix[q] != 0)
2651 ret = PREFIX_EXIST;
2652 }
2653
2654 if (ret)
2655 {
2656 if (!i.prefix[q])
2657 ++i.prefixes;
2658 i.prefix[q] |= prefix;
2659 }
2660 else
2661 as_bad (_("same type of prefix used twice"));
2662
2663 return ret;
2664 }
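/* Usage sketch: add_prefix (LOCK_PREFIX_OPCODE) records 0xf0 in
   i.prefix[LOCK_PREFIX], bumps i.prefixes and returns PREFIX_LOCK;
   a second identical call finds the slot occupied, diagnoses
   "same type of prefix used twice" and returns PREFIX_EXIST.  */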
2665
2666 static void
2667 update_code_flag (int value, int check)
2668 {
2669 PRINTF_LIKE ((*as_error));
2670
2671 flag_code = (enum flag_code) value;
2672 if (flag_code == CODE_64BIT)
2673 {
2674 cpu_arch_flags.bitfield.cpu64 = 1;
2675 cpu_arch_flags.bitfield.cpuno64 = 0;
2676 }
2677 else
2678 {
2679 cpu_arch_flags.bitfield.cpu64 = 0;
2680 cpu_arch_flags.bitfield.cpuno64 = 1;
2681 }
2682 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm)
2683 {
2684 if (check)
2685 as_error = as_fatal;
2686 else
2687 as_error = as_bad;
2688 (*as_error) (_("64bit mode not supported on `%s'."),
2689 cpu_arch_name ? cpu_arch_name : default_arch);
2690 }
2691 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2692 {
2693 if (check)
2694 as_error = as_fatal;
2695 else
2696 as_error = as_bad;
2697 (*as_error) (_("32bit mode not supported on `%s'."),
2698 cpu_arch_name ? cpu_arch_name : default_arch);
2699 }
2700 stackop_size = '\0';
2701 }
2702
2703 static void
2704 set_code_flag (int value)
2705 {
2706 update_code_flag (value, 0);
2707 }
2708
2709 static void
2710 set_16bit_gcc_code_flag (int new_code_flag)
2711 {
2712 flag_code = (enum flag_code) new_code_flag;
2713 if (flag_code != CODE_16BIT)
2714 abort ();
2715 cpu_arch_flags.bitfield.cpu64 = 0;
2716 cpu_arch_flags.bitfield.cpuno64 = 1;
2717 stackop_size = LONG_MNEM_SUFFIX;
2718 }
2719
2720 static void
2721 set_intel_syntax (int syntax_flag)
2722 {
2723 /* Find out if register prefixing is specified. */
2724 int ask_naked_reg = 0;
2725
2726 SKIP_WHITESPACE ();
2727 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2728 {
2729 char *string;
2730 int e = get_symbol_name (&string);
2731
2732 if (strcmp (string, "prefix") == 0)
2733 ask_naked_reg = 1;
2734 else if (strcmp (string, "noprefix") == 0)
2735 ask_naked_reg = -1;
2736 else
2737 as_bad (_("bad argument to syntax directive."));
2738 (void) restore_line_pointer (e);
2739 }
2740 demand_empty_rest_of_line ();
2741
2742 intel_syntax = syntax_flag;
2743
2744 if (ask_naked_reg == 0)
2745 allow_naked_reg = (intel_syntax
2746 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2747 else
2748 allow_naked_reg = (ask_naked_reg < 0);
2749
2750 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2751
2752 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2753 identifier_chars['$'] = intel_syntax ? '$' : 0;
2754 register_prefix = allow_naked_reg ? "" : "%";
2755 }
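/* E.g. ".intel_syntax noprefix" lands here with syntax_flag == 1 and
   the argument "noprefix", so ask_naked_reg becomes -1 and registers
   may then be written without the '%' prefix.  */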
2756
2757 static void
2758 set_intel_mnemonic (int mnemonic_flag)
2759 {
2760 intel_mnemonic = mnemonic_flag;
2761 }
2762
2763 static void
2764 set_allow_index_reg (int flag)
2765 {
2766 allow_index_reg = flag;
2767 }
2768
2769 static void
2770 set_check (int what)
2771 {
2772 enum check_kind *kind;
2773 const char *str;
2774
2775 if (what)
2776 {
2777 kind = &operand_check;
2778 str = "operand";
2779 }
2780 else
2781 {
2782 kind = &sse_check;
2783 str = "sse";
2784 }
2785
2786 SKIP_WHITESPACE ();
2787
2788 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2789 {
2790 char *string;
2791 int e = get_symbol_name (&string);
2792
2793 if (strcmp (string, "none") == 0)
2794 *kind = check_none;
2795 else if (strcmp (string, "warning") == 0)
2796 *kind = check_warning;
2797 else if (strcmp (string, "error") == 0)
2798 *kind = check_error;
2799 else
2800 as_bad (_("bad argument to %s_check directive."), str);
2801 (void) restore_line_pointer (e);
2802 }
2803 else
2804 as_bad (_("missing argument for %s_check directive"), str);
2805
2806 demand_empty_rest_of_line ();
2807 }
2808
2809 static void
2810 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2811 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2812 {
2813 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2814 static const char *arch;
2815
2816 /* Intel MCU, L1OM and K1OM are only supported on ELF. */
2817 if (!IS_ELF)
2818 return;
2819
2820 if (!arch)
2821 {
2822 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2823 use default_arch. */
2824 arch = cpu_arch_name;
2825 if (!arch)
2826 arch = default_arch;
2827 }
2828
2829 /* If we are targeting Intel MCU, we must enable it. */
2830 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2831 || new_flag.bitfield.cpuiamcu)
2832 return;
2833
2834 /* If we are targeting Intel L1OM, we must enable it. */
2835 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2836 || new_flag.bitfield.cpul1om)
2837 return;
2838
2839 /* If we are targeting Intel K1OM, we must enable it. */
2840 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2841 || new_flag.bitfield.cpuk1om)
2842 return;
2843
2844 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2845 #endif
2846 }
2847
2848 static void
2849 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2850 {
2851 SKIP_WHITESPACE ();
2852
2853 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2854 {
2855 char *string;
2856 int e = get_symbol_name (&string);
2857 unsigned int j;
2858 i386_cpu_flags flags;
2859
2860 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2861 {
2862 if (strcmp (string, cpu_arch[j].name) == 0)
2863 {
2864 check_cpu_arch_compatible (string, cpu_arch[j].flags);
2865
2866 if (*string != '.')
2867 {
2868 cpu_arch_name = cpu_arch[j].name;
2869 cpu_sub_arch_name = NULL;
2870 cpu_arch_flags = cpu_arch[j].flags;
2871 if (flag_code == CODE_64BIT)
2872 {
2873 cpu_arch_flags.bitfield.cpu64 = 1;
2874 cpu_arch_flags.bitfield.cpuno64 = 0;
2875 }
2876 else
2877 {
2878 cpu_arch_flags.bitfield.cpu64 = 0;
2879 cpu_arch_flags.bitfield.cpuno64 = 1;
2880 }
2881 cpu_arch_isa = cpu_arch[j].type;
2882 cpu_arch_isa_flags = cpu_arch[j].flags;
2883 if (!cpu_arch_tune_set)
2884 {
2885 cpu_arch_tune = cpu_arch_isa;
2886 cpu_arch_tune_flags = cpu_arch_isa_flags;
2887 }
2888 break;
2889 }
2890
2891 flags = cpu_flags_or (cpu_arch_flags,
2892 cpu_arch[j].flags);
2893
2894 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2895 {
2896 if (cpu_sub_arch_name)
2897 {
2898 char *name = cpu_sub_arch_name;
2899 cpu_sub_arch_name = concat (name,
2900 cpu_arch[j].name,
2901 (const char *) NULL);
2902 free (name);
2903 }
2904 else
2905 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2906 cpu_arch_flags = flags;
2907 cpu_arch_isa_flags = flags;
2908 }
2909 else
2910 cpu_arch_isa_flags
2911 = cpu_flags_or (cpu_arch_isa_flags,
2912 cpu_arch[j].flags);
2913 (void) restore_line_pointer (e);
2914 demand_empty_rest_of_line ();
2915 return;
2916 }
2917 }
2918
2919 if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2920 {
2921 /* Disable an ISA extension. */
2922 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2923 if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2924 {
2925 flags = cpu_flags_and_not (cpu_arch_flags,
2926 cpu_noarch[j].flags);
2927 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2928 {
2929 if (cpu_sub_arch_name)
2930 {
2931 char *name = cpu_sub_arch_name;
2932 cpu_sub_arch_name = concat (name, string,
2933 (const char *) NULL);
2934 free (name);
2935 }
2936 else
2937 cpu_sub_arch_name = xstrdup (string);
2938 cpu_arch_flags = flags;
2939 cpu_arch_isa_flags = flags;
2940 }
2941 (void) restore_line_pointer (e);
2942 demand_empty_rest_of_line ();
2943 return;
2944 }
2945
2946 j = ARRAY_SIZE (cpu_arch);
2947 }
2948
2949 if (j >= ARRAY_SIZE (cpu_arch))
2950 as_bad (_("no such architecture: `%s'"), string);
2951
2952 *input_line_pointer = e;
2953 }
2954 else
2955 as_bad (_("missing cpu architecture"));
2956
2957 no_cond_jump_promotion = 0;
2958 if (*input_line_pointer == ','
2959 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2960 {
2961 char *string;
2962 char e;
2963
2964 ++input_line_pointer;
2965 e = get_symbol_name (&string);
2966
2967 if (strcmp (string, "nojumps") == 0)
2968 no_cond_jump_promotion = 1;
2969 else if (strcmp (string, "jumps") == 0)
2970 ;
2971 else
2972 as_bad (_("no such architecture modifier: `%s'"), string);
2973
2974 (void) restore_line_pointer (e);
2975 }
2976
2977 demand_empty_rest_of_line ();
2978 }
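/* Examples: ".arch i686" switches the base architecture, while
   ".arch .avx2" (leading dot) merely enables the AVX2 extension on top
   of the current flags, and ".arch .noavx2" disables it via the
   cpu_noarch table.  */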
2979
2980 enum bfd_architecture
2981 i386_arch (void)
2982 {
2983 if (cpu_arch_isa == PROCESSOR_L1OM)
2984 {
2985 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2986 || flag_code != CODE_64BIT)
2987 as_fatal (_("Intel L1OM is 64bit ELF only"));
2988 return bfd_arch_l1om;
2989 }
2990 else if (cpu_arch_isa == PROCESSOR_K1OM)
2991 {
2992 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2993 || flag_code != CODE_64BIT)
2994 as_fatal (_("Intel K1OM is 64bit ELF only"));
2995 return bfd_arch_k1om;
2996 }
2997 else if (cpu_arch_isa == PROCESSOR_IAMCU)
2998 {
2999 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
3000 || flag_code == CODE_64BIT)
3001 as_fatal (_("Intel MCU is 32bit ELF only"));
3002 return bfd_arch_iamcu;
3003 }
3004 else
3005 return bfd_arch_i386;
3006 }
3007
3008 unsigned long
3009 i386_mach (void)
3010 {
3011 if (!strncmp (default_arch, "x86_64", 6))
3012 {
3013 if (cpu_arch_isa == PROCESSOR_L1OM)
3014 {
3015 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
3016 || default_arch[6] != '\0')
3017 as_fatal (_("Intel L1OM is 64bit ELF only"));
3018 return bfd_mach_l1om;
3019 }
3020 else if (cpu_arch_isa == PROCESSOR_K1OM)
3021 {
3022 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
3023 || default_arch[6] != '\0')
3024 as_fatal (_("Intel K1OM is 64bit ELF only"));
3025 return bfd_mach_k1om;
3026 }
3027 else if (default_arch[6] == '\0')
3028 return bfd_mach_x86_64;
3029 else
3030 return bfd_mach_x64_32;
3031 }
3032 else if (!strcmp (default_arch, "i386")
3033 || !strcmp (default_arch, "iamcu"))
3034 {
3035 if (cpu_arch_isa == PROCESSOR_IAMCU)
3036 {
3037 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
3038 as_fatal (_("Intel MCU is 32bit ELF only"));
3039 return bfd_mach_i386_iamcu;
3040 }
3041 else
3042 return bfd_mach_i386_i386;
3043 }
3044 else
3045 as_fatal (_("unknown architecture"));
3046 }
3047 \f
3048 void
3049 md_begin (void)
3050 {
3051 /* Support pseudo prefixes like {disp32}. */
3052 lex_type ['{'] = LEX_BEGIN_NAME;
3053
3054 /* Initialize op_hash hash table. */
3055 op_hash = str_htab_create ();
3056
3057 {
3058 const insn_template *optab;
3059 templates *core_optab;
3060
3061 /* Setup for loop. */
3062 optab = i386_optab;
3063 core_optab = XNEW (templates);
3064 core_optab->start = optab;
3065
3066 while (1)
3067 {
3068 ++optab;
3069 if (optab->name == NULL
3070 || strcmp (optab->name, (optab - 1)->name) != 0)
3071 {
3072 /* different name --> ship out current template list;
3073 add to hash table; & begin anew. */
3074 core_optab->end = optab;
3075 if (str_hash_insert (op_hash, (optab - 1)->name, core_optab, 0))
3076 as_fatal (_("duplicate %s"), (optab - 1)->name);
3077
3078 if (optab->name == NULL)
3079 break;
3080 core_optab = XNEW (templates);
3081 core_optab->start = optab;
3082 }
3083 }
3084 }
3085
3086 /* Initialize reg_hash hash table. */
3087 reg_hash = str_htab_create ();
3088 {
3089 const reg_entry *regtab;
3090 unsigned int regtab_size = i386_regtab_size;
3091
3092 for (regtab = i386_regtab; regtab_size--; regtab++)
3093 if (str_hash_insert (reg_hash, regtab->reg_name, regtab, 0) != NULL)
3094 as_fatal (_("duplicate %s"), regtab->reg_name);
3095 }
3096
3097 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
3098 {
3099 int c;
3100 char *p;
3101
3102 for (c = 0; c < 256; c++)
3103 {
3104 if (ISDIGIT (c))
3105 {
3106 digit_chars[c] = c;
3107 mnemonic_chars[c] = c;
3108 register_chars[c] = c;
3109 operand_chars[c] = c;
3110 }
3111 else if (ISLOWER (c))
3112 {
3113 mnemonic_chars[c] = c;
3114 register_chars[c] = c;
3115 operand_chars[c] = c;
3116 }
3117 else if (ISUPPER (c))
3118 {
3119 mnemonic_chars[c] = TOLOWER (c);
3120 register_chars[c] = mnemonic_chars[c];
3121 operand_chars[c] = c;
3122 }
3123 else if (c == '{' || c == '}')
3124 {
3125 mnemonic_chars[c] = c;
3126 operand_chars[c] = c;
3127 }
3128 #ifdef SVR4_COMMENT_CHARS
3129 else if (c == '\\' && strchr (i386_comment_chars, '/'))
3130 operand_chars[c] = c;
3131 #endif
3132
3133 if (ISALPHA (c) || ISDIGIT (c))
3134 identifier_chars[c] = c;
3135 else if (c >= 128)
3136 {
3137 identifier_chars[c] = c;
3138 operand_chars[c] = c;
3139 }
3140 }
3141
3142 #ifdef LEX_AT
3143 identifier_chars['@'] = '@';
3144 #endif
3145 #ifdef LEX_QM
3146 identifier_chars['?'] = '?';
3147 operand_chars['?'] = '?';
3148 #endif
3149 digit_chars['-'] = '-';
3150 mnemonic_chars['_'] = '_';
3151 mnemonic_chars['-'] = '-';
3152 mnemonic_chars['.'] = '.';
3153 identifier_chars['_'] = '_';
3154 identifier_chars['.'] = '.';
3155
3156 for (p = operand_special_chars; *p != '\0'; p++)
3157 operand_chars[(unsigned char) *p] = *p;
3158 }
3159
3160 if (flag_code == CODE_64BIT)
3161 {
3162 #if defined (OBJ_COFF) && defined (TE_PE)
3163 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3164 ? 32 : 16);
3165 #else
3166 x86_dwarf2_return_column = 16;
3167 #endif
3168 x86_cie_data_alignment = -8;
3169 }
3170 else
3171 {
3172 x86_dwarf2_return_column = 8;
3173 x86_cie_data_alignment = -4;
3174 }
3175
3176 /* NB: a FUSED_JCC_PADDING frag must have sufficient room so that it
3177 can be turned into a BRANCH_PREFIX frag. */
3178 if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3179 abort ();
3180 }
3181
3182 void
3183 i386_print_statistics (FILE *file)
3184 {
3185 htab_print_statistics (file, "i386 opcode", op_hash);
3186 htab_print_statistics (file, "i386 register", reg_hash);
3187 }
3188 \f
3189 #ifdef DEBUG386
3190
3191 /* Debugging routines for md_assemble. */
3192 static void pte (insn_template *);
3193 static void pt (i386_operand_type);
3194 static void pe (expressionS *);
3195 static void ps (symbolS *);
3196
3197 static void
3198 pi (const char *line, i386_insn *x)
3199 {
3200 unsigned int j;
3201
3202 fprintf (stdout, "%s: template ", line);
3203 pte (&x->tm);
3204 fprintf (stdout, " address: base %s index %s scale %x\n",
3205 x->base_reg ? x->base_reg->reg_name : "none",
3206 x->index_reg ? x->index_reg->reg_name : "none",
3207 x->log2_scale_factor);
3208 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
3209 x->rm.mode, x->rm.reg, x->rm.regmem);
3210 fprintf (stdout, " sib: base %x index %x scale %x\n",
3211 x->sib.base, x->sib.index, x->sib.scale);
3212 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
3213 (x->rex & REX_W) != 0,
3214 (x->rex & REX_R) != 0,
3215 (x->rex & REX_X) != 0,
3216 (x->rex & REX_B) != 0);
3217 for (j = 0; j < x->operands; j++)
3218 {
3219 fprintf (stdout, " #%d: ", j + 1);
3220 pt (x->types[j]);
3221 fprintf (stdout, "\n");
3222 if (x->types[j].bitfield.class == Reg
3223 || x->types[j].bitfield.class == RegMMX
3224 || x->types[j].bitfield.class == RegSIMD
3225 || x->types[j].bitfield.class == RegMask
3226 || x->types[j].bitfield.class == SReg
3227 || x->types[j].bitfield.class == RegCR
3228 || x->types[j].bitfield.class == RegDR
3229 || x->types[j].bitfield.class == RegTR
3230 || x->types[j].bitfield.class == RegBND)
3231 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3232 if (operand_type_check (x->types[j], imm))
3233 pe (x->op[j].imms);
3234 if (operand_type_check (x->types[j], disp))
3235 pe (x->op[j].disps);
3236 }
3237 }
3238
3239 static void
3240 pte (insn_template *t)
3241 {
3242 unsigned int j;
3243 fprintf (stdout, " %d operands ", t->operands);
3244 fprintf (stdout, "opcode %x ", t->base_opcode);
3245 if (t->extension_opcode != None)
3246 fprintf (stdout, "ext %x ", t->extension_opcode);
3247 if (t->opcode_modifier.d)
3248 fprintf (stdout, "D");
3249 if (t->opcode_modifier.w)
3250 fprintf (stdout, "W");
3251 fprintf (stdout, "\n");
3252 for (j = 0; j < t->operands; j++)
3253 {
3254 fprintf (stdout, " #%d type ", j + 1);
3255 pt (t->operand_types[j]);
3256 fprintf (stdout, "\n");
3257 }
3258 }
3259
3260 static void
3261 pe (expressionS *e)
3262 {
3263 fprintf (stdout, " operation %d\n", e->X_op);
3264 fprintf (stdout, " add_number %ld (%lx)\n",
3265 (long) e->X_add_number, (long) e->X_add_number);
3266 if (e->X_add_symbol)
3267 {
3268 fprintf (stdout, " add_symbol ");
3269 ps (e->X_add_symbol);
3270 fprintf (stdout, "\n");
3271 }
3272 if (e->X_op_symbol)
3273 {
3274 fprintf (stdout, " op_symbol ");
3275 ps (e->X_op_symbol);
3276 fprintf (stdout, "\n");
3277 }
3278 }
3279
3280 static void
3281 ps (symbolS *s)
3282 {
3283 fprintf (stdout, "%s type %s%s",
3284 S_GET_NAME (s),
3285 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3286 segment_name (S_GET_SEGMENT (s)));
3287 }
3288
3289 static struct type_name
3290 {
3291 i386_operand_type mask;
3292 const char *name;
3293 }
3294 const type_names[] =
3295 {
3296 { OPERAND_TYPE_REG8, "r8" },
3297 { OPERAND_TYPE_REG16, "r16" },
3298 { OPERAND_TYPE_REG32, "r32" },
3299 { OPERAND_TYPE_REG64, "r64" },
3300 { OPERAND_TYPE_ACC8, "acc8" },
3301 { OPERAND_TYPE_ACC16, "acc16" },
3302 { OPERAND_TYPE_ACC32, "acc32" },
3303 { OPERAND_TYPE_ACC64, "acc64" },
3304 { OPERAND_TYPE_IMM8, "i8" },
3305 { OPERAND_TYPE_IMM8S, "i8s" },
3306 { OPERAND_TYPE_IMM16, "i16" },
3307 { OPERAND_TYPE_IMM32, "i32" },
3308 { OPERAND_TYPE_IMM32S, "i32s" },
3309 { OPERAND_TYPE_IMM64, "i64" },
3310 { OPERAND_TYPE_IMM1, "i1" },
3311 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3312 { OPERAND_TYPE_DISP8, "d8" },
3313 { OPERAND_TYPE_DISP16, "d16" },
3314 { OPERAND_TYPE_DISP32, "d32" },
3315 { OPERAND_TYPE_DISP32S, "d32s" },
3316 { OPERAND_TYPE_DISP64, "d64" },
3317 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3318 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3319 { OPERAND_TYPE_CONTROL, "control reg" },
3320 { OPERAND_TYPE_TEST, "test reg" },
3321 { OPERAND_TYPE_DEBUG, "debug reg" },
3322 { OPERAND_TYPE_FLOATREG, "FReg" },
3323 { OPERAND_TYPE_FLOATACC, "FAcc" },
3324 { OPERAND_TYPE_SREG, "SReg" },
3325 { OPERAND_TYPE_REGMMX, "rMMX" },
3326 { OPERAND_TYPE_REGXMM, "rXMM" },
3327 { OPERAND_TYPE_REGYMM, "rYMM" },
3328 { OPERAND_TYPE_REGZMM, "rZMM" },
3329 { OPERAND_TYPE_REGTMM, "rTMM" },
3330 { OPERAND_TYPE_REGMASK, "Mask reg" },
3331 };
3332
3333 static void
3334 pt (i386_operand_type t)
3335 {
3336 unsigned int j;
3337 i386_operand_type a;
3338
3339 for (j = 0; j < ARRAY_SIZE (type_names); j++)
3340 {
3341 a = operand_type_and (t, type_names[j].mask);
3342 if (operand_type_equal (&a, &type_names[j].mask))
3343 fprintf (stdout, "%s, ", type_names[j].name);
3344 }
3345 fflush (stdout);
3346 }
3347
3348 #endif /* DEBUG386 */
3349 \f
3350 static bfd_reloc_code_real_type
3351 reloc (unsigned int size,
3352 int pcrel,
3353 int sign,
3354 bfd_reloc_code_real_type other)
3355 {
3356 if (other != NO_RELOC)
3357 {
3358 reloc_howto_type *rel;
3359
3360 if (size == 8)
3361 switch (other)
3362 {
3363 case BFD_RELOC_X86_64_GOT32:
3364 return BFD_RELOC_X86_64_GOT64;
3365 break;
3366 case BFD_RELOC_X86_64_GOTPLT64:
3367 return BFD_RELOC_X86_64_GOTPLT64;
3368 break;
3369 case BFD_RELOC_X86_64_PLTOFF64:
3370 return BFD_RELOC_X86_64_PLTOFF64;
3371 break;
3372 case BFD_RELOC_X86_64_GOTPC32:
3373 other = BFD_RELOC_X86_64_GOTPC64;
3374 break;
3375 case BFD_RELOC_X86_64_GOTPCREL:
3376 other = BFD_RELOC_X86_64_GOTPCREL64;
3377 break;
3378 case BFD_RELOC_X86_64_TPOFF32:
3379 other = BFD_RELOC_X86_64_TPOFF64;
3380 break;
3381 case BFD_RELOC_X86_64_DTPOFF32:
3382 other = BFD_RELOC_X86_64_DTPOFF64;
3383 break;
3384 default:
3385 break;
3386 }
3387
3388 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3389 if (other == BFD_RELOC_SIZE32)
3390 {
3391 if (size == 8)
3392 other = BFD_RELOC_SIZE64;
3393 if (pcrel)
3394 {
3395 as_bad (_("there are no pc-relative size relocations"));
3396 return NO_RELOC;
3397 }
3398 }
3399 #endif
3400
3401 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
3402 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3403 sign = -1;
3404
3405 rel = bfd_reloc_type_lookup (stdoutput, other);
3406 if (!rel)
3407 as_bad (_("unknown relocation (%u)"), other);
3408 else if (size != bfd_get_reloc_size (rel))
3409 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3410 bfd_get_reloc_size (rel),
3411 size);
3412 else if (pcrel && !rel->pc_relative)
3413 as_bad (_("non-pc-relative relocation for pc-relative field"));
3414 else if ((rel->complain_on_overflow == complain_overflow_signed
3415 && !sign)
3416 || (rel->complain_on_overflow == complain_overflow_unsigned
3417 && sign > 0))
3418 as_bad (_("relocated field and relocation type differ in signedness"));
3419 else
3420 return other;
3421 return NO_RELOC;
3422 }
3423
3424 if (pcrel)
3425 {
3426 if (!sign)
3427 as_bad (_("there are no unsigned pc-relative relocations"));
3428 switch (size)
3429 {
3430 case 1: return BFD_RELOC_8_PCREL;
3431 case 2: return BFD_RELOC_16_PCREL;
3432 case 4: return BFD_RELOC_32_PCREL;
3433 case 8: return BFD_RELOC_64_PCREL;
3434 }
3435 as_bad (_("cannot do %u byte pc-relative relocation"), size);
3436 }
3437 else
3438 {
3439 if (sign > 0)
3440 switch (size)
3441 {
3442 case 4: return BFD_RELOC_X86_64_32S;
3443 }
3444 else
3445 switch (size)
3446 {
3447 case 1: return BFD_RELOC_8;
3448 case 2: return BFD_RELOC_16;
3449 case 4: return BFD_RELOC_32;
3450 case 8: return BFD_RELOC_64;
3451 }
3452 as_bad (_("cannot do %s %u byte relocation"),
3453 sign > 0 ? "signed" : "unsigned", size);
3454 }
3455
3456 return NO_RELOC;
3457 }
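/* Example mappings for the generic (other == NO_RELOC) cases:
   size 4, pcrel -> BFD_RELOC_32_PCREL; size 4, no pcrel, sign > 0
   -> BFD_RELOC_X86_64_32S; size 8, no pcrel -> BFD_RELOC_64.  */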
3458
3459 /* Here we decide which fixups can be adjusted to make them relative to
3460 the beginning of the section instead of the symbol. Basically we need
3461 to make sure that the dynamic relocations are done correctly, so in
3462 some cases we force the original symbol to be used. */
3463
3464 int
3465 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3466 {
3467 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3468 if (!IS_ELF)
3469 return 1;
3470
3471 /* Don't adjust pc-relative references to merge sections in 64-bit
3472 mode. */
3473 if (use_rela_relocations
3474 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3475 && fixP->fx_pcrel)
3476 return 0;
3477
3478 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3479 and changed later by validate_fix. */
3480 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3481 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3482 return 0;
3483
3484 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
3485 for size relocations. */
3486 if (fixP->fx_r_type == BFD_RELOC_SIZE32
3487 || fixP->fx_r_type == BFD_RELOC_SIZE64
3488 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3489 || fixP->fx_r_type == BFD_RELOC_386_GOT32
3490 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3491 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3492 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3493 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3494 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3495 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3496 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3497 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3498 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3499 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3500 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3501 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3502 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3503 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3504 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3505 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3506 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3507 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3508 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3509 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3510 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3511 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3512 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3513 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3514 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3515 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3516 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3517 return 0;
3518 #endif
3519 return 1;
3520 }
3521
3522 static int
3523 intel_float_operand (const char *mnemonic)
3524 {
3525 /* Note that the value returned is meaningful only for opcodes with (memory)
3526 operands, hence the code here is free to improperly handle opcodes that
3527 have no operands (for better performance and smaller code). */
3528
3529 if (mnemonic[0] != 'f')
3530 return 0; /* non-math */
3531
3532 switch (mnemonic[1])
3533 {
3534 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3535 the fs segment override prefix are not currently handled, because
3536 no call path can make opcodes without operands get here. */
3537 case 'i':
3538 return 2 /* integer op */;
3539 case 'l':
3540 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3541 return 3; /* fldcw/fldenv */
3542 break;
3543 case 'n':
3544 if (mnemonic[2] != 'o' /* fnop */)
3545 return 3; /* non-waiting control op */
3546 break;
3547 case 'r':
3548 if (mnemonic[2] == 's')
3549 return 3; /* frstor/frstpm */
3550 break;
3551 case 's':
3552 if (mnemonic[2] == 'a')
3553 return 3; /* fsave */
3554 if (mnemonic[2] == 't')
3555 {
3556 switch (mnemonic[3])
3557 {
3558 case 'c': /* fstcw */
3559 case 'd': /* fstdw */
3560 case 'e': /* fstenv */
3561 case 's': /* fsts[gw] */
3562 return 3;
3563 }
3564 }
3565 break;
3566 case 'x':
3567 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3568 return 0; /* fxsave/fxrstor are not really math ops */
3569 break;
3570 }
3571
3572 return 1;
3573 }
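/* Examples: "fadd" -> 1 (FP-format operand), "fild" -> 2 (integer
   operand), "fldcw" -> 3 (control op, e.g. control word), and
   "fxsave" -> 0 (not treated as a math op).  */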
3574
3575 /* Build the VEX prefix. */
3576
3577 static void
3578 build_vex_prefix (const insn_template *t)
3579 {
3580 unsigned int register_specifier;
3581 unsigned int implied_prefix;
3582 unsigned int vector_length;
3583 unsigned int w;
3584
3585 /* Check register specifier. */
3586 if (i.vex.register_specifier)
3587 {
3588 register_specifier =
3589 ~register_number (i.vex.register_specifier) & 0xf;
3590 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3591 }
3592 else
3593 register_specifier = 0xf;
3594
3595 /* Use the 2-byte VEX prefix by swapping destination and source operands
3596 if there is more than one register operand. */
3597 if (i.reg_operands > 1
3598 && i.vec_encoding != vex_encoding_vex3
3599 && i.dir_encoding == dir_encoding_default
3600 && i.operands == i.reg_operands
3601 && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3602 && i.tm.opcode_modifier.opcodeprefix == VEX0F
3603 && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3604 && i.rex == REX_B)
3605 {
3606 unsigned int xchg = i.operands - 1;
3607 union i386_op temp_op;
3608 i386_operand_type temp_type;
3609
3610 temp_type = i.types[xchg];
3611 i.types[xchg] = i.types[0];
3612 i.types[0] = temp_type;
3613 temp_op = i.op[xchg];
3614 i.op[xchg] = i.op[0];
3615 i.op[0] = temp_op;
3616
3617 gas_assert (i.rm.mode == 3);
3618
3619 i.rex = REX_R;
3620 xchg = i.rm.regmem;
3621 i.rm.regmem = i.rm.reg;
3622 i.rm.reg = xchg;
3623
3624 if (i.tm.opcode_modifier.d)
3625 i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3626 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3627 else /* Use the next insn. */
3628 i.tm = t[1];
3629 }
3630
3631 /* Use the 2-byte VEX prefix by swapping commutative source operands if
3632 there are no memory operands and at least 3 register operands. */
3633 if (i.reg_operands >= 3
3634 && i.vec_encoding != vex_encoding_vex3
3635 && i.reg_operands == i.operands - i.imm_operands
3636 && i.tm.opcode_modifier.vex
3637 && i.tm.opcode_modifier.commutative
3638 && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3639 && i.rex == REX_B
3640 && i.vex.register_specifier
3641 && !(i.vex.register_specifier->reg_flags & RegRex))
3642 {
3643 unsigned int xchg = i.operands - i.reg_operands;
3644 union i386_op temp_op;
3645 i386_operand_type temp_type;
3646
3647 gas_assert (i.tm.opcode_modifier.opcodeprefix == VEX0F);
3648 gas_assert (!i.tm.opcode_modifier.sae);
3649 gas_assert (operand_type_equal (&i.types[i.operands - 2],
3650 &i.types[i.operands - 3]));
3651 gas_assert (i.rm.mode == 3);
3652
3653 temp_type = i.types[xchg];
3654 i.types[xchg] = i.types[xchg + 1];
3655 i.types[xchg + 1] = temp_type;
3656 temp_op = i.op[xchg];
3657 i.op[xchg] = i.op[xchg + 1];
3658 i.op[xchg + 1] = temp_op;
3659
3660 i.rex = 0;
3661 xchg = i.rm.regmem | 8;
3662 i.rm.regmem = ~register_specifier & 0xf;
3663 gas_assert (!(i.rm.regmem & 8));
3664 i.vex.register_specifier += xchg - i.rm.regmem;
3665 register_specifier = ~xchg & 0xf;
3666 }
3667
3668 if (i.tm.opcode_modifier.vex == VEXScalar)
3669 vector_length = avxscalar;
3670 else if (i.tm.opcode_modifier.vex == VEX256)
3671 vector_length = 1;
3672 else
3673 {
3674 unsigned int op;
3675
3676 /* Determine vector length from the last multi-length vector
3677 operand. */
3678 vector_length = 0;
3679 for (op = t->operands; op--;)
3680 if (t->operand_types[op].bitfield.xmmword
3681 && t->operand_types[op].bitfield.ymmword
3682 && i.types[op].bitfield.ymmword)
3683 {
3684 vector_length = 1;
3685 break;
3686 }
3687 }
3688
3689 switch ((i.tm.base_opcode >> (i.tm.opcode_length << 3)) & 0xff)
3690 {
3691 case 0:
3692 implied_prefix = 0;
3693 break;
3694 case DATA_PREFIX_OPCODE:
3695 implied_prefix = 1;
3696 break;
3697 case REPE_PREFIX_OPCODE:
3698 implied_prefix = 2;
3699 break;
3700 case REPNE_PREFIX_OPCODE:
3701 implied_prefix = 3;
3702 break;
3703 default:
3704 abort ();
3705 }
3706
3707 /* Check the REX.W bit and VEXW. */
3708 if (i.tm.opcode_modifier.vexw == VEXWIG)
3709 w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3710 else if (i.tm.opcode_modifier.vexw)
3711 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3712 else
3713 w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3714
3715 /* Use 2-byte VEX prefix if possible. */
3716 if (w == 0
3717 && i.vec_encoding != vex_encoding_vex3
3718 && i.tm.opcode_modifier.opcodeprefix == VEX0F
3719 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3720 {
3721 /* 2-byte VEX prefix. */
3722 unsigned int r;
3723
3724 i.vex.length = 2;
3725 i.vex.bytes[0] = 0xc5;
3726
3727 /* Check the REX.R bit. */
3728 r = (i.rex & REX_R) ? 0 : 1;
3729 i.vex.bytes[1] = (r << 7
3730 | register_specifier << 3
3731 | vector_length << 2
3732 | implied_prefix);
3733 }
3734 else
3735 {
3736 /* 3-byte VEX prefix. */
3737 unsigned int m;
3738
3739 i.vex.length = 3;
3740
3741 switch (i.tm.opcode_modifier.opcodeprefix)
3742 {
3743 case VEX0F:
3744 m = 0x1;
3745 i.vex.bytes[0] = 0xc4;
3746 break;
3747 case VEX0F38:
3748 m = 0x2;
3749 i.vex.bytes[0] = 0xc4;
3750 break;
3751 case VEX0F3A:
3752 m = 0x3;
3753 i.vex.bytes[0] = 0xc4;
3754 break;
3755 case XOP08:
3756 m = 0x8;
3757 i.vex.bytes[0] = 0x8f;
3758 break;
3759 case XOP09:
3760 m = 0x9;
3761 i.vex.bytes[0] = 0x8f;
3762 break;
3763 case XOP0A:
3764 m = 0xa;
3765 i.vex.bytes[0] = 0x8f;
3766 break;
3767 default:
3768 abort ();
3769 }
3770
3771 /* The high 3 bits of the second VEX byte are 1's complement
3772 of RXB bits from REX. */
3773 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3774
3775 i.vex.bytes[2] = (w << 7
3776 | register_specifier << 3
3777 | vector_length << 2
3778 | implied_prefix);
3779 }
3780 }
3781
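/* For reference, the VEX prefix layouts produced above (per the Intel
   SDM):

     2-byte:  C5 | R.vvvv.L.pp
     3-byte:  C4 | R.X.B.m-mmmm | W.vvvv.L.pp

   R/X/B are the complemented REX bits, vvvv the complemented second
   register specifier, L the vector length (0 = 128-bit, 1 = 256-bit)
   and pp the implied prefix (00 = none, 01 = 66, 10 = F3, 11 = F2).  */
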
3782 static INLINE bfd_boolean
3783 is_evex_encoding (const insn_template *t)
3784 {
3785 return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3786 || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3787 || t->opcode_modifier.sae;
3788 }
3789
3790 static INLINE bfd_boolean
3791 is_any_vex_encoding (const insn_template *t)
3792 {
3793 return t->opcode_modifier.vex || is_evex_encoding (t);
3794 }
3795
3796 /* Build the EVEX prefix. */
3797
3798 static void
3799 build_evex_prefix (void)
3800 {
3801 unsigned int register_specifier;
3802 unsigned int implied_prefix;
3803 unsigned int m, w;
3804 rex_byte vrex_used = 0;
3805
3806 /* Check register specifier. */
3807 if (i.vex.register_specifier)
3808 {
3809 gas_assert ((i.vrex & REX_X) == 0);
3810
3811 register_specifier = i.vex.register_specifier->reg_num;
3812 if ((i.vex.register_specifier->reg_flags & RegRex))
3813 register_specifier += 8;
3814 /* The upper 16 registers are encoded in the fourth byte of the
3815 EVEX prefix. */
3816 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3817 i.vex.bytes[3] = 0x8;
3818 register_specifier = ~register_specifier & 0xf;
3819 }
3820 else
3821 {
3822 register_specifier = 0xf;
3823
3824 /* Encode upper 16 vector index register in the fourth byte of
3825 the EVEX prefix. */
3826 if (!(i.vrex & REX_X))
3827 i.vex.bytes[3] = 0x8;
3828 else
3829 vrex_used |= REX_X;
3830 }
3831
3832 switch ((i.tm.base_opcode >> 8) & 0xff)
3833 {
3834 case 0:
3835 implied_prefix = 0;
3836 break;
3837 case DATA_PREFIX_OPCODE:
3838 implied_prefix = 1;
3839 break;
3840 case REPE_PREFIX_OPCODE:
3841 implied_prefix = 2;
3842 break;
3843 case REPNE_PREFIX_OPCODE:
3844 implied_prefix = 3;
3845 break;
3846 default:
3847 abort ();
3848 }
3849
3850 /* 4 byte EVEX prefix. */
3851 i.vex.length = 4;
3852 i.vex.bytes[0] = 0x62;
3853
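/* For reference, the 4-byte EVEX prefix layout being assembled here
   (per the Intel SDM):

     62 | R.X.B.R'.0.0.m.m | W.vvvv.1.pp | z.L'L.b.V'.aaa

   R/X/B/R' and V' are complemented register-extension bits, vvvv the
   complemented register specifier, pp the implied prefix, L'L the
   vector length (or the rounding control when b is set for register
   operands), b the broadcast/RC/SAE bit, z the zeroing-masking bit and
   aaa the opmask register.  */
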
3854 /* mmmm bits. */
3855 switch (i.tm.opcode_modifier.opcodeprefix)
3856 {
3857 case VEX0F:
3858 m = 1;
3859 break;
3860 case VEX0F38:
3861 m = 2;
3862 break;
3863 case VEX0F3A:
3864 m = 3;
3865 break;
3866 default:
3867 abort ();
3868 break;
3869 }
3870
3871 /* The high 3 bits of the second EVEX byte are 1's complement of RXB
3872 bits from REX. */
3873 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3874
3875 /* The fifth bit of the second EVEX byte is 1's complement of the
3876 REX_R bit in VREX. */
3877 if (!(i.vrex & REX_R))
3878 i.vex.bytes[1] |= 0x10;
3879 else
3880 vrex_used |= REX_R;
3881
3882 if ((i.reg_operands + i.imm_operands) == i.operands)
3883 {
3884 /* When all operands are registers, the REX_X bit in REX is not
3885 used. We reuse it to encode the upper 16 registers, which is
3886 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3887 as 1's complement. */
3888 if ((i.vrex & REX_B))
3889 {
3890 vrex_used |= REX_B;
3891 i.vex.bytes[1] &= ~0x40;
3892 }
3893 }
3894
3895 /* EVEX instructions shouldn't need the REX prefix. */
3896 i.vrex &= ~vrex_used;
3897 gas_assert (i.vrex == 0);
3898
3899 /* Check the REX.W bit and VEXW. */
3900 if (i.tm.opcode_modifier.vexw == VEXWIG)
3901 w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3902 else if (i.tm.opcode_modifier.vexw)
3903 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3904 else
3905 w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3906
3907 /* Encode the U bit. */
3908 implied_prefix |= 0x4;
3909
3910 /* The third byte of the EVEX prefix. */
3911 i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3912
3913 /* The fourth byte of the EVEX prefix. */
3914 /* The zeroing-masking bit. */
3915 if (i.mask && i.mask->zeroing)
3916 i.vex.bytes[3] |= 0x80;
3917
3918 /* Encode vector length and the broadcast bit only when there is no rounding control; RC reuses the L'L and b bits. */
3919 if (!i.rounding)
3920 {
3921 /* Encode the vector length. */
3922 unsigned int vec_length;
3923
3924 if (!i.tm.opcode_modifier.evex
3925 || i.tm.opcode_modifier.evex == EVEXDYN)
3926 {
3927 unsigned int op;
3928
3929 /* Determine vector length from the last multi-length vector
3930 operand. */
3931 for (op = i.operands; op--;)
3932 if (i.tm.operand_types[op].bitfield.xmmword
3933 + i.tm.operand_types[op].bitfield.ymmword
3934 + i.tm.operand_types[op].bitfield.zmmword > 1)
3935 {
3936 if (i.types[op].bitfield.zmmword)
3937 {
3938 i.tm.opcode_modifier.evex = EVEX512;
3939 break;
3940 }
3941 else if (i.types[op].bitfield.ymmword)
3942 {
3943 i.tm.opcode_modifier.evex = EVEX256;
3944 break;
3945 }
3946 else if (i.types[op].bitfield.xmmword)
3947 {
3948 i.tm.opcode_modifier.evex = EVEX128;
3949 break;
3950 }
3951 else if (i.broadcast && (int) op == i.broadcast->operand)
3952 {
3953 switch (i.broadcast->bytes)
3954 {
3955 case 64:
3956 i.tm.opcode_modifier.evex = EVEX512;
3957 break;
3958 case 32:
3959 i.tm.opcode_modifier.evex = EVEX256;
3960 break;
3961 case 16:
3962 i.tm.opcode_modifier.evex = EVEX128;
3963 break;
3964 default:
3965 abort ();
3966 }
3967 break;
3968 }
3969 }
3970
3971 if (op >= MAX_OPERANDS)
3972 abort ();
3973 }
3974
3975 switch (i.tm.opcode_modifier.evex)
3976 {
3977 case EVEXLIG: /* LL' is ignored */
3978 vec_length = evexlig << 5;
3979 break;
3980 case EVEX128:
3981 vec_length = 0 << 5;
3982 break;
3983 case EVEX256:
3984 vec_length = 1 << 5;
3985 break;
3986 case EVEX512:
3987 vec_length = 2 << 5;
3988 break;
3989 default:
3990 abort ();
3991 break;
3992 }
3993 i.vex.bytes[3] |= vec_length;
3994 /* Encode the broadcast bit. */
3995 if (i.broadcast)
3996 i.vex.bytes[3] |= 0x10;
3997 }
3998 else
3999 {
4000 if (i.rounding->type != saeonly)
4001 i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
4002 else
4003 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
4004 }
4005
4006 if (i.mask && i.mask->mask)
4007 i.vex.bytes[3] |= i.mask->mask->reg_num;
4008 }
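/* Worked example (illustrative only; layout per the Intel SDM:
   62 | R X B R' 0 0 m m | W vvvv 1 pp | z L'L b V' aaa):
   vaddps %zmm2, %zmm1, %zmm0{%k1} -> 62 F1 74 49 58 C2
   (F1: ~RXB=111b, R'=1, mm=01b for the 0F map;
   74: W=0, vvvv=~1=1110b, fixed 1, pp=00b;
   49: z=0, L'L=10b for 512 bits, b=0, V'=1, aaa=001b for %k1). */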
4009
4010 static void
4011 process_immext (void)
4012 {
4013 expressionS *exp;
4014
4015 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
4016 which is coded in the same place as an 8-bit immediate field
4017 would be. Here we fake an 8-bit immediate operand from the
4018 opcode suffix stored in tm.extension_opcode.
4019
4020 AVX instructions also use this encoding for some
4021 3-operand instructions. */
4022
4023 gas_assert (i.imm_operands <= 1
4024 && (i.operands <= 2
4025 || (is_any_vex_encoding (&i.tm)
4026 && i.operands <= 4)));
4027
4028 exp = &im_expressions[i.imm_operands++];
4029 i.op[i.operands].imms = exp;
4030 i.types[i.operands] = imm8;
4031 i.operands++;
4032 exp->X_op = O_constant;
4033 exp->X_add_number = i.tm.extension_opcode;
4034 i.tm.extension_opcode = None;
4035 }
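/* For illustration (assumed example, not from the original source):
   3DNow! pfadd is encoded as 0F 0F /r with suffix byte 9E, so for
   `pfadd %mm1, %mm0' the 9E held in tm.extension_opcode becomes a
   fake trailing imm8 operand and is emitted like any immediate. */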
4036
4037
4038 static int
4039 check_hle (void)
4040 {
4041 switch (i.tm.opcode_modifier.prefixok)
4042 {
4043 default:
4044 abort ();
4045 case PrefixLock:
4046 case PrefixNone:
4047 case PrefixNoTrack:
4048 case PrefixRep:
4049 as_bad (_("invalid instruction `%s' after `%s'"),
4050 i.tm.name, i.hle_prefix);
4051 return 0;
4052 case PrefixHLELock:
4053 if (i.prefix[LOCK_PREFIX])
4054 return 1;
4055 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
4056 return 0;
4057 case PrefixHLEAny:
4058 return 1;
4059 case PrefixHLERelease:
4060 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
4061 {
4062 as_bad (_("instruction `%s' after `xacquire' not allowed"),
4063 i.tm.name);
4064 return 0;
4065 }
4066 if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
4067 {
4068 as_bad (_("memory destination needed for instruction `%s'"
4069 " after `xrelease'"), i.tm.name);
4070 return 0;
4071 }
4072 return 1;
4073 }
4074 }
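/* Usage sketch (illustrative assumption): `xacquire lock incl (%rax)'
   passes the PrefixHLELock case since LOCK is present, while
   `xrelease movl %eax, (%rbx)' is the PrefixHLERelease case, which
   additionally insists on a memory destination. */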
4075
4076 /* Try the shortest encoding by shortening operand size. */
4077
4078 static void
4079 optimize_encoding (void)
4080 {
4081 unsigned int j;
4082
4083 if (optimize_for_space
4084 && !is_any_vex_encoding (&i.tm)
4085 && i.reg_operands == 1
4086 && i.imm_operands == 1
4087 && !i.types[1].bitfield.byte
4088 && i.op[0].imms->X_op == O_constant
4089 && fits_in_imm7 (i.op[0].imms->X_add_number)
4090 && (i.tm.base_opcode == 0xa8
4091 || (i.tm.base_opcode == 0xf6
4092 && i.tm.extension_opcode == 0x0)))
4093 {
4094 /* Optimize: -Os:
4095 test $imm7, %r64/%r32/%r16 -> test $imm7, %r8
4096 */
4097 unsigned int base_regnum = i.op[1].regs->reg_num;
4098 if (flag_code == CODE_64BIT || base_regnum < 4)
4099 {
4100 i.types[1].bitfield.byte = 1;
4101 /* Ignore the suffix. */
4102 i.suffix = 0;
4103 /* Convert to byte registers. */
4104 if (i.types[1].bitfield.word)
4105 j = 16;
4106 else if (i.types[1].bitfield.dword)
4107 j = 32;
4108 else
4109 j = 48;
4110 if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4111 j += 8;
4112 i.op[1].regs -= j;
4113 }
4114 }
4115 else if (flag_code == CODE_64BIT
4116 && !is_any_vex_encoding (&i.tm)
4117 && ((i.types[1].bitfield.qword
4118 && i.reg_operands == 1
4119 && i.imm_operands == 1
4120 && i.op[0].imms->X_op == O_constant
4121 && ((i.tm.base_opcode == 0xb8
4122 && i.tm.extension_opcode == None
4123 && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4124 || (fits_in_imm31 (i.op[0].imms->X_add_number)
4125 && ((i.tm.base_opcode == 0x24
4126 || i.tm.base_opcode == 0xa8)
4127 || (i.tm.base_opcode == 0x80
4128 && i.tm.extension_opcode == 0x4)
4129 || ((i.tm.base_opcode == 0xf6
4130 || (i.tm.base_opcode | 1) == 0xc7)
4131 && i.tm.extension_opcode == 0x0)))
4132 || (fits_in_imm7 (i.op[0].imms->X_add_number)
4133 && i.tm.base_opcode == 0x83
4134 && i.tm.extension_opcode == 0x4)))
4135 || (i.types[0].bitfield.qword
4136 && ((i.reg_operands == 2
4137 && i.op[0].regs == i.op[1].regs
4138 && (i.tm.base_opcode == 0x30
4139 || i.tm.base_opcode == 0x28))
4140 || (i.reg_operands == 1
4141 && i.operands == 1
4142 && i.tm.base_opcode == 0x30)))))
4143 {
4144 /* Optimize: -O:
4145 andq $imm31, %r64 -> andl $imm31, %r32
4146 andq $imm7, %r64 -> andl $imm7, %r32
4147 testq $imm31, %r64 -> testl $imm31, %r32
4148 xorq %r64, %r64 -> xorl %r32, %r32
4149 subq %r64, %r64 -> subl %r32, %r32
4150 movq $imm31, %r64 -> movl $imm31, %r32
4151 movq $imm32, %r64 -> movl $imm32, %r32
4152 */
4153 i.tm.opcode_modifier.norex64 = 1;
4154 if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
4155 {
4156 /* Handle
4157 movq $imm31, %r64 -> movl $imm31, %r32
4158 movq $imm32, %r64 -> movl $imm32, %r32
4159 */
4160 i.tm.operand_types[0].bitfield.imm32 = 1;
4161 i.tm.operand_types[0].bitfield.imm32s = 0;
4162 i.tm.operand_types[0].bitfield.imm64 = 0;
4163 i.types[0].bitfield.imm32 = 1;
4164 i.types[0].bitfield.imm32s = 0;
4165 i.types[0].bitfield.imm64 = 0;
4166 i.types[1].bitfield.dword = 1;
4167 i.types[1].bitfield.qword = 0;
4168 if ((i.tm.base_opcode | 1) == 0xc7)
4169 {
4170 /* Handle
4171 movq $imm31, %r64 -> movl $imm31, %r32
4172 */
4173 i.tm.base_opcode = 0xb8;
4174 i.tm.extension_opcode = None;
4175 i.tm.opcode_modifier.w = 0;
4176 i.tm.opcode_modifier.modrm = 0;
4177 }
4178 }
4179 }
4180 else if (optimize > 1
4181 && !optimize_for_space
4182 && !is_any_vex_encoding (&i.tm)
4183 && i.reg_operands == 2
4184 && i.op[0].regs == i.op[1].regs
4185 && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4186 || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4187 && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4188 {
4189 /* Optimize: -O2:
4190 andb %rN, %rN -> testb %rN, %rN
4191 andw %rN, %rN -> testw %rN, %rN
4192 andq %rN, %rN -> testq %rN, %rN
4193 orb %rN, %rN -> testb %rN, %rN
4194 orw %rN, %rN -> testw %rN, %rN
4195 orq %rN, %rN -> testq %rN, %rN
4196
4197 and outside of 64-bit mode
4198
4199 andl %rN, %rN -> testl %rN, %rN
4200 orl %rN, %rN -> testl %rN, %rN
4201 */
4202 i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4203 }
4204 else if (i.reg_operands == 3
4205 && i.op[0].regs == i.op[1].regs
4206 && !i.types[2].bitfield.xmmword
4207 && (i.tm.opcode_modifier.vex
4208 || ((!i.mask || i.mask->zeroing)
4209 && !i.rounding
4210 && is_evex_encoding (&i.tm)
4211 && (i.vec_encoding != vex_encoding_evex
4212 || cpu_arch_isa_flags.bitfield.cpuavx512vl
4213 || i.tm.cpu_flags.bitfield.cpuavx512vl
4214 || (i.tm.operand_types[2].bitfield.zmmword
4215 && i.types[2].bitfield.ymmword))))
4216 && ((i.tm.base_opcode == 0x55
4217 || i.tm.base_opcode == 0x6655
4218 || i.tm.base_opcode == 0x66df
4219 || i.tm.base_opcode == 0x57
4220 || i.tm.base_opcode == 0x6657
4221 || i.tm.base_opcode == 0x66ef
4222 || i.tm.base_opcode == 0x66f8
4223 || i.tm.base_opcode == 0x66f9
4224 || i.tm.base_opcode == 0x66fa
4225 || i.tm.base_opcode == 0x66fb
4226 || i.tm.base_opcode == 0x42
4227 || i.tm.base_opcode == 0x6642
4228 || i.tm.base_opcode == 0x47
4229 || i.tm.base_opcode == 0x6647)
4230 && i.tm.extension_opcode == None))
4231 {
4232 /* Optimize: -O1:
4233 VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4234 vpsubq and vpsubw:
4235 EVEX VOP %zmmM, %zmmM, %zmmN
4236 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4237 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4238 EVEX VOP %ymmM, %ymmM, %ymmN
4239 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4240 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4241 VEX VOP %ymmM, %ymmM, %ymmN
4242 -> VEX VOP %xmmM, %xmmM, %xmmN
4243 VOP, one of vpandn and vpxor:
4244 VEX VOP %ymmM, %ymmM, %ymmN
4245 -> VEX VOP %xmmM, %xmmM, %xmmN
4246 VOP, one of vpandnd and vpandnq:
4247 EVEX VOP %zmmM, %zmmM, %zmmN
4248 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4249 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4250 EVEX VOP %ymmM, %ymmM, %ymmN
4251 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4252 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4253 VOP, one of vpxord and vpxorq:
4254 EVEX VOP %zmmM, %zmmM, %zmmN
4255 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4256 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4257 EVEX VOP %ymmM, %ymmM, %ymmN
4258 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4259 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4260 VOP, one of kxord and kxorq:
4261 VEX VOP %kM, %kM, %kN
4262 -> VEX kxorw %kM, %kM, %kN
4263 VOP, one of kandnd and kandnq:
4264 VEX VOP %kM, %kM, %kN
4265 -> VEX kandnw %kM, %kM, %kN
4266 */
4267 if (is_evex_encoding (&i.tm))
4268 {
4269 if (i.vec_encoding != vex_encoding_evex)
4270 {
4271 i.tm.opcode_modifier.vex = VEX128;
4272 i.tm.opcode_modifier.vexw = VEXW0;
4273 i.tm.opcode_modifier.evex = 0;
4274 }
4275 else if (optimize > 1)
4276 i.tm.opcode_modifier.evex = EVEX128;
4277 else
4278 return;
4279 }
4280 else if (i.tm.operand_types[0].bitfield.class == RegMask)
4281 {
4282 i.tm.base_opcode &= 0xff;
4283 i.tm.opcode_modifier.vexw = VEXW0;
4284 }
4285 else
4286 i.tm.opcode_modifier.vex = VEX128;
4287
4288 if (i.tm.opcode_modifier.vex)
4289 for (j = 0; j < 3; j++)
4290 {
4291 i.types[j].bitfield.xmmword = 1;
4292 i.types[j].bitfield.ymmword = 0;
4293 }
4294 }
4295 else if (i.vec_encoding != vex_encoding_evex
4296 && !i.types[0].bitfield.zmmword
4297 && !i.types[1].bitfield.zmmword
4298 && !i.mask
4299 && !i.broadcast
4300 && is_evex_encoding (&i.tm)
4301 && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4302 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
4303 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f
4304 || (i.tm.base_opcode & ~4) == 0x66db
4305 || (i.tm.base_opcode & ~4) == 0x66eb)
4306 && i.tm.extension_opcode == None)
4307 {
4308 /* Optimize: -O1:
4309 VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4310 vmovdqu32 and vmovdqu64:
4311 EVEX VOP %xmmM, %xmmN
4312 -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4313 EVEX VOP %ymmM, %ymmN
4314 -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4315 EVEX VOP %xmmM, mem
4316 -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4317 EVEX VOP %ymmM, mem
4318 -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4319 EVEX VOP mem, %xmmN
4320 -> VEX vmovdqa|vmovdqu mem, %xmmN (N < 16)
4321 EVEX VOP mem, %ymmN
4322 -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4323 VOP, one of vpand, vpandn, vpor, vpxor:
4324 EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4325 -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4326 EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4327 -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4328 EVEX VOP{d,q} mem, %xmmM, %xmmN
4329 -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4330 EVEX VOP{d,q} mem, %ymmM, %ymmN
4331 -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4332 */
4333 for (j = 0; j < i.operands; j++)
4334 if (operand_type_check (i.types[j], disp)
4335 && i.op[j].disps->X_op == O_constant)
4336 {
4337 /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4338 has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4339 bytes, we choose EVEX Disp8 over VEX Disp32. */
4340 int evex_disp8, vex_disp8;
4341 unsigned int memshift = i.memshift;
4342 offsetT n = i.op[j].disps->X_add_number;
4343
4344 evex_disp8 = fits_in_disp8 (n);
4345 i.memshift = 0;
4346 vex_disp8 = fits_in_disp8 (n);
4347 if (evex_disp8 != vex_disp8)
4348 {
4349 i.memshift = memshift;
4350 return;
4351 }
4352
4353 i.types[j].bitfield.disp8 = vex_disp8;
4354 break;
4355 }
4356 if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4357 i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
4358 i.tm.opcode_modifier.vex
4359 = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4360 i.tm.opcode_modifier.vexw = VEXW0;
4361 /* VPAND, VPOR, and VPXOR are commutative. */
4362 if (i.reg_operands == 3 && i.tm.base_opcode != 0x66df)
4363 i.tm.opcode_modifier.commutative = 1;
4364 i.tm.opcode_modifier.evex = 0;
4365 i.tm.opcode_modifier.masking = 0;
4366 i.tm.opcode_modifier.broadcast = 0;
4367 i.tm.opcode_modifier.disp8memshift = 0;
4368 i.memshift = 0;
4369 if (j < i.operands)
4370 i.types[j].bitfield.disp8
4371 = fits_in_disp8 (i.op[j].disps->X_add_number);
4372 }
4373 }
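/* Byte-count sketch of the transformations above (illustrative, not
   from the original source):
   movq $1, %rax (48 C7 C0 01 00 00 00, 7 bytes)
   -> movl $1, %eax (B8 01 00 00 00, 5 bytes);
   xorq %rbx, %rbx (48 31 DB) -> xorl %ebx, %ebx (31 DB), the upper
   32 bits being zeroed implicitly in 64-bit mode;
   EVEX vpxord %zmm1, %zmm1, %zmm1 (6 bytes)
   -> VEX vpxor %xmm1, %xmm1, %xmm1 (C5 F1 EF C9, 4 bytes).
   Note the Disp8*N check: with a 16-byte operand, 256(%rax) encodes
   as disp8 16 under EVEX but needs a disp32 under VEX, so such
   operands are deliberately left in EVEX form. */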
4374
4375 /* Return non-zero for load instruction. */
4376
4377 static int
4378 load_insn_p (void)
4379 {
4380 unsigned int dest;
4381 int any_vex_p = is_any_vex_encoding (&i.tm);
4382 unsigned int base_opcode = i.tm.base_opcode | 1;
4383
4384 if (!any_vex_p)
4385 {
4386 /* Anysize insns: lea, invlpg, clflush, prefetchnta, prefetcht0,
4387 prefetcht1, prefetcht2, prefetchw, bndmk, bndcl, bndcu, bndcn,
4388 bndstx, bndldx, prefetchwt1, clflushopt, clwb, cldemote. */
4389 if (i.tm.opcode_modifier.anysize)
4390 return 0;
4391
4392 /* pop, popf, popa. */
4393 if (strcmp (i.tm.name, "pop") == 0
4394 || i.tm.base_opcode == 0x9d
4395 || i.tm.base_opcode == 0x61)
4396 return 1;
4397
4398 /* movs, cmps, lods, scas. */
4399 if ((i.tm.base_opcode | 0xb) == 0xaf)
4400 return 1;
4401
4402 /* outs, xlatb. */
4403 if (base_opcode == 0x6f
4404 || i.tm.base_opcode == 0xd7)
4405 return 1;
4406 /* NB: AMD-specific insns with implicit memory operands are
4407 intentionally not covered. */
4408 }
4409
4410 /* No memory operand. */
4411 if (!i.mem_operands)
4412 return 0;
4413
4414 if (any_vex_p)
4415 {
4416 /* vldmxcsr. */
4417 if (i.tm.base_opcode == 0xae
4418 && i.tm.opcode_modifier.vex
4419 && i.tm.opcode_modifier.opcodeprefix == VEX0F
4420 && i.tm.extension_opcode == 2)
4421 return 1;
4422 }
4423 else
4424 {
4425 /* test, not, neg, mul, imul, div, idiv. */
4426 if ((i.tm.base_opcode == 0xf6 || i.tm.base_opcode == 0xf7)
4427 && i.tm.extension_opcode != 1)
4428 return 1;
4429
4430 /* inc, dec. */
4431 if (base_opcode == 0xff && i.tm.extension_opcode <= 1)
4432 return 1;
4433
4434 /* add, or, adc, sbb, and, sub, xor, cmp. */
4435 if (i.tm.base_opcode >= 0x80 && i.tm.base_opcode <= 0x83)
4436 return 1;
4437
4438 /* bt, bts, btr, btc. */
4439 if (i.tm.base_opcode == 0xfba
4440 && (i.tm.extension_opcode >= 4 && i.tm.extension_opcode <= 7))
4441 return 1;
4442
4443 /* rol, ror, rcl, rcr, shl/sal, shr, sar. */
4444 if ((base_opcode == 0xc1
4445 || (i.tm.base_opcode >= 0xd0 && i.tm.base_opcode <= 0xd3))
4446 && i.tm.extension_opcode != 6)
4447 return 1;
4448
4449 /* cmpxchg8b, cmpxchg16b, xrstors. */
4450 if (i.tm.base_opcode == 0xfc7
4451 && i.tm.opcode_modifier.opcodeprefix == 0
4452 && (i.tm.extension_opcode == 1 || i.tm.extension_opcode == 3))
4453 return 1;
4454
4455 /* fxrstor, ldmxcsr, xrstor. */
4456 if (i.tm.base_opcode == 0xfae
4457 && (i.tm.extension_opcode == 1
4458 || i.tm.extension_opcode == 2
4459 || i.tm.extension_opcode == 5))
4460 return 1;
4461
4462 /* lgdt, lidt, lmsw. */
4463 if (i.tm.base_opcode == 0xf01
4464 && (i.tm.extension_opcode == 2
4465 || i.tm.extension_opcode == 3
4466 || i.tm.extension_opcode == 6))
4467 return 1;
4468
4469 /* vmptrld */
4470 if (i.tm.base_opcode == 0xfc7
4471 && i.tm.opcode_modifier.opcodeprefix == 0
4472 && i.tm.extension_opcode == 6)
4473 return 1;
4474
4475 /* Check for x87 instructions. */
4476 if (i.tm.base_opcode >= 0xd8 && i.tm.base_opcode <= 0xdf)
4477 {
4478 /* Skip fst, fstp, fstenv, fstcw. */
4479 if (i.tm.base_opcode == 0xd9
4480 && (i.tm.extension_opcode == 2
4481 || i.tm.extension_opcode == 3
4482 || i.tm.extension_opcode == 6
4483 || i.tm.extension_opcode == 7))
4484 return 0;
4485
4486 /* Skip fisttp, fist, fistp, fstp. */
4487 if (i.tm.base_opcode == 0xdb
4488 && (i.tm.extension_opcode == 1
4489 || i.tm.extension_opcode == 2
4490 || i.tm.extension_opcode == 3
4491 || i.tm.extension_opcode == 7))
4492 return 0;
4493
4494 /* Skip fisttp, fst, fstp, fsave, fstsw. */
4495 if (i.tm.base_opcode == 0xdd
4496 && (i.tm.extension_opcode == 1
4497 || i.tm.extension_opcode == 2
4498 || i.tm.extension_opcode == 3
4499 || i.tm.extension_opcode == 6
4500 || i.tm.extension_opcode == 7))
4501 return 0;
4502
4503 /* Skip fisttp, fist, fistp, fbstp, fistp. */
4504 if (i.tm.base_opcode == 0xdf
4505 && (i.tm.extension_opcode == 1
4506 || i.tm.extension_opcode == 2
4507 || i.tm.extension_opcode == 3
4508 || i.tm.extension_opcode == 6
4509 || i.tm.extension_opcode == 7))
4510 return 0;
4511
4512 return 1;
4513 }
4514 }
4515
4516 dest = i.operands - 1;
4517
4518 /* Check fake imm8 operand and 3 source operands. */
4519 if ((i.tm.opcode_modifier.immext
4520 || i.tm.opcode_modifier.vexsources == VEX3SOURCES)
4521 && i.types[dest].bitfield.imm8)
4522 dest--;
4523
4524 /* add, or, adc, sbb, and, sub, xor, cmp, test, xchg, xadd */
4525 if (!any_vex_p
4526 && (base_opcode == 0x1
4527 || base_opcode == 0x9
4528 || base_opcode == 0x11
4529 || base_opcode == 0x19
4530 || base_opcode == 0x21
4531 || base_opcode == 0x29
4532 || base_opcode == 0x31
4533 || base_opcode == 0x39
4534 || (i.tm.base_opcode >= 0x84 && i.tm.base_opcode <= 0x87)
4535 || base_opcode == 0xfc1))
4536 return 1;
4537
4538 /* Check for load instruction. */
4539 return (i.types[dest].bitfield.class != ClassNone
4540 || i.types[dest].bitfield.instance == Accum);
4541 }
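/* Examples (illustrative): `movl (%rax), %ebx' falls through to the
   final register-destination check and counts as a load;
   `addl %ebx, (%rax)' is a read-modify-write caught by the explicit
   opcode list above; a plain store like `movl %ebx, (%rax)' returns
   0, so -mlfence-after-load leaves it alone. */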
4542
4543 /* Output lfence (0F AE E8) after instruction. */
4544
4545 static void
4546 insert_lfence_after (void)
4547 {
4548 if (lfence_after_load && load_insn_p ())
4549 {
4550 /* There are also two REP string instructions that require
4551 special treatment. Specifically, the compare string (CMPS)
4552 and scan string (SCAS) instructions set EFLAGS in a manner
4553 that depends on the data being compared/scanned. When used
4554 with a REP prefix, the number of iterations may therefore
4555 vary depending on this data. If the data is a program secret
4556 chosen by the adversary using an LVI method,
4557 then this data-dependent behavior may leak some aspect
4558 of the secret. */
4559 if (((i.tm.base_opcode | 0x1) == 0xa7
4560 || (i.tm.base_opcode | 0x1) == 0xaf)
4561 && i.prefix[REP_PREFIX])
4562 {
4563 as_warn (_("`%s` changes flags which would affect control flow behavior"),
4564 i.tm.name);
4565 }
4566 char *p = frag_more (3);
4567 *p++ = 0xf;
4568 *p++ = 0xae;
4569 *p = 0xe8;
4570 }
4571 }
4572
4573 /* Output lfence (0F AE E8) before instruction. */
4574
4575 static void
4576 insert_lfence_before (void)
4577 {
4578 char *p;
4579
4580 if (is_any_vex_encoding (&i.tm))
4581 return;
4582
4583 if (i.tm.base_opcode == 0xff
4584 && (i.tm.extension_opcode == 2 || i.tm.extension_opcode == 4))
4585 {
4586 /* Insert lfence before indirect branch if needed. */
4587
4588 if (lfence_before_indirect_branch == lfence_branch_none)
4589 return;
4590
4591 if (i.operands != 1)
4592 abort ();
4593
4594 if (i.reg_operands == 1)
4595 {
4596 /* Indirect branch via register. Don't insert lfence with
4597 -mlfence-after-load=yes. */
4598 if (lfence_after_load
4599 || lfence_before_indirect_branch == lfence_branch_memory)
4600 return;
4601 }
4602 else if (i.mem_operands == 1
4603 && lfence_before_indirect_branch != lfence_branch_register)
4604 {
4605 as_warn (_("indirect `%s` with memory operand should be avoided"),
4606 i.tm.name);
4607 return;
4608 }
4609 else
4610 return;
4611
4612 if (last_insn.kind != last_insn_other
4613 && last_insn.seg == now_seg)
4614 {
4615 as_warn_where (last_insn.file, last_insn.line,
4616 _("`%s` skips -mlfence-before-indirect-branch on `%s`"),
4617 last_insn.name, i.tm.name);
4618 return;
4619 }
4620
4621 p = frag_more (3);
4622 *p++ = 0xf;
4623 *p++ = 0xae;
4624 *p = 0xe8;
4625 return;
4626 }
4627
4628 /* Output or/not/shl and lfence before near ret. */
4629 if (lfence_before_ret != lfence_before_ret_none
4630 && (i.tm.base_opcode == 0xc2
4631 || i.tm.base_opcode == 0xc3))
4632 {
4633 if (last_insn.kind != last_insn_other
4634 && last_insn.seg == now_seg)
4635 {
4636 as_warn_where (last_insn.file, last_insn.line,
4637 _("`%s` skips -mlfence-before-ret on `%s`"),
4638 last_insn.name, i.tm.name);
4639 return;
4640 }
4641
4642 /* A near ret ignores the operand size override in 64-bit code. */
4643 char prefix = flag_code == CODE_64BIT
4644 ? 0x48
4645 : i.prefix[DATA_PREFIX] ? 0x66 : 0x0;
4646
4647 if (lfence_before_ret == lfence_before_ret_not)
4648 {
4649 /* not: 0xf71424, may add prefix
4650 for operand size override or 64-bit code. */
4651 p = frag_more ((prefix ? 2 : 0) + 6 + 3);
4652 if (prefix)
4653 *p++ = prefix;
4654 *p++ = 0xf7;
4655 *p++ = 0x14;
4656 *p++ = 0x24;
4657 if (prefix)
4658 *p++ = prefix;
4659 *p++ = 0xf7;
4660 *p++ = 0x14;
4661 *p++ = 0x24;
4662 }
4663 else
4664 {
4665 p = frag_more ((prefix ? 1 : 0) + 4 + 3);
4666 if (prefix)
4667 *p++ = prefix;
4668 if (lfence_before_ret == lfence_before_ret_or)
4669 {
4670 /* or: 0x830c2400, may add prefix
4671 for operand size override or 64-bit code. */
4672 *p++ = 0x83;
4673 *p++ = 0x0c;
4674 }
4675 else
4676 {
4677 /* shl: 0xc1242400, may add prefix
4678 for operand size override or 64-bit code. */
4679 *p++ = 0xc1;
4680 *p++ = 0x24;
4681 }
4682
4683 *p++ = 0x24;
4684 *p++ = 0x0;
4685 }
4686
4687 *p++ = 0xf;
4688 *p++ = 0xae;
4689 *p = 0xe8;
4690 }
4691 }
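/* Sketch of the emitted sequences (illustrative): with
   -mlfence-before-indirect-branch=all, `jmp *%rax' becomes
   0F AE E8 (lfence) followed by FF E0 (jmp *%rax), while the memory
   form `jmp *(%rax)' only draws the warning above. With
   -mlfence-before-ret=or in 64-bit mode, `ret' becomes
   48 83 0C 24 00 (orq $0x0, (%rsp)), 0F AE E8 (lfence), C3 (ret). */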
4692
4693 /* This is the guts of the machine-dependent assembler. LINE points to a
4694 machine dependent instruction. This function is supposed to emit
4695 the frags/bytes it assembles to. */
4696
4697 void
4698 md_assemble (char *line)
4699 {
4700 unsigned int j;
4701 char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4702 const insn_template *t;
4703
4704 /* Initialize globals. */
4705 memset (&i, '\0', sizeof (i));
4706 for (j = 0; j < MAX_OPERANDS; j++)
4707 i.reloc[j] = NO_RELOC;
4708 memset (disp_expressions, '\0', sizeof (disp_expressions));
4709 memset (im_expressions, '\0', sizeof (im_expressions));
4710 save_stack_p = save_stack;
4711
4712 /* First parse an instruction mnemonic & call i386_operand for the operands.
4713 We assume that the scrubber has arranged it so that line[0] is the valid
4714 start of a (possibly prefixed) mnemonic. */
4715
4716 line = parse_insn (line, mnemonic);
4717 if (line == NULL)
4718 return;
4719 mnem_suffix = i.suffix;
4720
4721 line = parse_operands (line, mnemonic);
4722 this_operand = -1;
4723 xfree (i.memop1_string);
4724 i.memop1_string = NULL;
4725 if (line == NULL)
4726 return;
4727
4728 /* Now we've parsed the mnemonic into a set of templates, and have the
4729 operands at hand. */
4730
4731 /* All Intel opcodes have reversed operands except for "bound", "enter",
4732 "monitor*", "mwait*", "tpause", and "umwait". We also don't reverse
4733 intersegment "jmp" and "call" instructions with 2 immediate operands so
4734 that the immediate segment precedes the offset, as it does when in AT&T
4735 mode. */
4736 if (intel_syntax
4737 && i.operands > 1
4738 && (strcmp (mnemonic, "bound") != 0)
4739 && (strcmp (mnemonic, "invlpga") != 0)
4740 && (strncmp (mnemonic, "monitor", 7) != 0)
4741 && (strncmp (mnemonic, "mwait", 5) != 0)
4742 && (strcmp (mnemonic, "tpause") != 0)
4743 && (strcmp (mnemonic, "umwait") != 0)
4744 && !(operand_type_check (i.types[0], imm)
4745 && operand_type_check (i.types[1], imm)))
4746 swap_operands ();
4747
4748 /* The order of the immediates should be reversed for the
4749 2-immediate extrq and insertq instructions. */
4750 if (i.imm_operands == 2
4751 && (strcmp (mnemonic, "extrq") == 0
4752 || strcmp (mnemonic, "insertq") == 0))
4753 swap_2_operands (0, 1);
4754
4755 if (i.imm_operands)
4756 optimize_imm ();
4757
4758 /* Don't optimize displacement for movabs since it only takes 64bit
4759 displacement. */
4760 if (i.disp_operands
4761 && i.disp_encoding != disp_encoding_32bit
4762 && (flag_code != CODE_64BIT
4763 || strcmp (mnemonic, "movabs") != 0))
4764 optimize_disp ();
4765
4766 /* Next, we find a template that matches the given insn,
4767 making sure the overlap of the given operands types is consistent
4768 with the template operand types. */
4769
4770 if (!(t = match_template (mnem_suffix)))
4771 return;
4772
4773 if (sse_check != check_none
4774 && !i.tm.opcode_modifier.noavx
4775 && !i.tm.cpu_flags.bitfield.cpuavx
4776 && !i.tm.cpu_flags.bitfield.cpuavx512f
4777 && (i.tm.cpu_flags.bitfield.cpusse
4778 || i.tm.cpu_flags.bitfield.cpusse2
4779 || i.tm.cpu_flags.bitfield.cpusse3
4780 || i.tm.cpu_flags.bitfield.cpussse3
4781 || i.tm.cpu_flags.bitfield.cpusse4_1
4782 || i.tm.cpu_flags.bitfield.cpusse4_2
4783 || i.tm.cpu_flags.bitfield.cpupclmul
4784 || i.tm.cpu_flags.bitfield.cpuaes
4785 || i.tm.cpu_flags.bitfield.cpusha
4786 || i.tm.cpu_flags.bitfield.cpugfni))
4787 {
4788 (sse_check == check_warning
4789 ? as_warn
4790 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4791 }
4792
4793 if (i.tm.opcode_modifier.fwait)
4794 if (!add_prefix (FWAIT_OPCODE))
4795 return;
4796
4797 /* Check if REP prefix is OK. */
4798 if (i.rep_prefix && i.tm.opcode_modifier.prefixok != PrefixRep)
4799 {
4800 as_bad (_("invalid instruction `%s' after `%s'"),
4801 i.tm.name, i.rep_prefix);
4802 return;
4803 }
4804
4805 /* Check for lock without a lockable instruction. Destination operand
4806 must be memory unless it is xchg (0x86). */
4807 if (i.prefix[LOCK_PREFIX]
4808 && (i.tm.opcode_modifier.prefixok < PrefixLock
4809 || i.mem_operands == 0
4810 || (i.tm.base_opcode != 0x86
4811 && !(i.flags[i.operands - 1] & Operand_Mem))))
4812 {
4813 as_bad (_("expecting lockable instruction after `lock'"));
4814 return;
4815 }
4816
4817 /* Check for data size prefix on VEX/XOP/EVEX encoded and SIMD insns. */
4818 if (i.prefix[DATA_PREFIX]
4819 && (is_any_vex_encoding (&i.tm)
4820 || i.tm.operand_types[i.imm_operands].bitfield.class >= RegMMX
4821 || i.tm.operand_types[i.imm_operands + 1].bitfield.class >= RegMMX))
4822 {
4823 as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4824 return;
4825 }
4826
4827 /* Check if HLE prefix is OK. */
4828 if (i.hle_prefix && !check_hle ())
4829 return;
4830
4831 /* Check BND prefix. */
4832 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4833 as_bad (_("expecting valid branch instruction after `bnd'"));
4834
4835 /* Check NOTRACK prefix. */
4836 if (i.notrack_prefix && i.tm.opcode_modifier.prefixok != PrefixNoTrack)
4837 as_bad (_("expecting indirect branch instruction after `notrack'"));
4838
4839 if (i.tm.cpu_flags.bitfield.cpumpx)
4840 {
4841 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4842 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4843 else if (flag_code != CODE_16BIT
4844 ? i.prefix[ADDR_PREFIX]
4845 : i.mem_operands && !i.prefix[ADDR_PREFIX])
4846 as_bad (_("16-bit address isn't allowed in MPX instructions"));
4847 }
4848
4849 /* Insert BND prefix. */
4850 if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4851 {
4852 if (!i.prefix[BND_PREFIX])
4853 add_prefix (BND_PREFIX_OPCODE);
4854 else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4855 {
4856 as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4857 i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4858 }
4859 }
4860
4861 /* Check string instruction segment overrides. */
4862 if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
4863 {
4864 gas_assert (i.mem_operands);
4865 if (!check_string ())
4866 return;
4867 i.disp_operands = 0;
4868 }
4869
4870 if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4871 optimize_encoding ();
4872
4873 if (!process_suffix ())
4874 return;
4875
4876 /* Update operand types and check extended states. */
4877 for (j = 0; j < i.operands; j++)
4878 {
4879 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4880 switch (i.tm.operand_types[j].bitfield.class)
4881 {
4882 default:
4883 break;
4884 case RegMMX:
4885 i.xstate |= xstate_mmx;
4886 break;
4887 case RegMask:
4888 i.xstate |= xstate_mask;
4889 break;
4890 case RegSIMD:
4891 if (i.tm.operand_types[j].bitfield.tmmword)
4892 i.xstate |= xstate_tmm;
4893 else if (i.tm.operand_types[j].bitfield.zmmword)
4894 i.xstate |= xstate_zmm;
4895 else if (i.tm.operand_types[j].bitfield.ymmword)
4896 i.xstate |= xstate_ymm;
4897 else if (i.tm.operand_types[j].bitfield.xmmword)
4898 i.xstate |= xstate_xmm;
4899 break;
4900 }
4901 }
4902
4903 /* Make still unresolved immediate matches conform to size of immediate
4904 given in i.suffix. */
4905 if (!finalize_imm ())
4906 return;
4907
4908 if (i.types[0].bitfield.imm1)
4909 i.imm_operands = 0; /* kludge for shift insns. */
4910
4911 /* We only need to check those implicit registers for instructions
4912 with 3 operands or less. */
4913 if (i.operands <= 3)
4914 for (j = 0; j < i.operands; j++)
4915 if (i.types[j].bitfield.instance != InstanceNone
4916 && !i.types[j].bitfield.xmmword)
4917 i.reg_operands--;
4918
4919 /* For insns with operands there are more diddles to do to the opcode. */
4920 if (i.operands)
4921 {
4922 if (!process_operands ())
4923 return;
4924 }
4925 else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4926 {
4927 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
4928 as_warn (_("translating to `%sp'"), i.tm.name);
4929 }
4930
4931 if (is_any_vex_encoding (&i.tm))
4932 {
4933 if (!cpu_arch_flags.bitfield.cpui286)
4934 {
4935 as_bad (_("instruction `%s' isn't supported outside of protected mode."),
4936 i.tm.name);
4937 return;
4938 }
4939
4940 /* Check for explicit REX prefix. */
4941 if (i.prefix[REX_PREFIX] || i.rex_encoding)
4942 {
4943 as_bad (_("REX prefix invalid with `%s'"), i.tm.name);
4944 return;
4945 }
4946
4947 if (i.tm.opcode_modifier.vex)
4948 build_vex_prefix (t);
4949 else
4950 build_evex_prefix ();
4951
4952 /* The individual REX.RXBW bits got consumed. */
4953 i.rex &= REX_OPCODE;
4954 }
4955
4956 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
4957 instructions may define INT_OPCODE as well, so avoid this corner
4958 case for those instructions that use MODRM. */
4959 if (i.tm.base_opcode == INT_OPCODE
4960 && !i.tm.opcode_modifier.modrm
4961 && i.op[0].imms->X_add_number == 3)
4962 {
4963 i.tm.base_opcode = INT3_OPCODE;
4964 i.imm_operands = 0;
4965 }
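/* E.g. (illustrative) a plain `int $3' assembles to the single byte
   CC rather than CD 03, matching what debuggers expect for a
   breakpoint. */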
4966
4967 if ((i.tm.opcode_modifier.jump == JUMP
4968 || i.tm.opcode_modifier.jump == JUMP_BYTE
4969 || i.tm.opcode_modifier.jump == JUMP_DWORD)
4970 && i.op[0].disps->X_op == O_constant)
4971 {
4972 /* Convert "jmp constant" (and "call constant") to a jump (call) to
4973 the absolute address given by the constant. Since ix86 jumps and
4974 calls are pc relative, we need to generate a reloc. */
4975 i.op[0].disps->X_add_symbol = &abs_symbol;
4976 i.op[0].disps->X_op = O_symbol;
4977 }
4978
4979 /* For 8 bit registers we need an empty rex prefix. Also if the
4980 instruction already has a prefix, we need to convert old
4981 registers to new ones. */
4982
4983 if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
4984 && (i.op[0].regs->reg_flags & RegRex64) != 0)
4985 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
4986 && (i.op[1].regs->reg_flags & RegRex64) != 0)
4987 || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
4988 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
4989 && i.rex != 0))
4990 {
4991 int x;
4992
4993 i.rex |= REX_OPCODE;
4994 for (x = 0; x < 2; x++)
4995 {
4996 /* Look for 8 bit operand that uses old registers. */
4997 if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
4998 && (i.op[x].regs->reg_flags & RegRex64) == 0)
4999 {
5000 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
5001 /* In case it is "hi" register, give up. */
5002 if (i.op[x].regs->reg_num > 3)
5003 as_bad (_("can't encode register '%s%s' in an "
5004 "instruction requiring REX prefix."),
5005 register_prefix, i.op[x].regs->reg_name);
5006
5007 /* Otherwise it is equivalent to the extended register.
5008 Since the encoding doesn't change this is merely
5009 cosmetic cleanup for debug output. */
5010
5011 i.op[x].regs = i.op[x].regs + 8;
5012 }
5013 }
5014 }
5015
5016 if (i.rex == 0 && i.rex_encoding)
5017 {
5018 /* Check if we can add a REX_OPCODE byte. Look for 8 bit operand
5019 that uses legacy register. If it is "hi" register, don't add
5020 the REX_OPCODE byte. */
5021 int x;
5022 for (x = 0; x < 2; x++)
5023 if (i.types[x].bitfield.class == Reg
5024 && i.types[x].bitfield.byte
5025 && (i.op[x].regs->reg_flags & RegRex64) == 0
5026 && i.op[x].regs->reg_num > 3)
5027 {
5028 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
5029 i.rex_encoding = FALSE;
5030 break;
5031 }
5032
5033 if (i.rex_encoding)
5034 i.rex = REX_OPCODE;
5035 }
5036
5037 if (i.rex != 0)
5038 add_prefix (REX_OPCODE | i.rex);
5039
5040 insert_lfence_before ();
5041
5042 /* We are ready to output the insn. */
5043 output_insn ();
5044
5045 insert_lfence_after ();
5046
5047 last_insn.seg = now_seg;
5048
5049 if (i.tm.opcode_modifier.isprefix)
5050 {
5051 last_insn.kind = last_insn_prefix;
5052 last_insn.name = i.tm.name;
5053 last_insn.file = as_where (&last_insn.line);
5054 }
5055 else
5056 last_insn.kind = last_insn_other;
5057 }
5058
5059 static char *
5060 parse_insn (char *line, char *mnemonic)
5061 {
5062 char *l = line;
5063 char *token_start = l;
5064 char *mnem_p;
5065 int supported;
5066 const insn_template *t;
5067 char *dot_p = NULL;
5068
5069 while (1)
5070 {
5071 mnem_p = mnemonic;
5072 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
5073 {
5074 if (*mnem_p == '.')
5075 dot_p = mnem_p;
5076 mnem_p++;
5077 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
5078 {
5079 as_bad (_("no such instruction: `%s'"), token_start);
5080 return NULL;
5081 }
5082 l++;
5083 }
5084 if (!is_space_char (*l)
5085 && *l != END_OF_INSN
5086 && (intel_syntax
5087 || (*l != PREFIX_SEPARATOR
5088 && *l != ',')))
5089 {
5090 as_bad (_("invalid character %s in mnemonic"),
5091 output_invalid (*l));
5092 return NULL;
5093 }
5094 if (token_start == l)
5095 {
5096 if (!intel_syntax && *l == PREFIX_SEPARATOR)
5097 as_bad (_("expecting prefix; got nothing"));
5098 else
5099 as_bad (_("expecting mnemonic; got nothing"));
5100 return NULL;
5101 }
5102
5103 /* Look up instruction (or prefix) via hash table. */
5104 current_templates = (const templates *) str_hash_find (op_hash, mnemonic);
5105
5106 if (*l != END_OF_INSN
5107 && (!is_space_char (*l) || l[1] != END_OF_INSN)
5108 && current_templates
5109 && current_templates->start->opcode_modifier.isprefix)
5110 {
5111 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
5112 {
5113 as_bad ((flag_code != CODE_64BIT
5114 ? _("`%s' is only supported in 64-bit mode")
5115 : _("`%s' is not supported in 64-bit mode")),
5116 current_templates->start->name);
5117 return NULL;
5118 }
5119 /* If we are in 16-bit mode, do not allow addr16 or data16.
5120 Similarly, in 32-bit mode, do not allow addr32 or data32. */
5121 if ((current_templates->start->opcode_modifier.size == SIZE16
5122 || current_templates->start->opcode_modifier.size == SIZE32)
5123 && flag_code != CODE_64BIT
5124 && ((current_templates->start->opcode_modifier.size == SIZE32)
5125 ^ (flag_code == CODE_16BIT)))
5126 {
5127 as_bad (_("redundant %s prefix"),
5128 current_templates->start->name);
5129 return NULL;
5130 }
5131 if (current_templates->start->opcode_length == 0)
5132 {
5133 /* Handle pseudo prefixes. */
5134 switch (current_templates->start->base_opcode)
5135 {
5136 case Prefix_Disp8:
5137 /* {disp8} */
5138 i.disp_encoding = disp_encoding_8bit;
5139 break;
5140 case Prefix_Disp16:
5141 /* {disp16} */
5142 i.disp_encoding = disp_encoding_16bit;
5143 break;
5144 case Prefix_Disp32:
5145 /* {disp32} */
5146 i.disp_encoding = disp_encoding_32bit;
5147 break;
5148 case Prefix_Load:
5149 /* {load} */
5150 i.dir_encoding = dir_encoding_load;
5151 break;
5152 case Prefix_Store:
5153 /* {store} */
5154 i.dir_encoding = dir_encoding_store;
5155 break;
5156 case Prefix_VEX:
5157 /* {vex} */
5158 i.vec_encoding = vex_encoding_vex;
5159 break;
5160 case Prefix_VEX3:
5161 /* {vex3} */
5162 i.vec_encoding = vex_encoding_vex3;
5163 break;
5164 case Prefix_EVEX:
5165 /* {evex} */
5166 i.vec_encoding = vex_encoding_evex;
5167 break;
5168 case Prefix_REX:
5169 /* {rex} */
5170 i.rex_encoding = TRUE;
5171 break;
5172 case Prefix_NoOptimize:
5173 /* {nooptimize} */
5174 i.no_optimize = TRUE;
5175 break;
5176 default:
5177 abort ();
5178 }
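/* Usage sketch (illustrative): pseudo prefixes are written braced
   before the mnemonic, e.g. `{vex3} vmovaps %xmm1, %xmm2' forces
   the 3-byte VEX form and `{disp32} movl 4(%rax), %ebx' forces a
   32-bit displacement where disp8 would otherwise be picked. */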
5179 }
5180 else
5181 {
5182 /* Add prefix, checking for repeated prefixes. */
5183 switch (add_prefix (current_templates->start->base_opcode))
5184 {
5185 case PREFIX_EXIST:
5186 return NULL;
5187 case PREFIX_DS:
5188 if (current_templates->start->cpu_flags.bitfield.cpuibt)
5189 i.notrack_prefix = current_templates->start->name;
5190 break;
5191 case PREFIX_REP:
5192 if (current_templates->start->cpu_flags.bitfield.cpuhle)
5193 i.hle_prefix = current_templates->start->name;
5194 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
5195 i.bnd_prefix = current_templates->start->name;
5196 else
5197 i.rep_prefix = current_templates->start->name;
5198 break;
5199 default:
5200 break;
5201 }
5202 }
5203 /* Skip past PREFIX_SEPARATOR and reset token_start. */
5204 token_start = ++l;
5205 }
5206 else
5207 break;
5208 }
5209
5210 if (!current_templates)
5211 {
5212 /* Deprecated functionality (new code should use pseudo-prefixes instead):
5213 Check if we should swap operand or force 32bit displacement in
5214 encoding. */
5215 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
5216 i.dir_encoding = dir_encoding_swap;
5217 else if (mnem_p - 3 == dot_p
5218 && dot_p[1] == 'd'
5219 && dot_p[2] == '8')
5220 i.disp_encoding = disp_encoding_8bit;
5221 else if (mnem_p - 4 == dot_p
5222 && dot_p[1] == 'd'
5223 && dot_p[2] == '3'
5224 && dot_p[3] == '2')
5225 i.disp_encoding = disp_encoding_32bit;
5226 else
5227 goto check_suffix;
5228 mnem_p = dot_p;
5229 *dot_p = '\0';
5230 current_templates = (const templates *) str_hash_find (op_hash, mnemonic);
5231 }
5232
5233 if (!current_templates)
5234 {
5235 check_suffix:
5236 if (mnem_p > mnemonic)
5237 {
5238 /* See if we can get a match by trimming off a suffix. */
5239 switch (mnem_p[-1])
5240 {
5241 case WORD_MNEM_SUFFIX:
5242 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
5243 i.suffix = SHORT_MNEM_SUFFIX;
5244 else
5245 /* Fall through. */
5246 case BYTE_MNEM_SUFFIX:
5247 case QWORD_MNEM_SUFFIX:
5248 i.suffix = mnem_p[-1];
5249 mnem_p[-1] = '\0';
5250 current_templates
5251 = (const templates *) str_hash_find (op_hash, mnemonic);
5252 break;
5253 case SHORT_MNEM_SUFFIX:
5254 case LONG_MNEM_SUFFIX:
5255 if (!intel_syntax)
5256 {
5257 i.suffix = mnem_p[-1];
5258 mnem_p[-1] = '\0';
5259 current_templates
5260 = (const templates *) str_hash_find (op_hash, mnemonic);
5261 }
5262 break;
5263
5264 /* Intel Syntax. */
5265 case 'd':
5266 if (intel_syntax)
5267 {
5268 if (intel_float_operand (mnemonic) == 1)
5269 i.suffix = SHORT_MNEM_SUFFIX;
5270 else
5271 i.suffix = LONG_MNEM_SUFFIX;
5272 mnem_p[-1] = '\0';
5273 current_templates
5274 = (const templates *) str_hash_find (op_hash, mnemonic);
5275 }
5276 break;
5277 }
5278 }
5279
5280 if (!current_templates)
5281 {
5282 as_bad (_("no such instruction: `%s'"), token_start);
5283 return NULL;
5284 }
5285 }
5286
5287 if (current_templates->start->opcode_modifier.jump == JUMP
5288 || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
5289 {
5290 /* Check for a branch hint. We allow ",pt" and ",pn" for
5291 predict taken and predict not taken respectively.
5292 I'm not sure that branch hints actually do anything on loop
5293 and jcxz insns (JumpByte) for current Pentium4 chips. They
5294 may work in the future and it doesn't hurt to accept them
5295 now. */
5296 if (l[0] == ',' && l[1] == 'p')
5297 {
5298 if (l[2] == 't')
5299 {
5300 if (!add_prefix (DS_PREFIX_OPCODE))
5301 return NULL;
5302 l += 3;
5303 }
5304 else if (l[2] == 'n')
5305 {
5306 if (!add_prefix (CS_PREFIX_OPCODE))
5307 return NULL;
5308 l += 3;
5309 }
5310 }
5311 }
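/* Example (illustrative): `jne,pt target' gains a DS prefix byte
   (3E, predict taken) and `jne,pn target' a CS prefix byte (2E,
   predict not taken). */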
5312 /* Any other comma loses. */
5313 if (*l == ',')
5314 {
5315 as_bad (_("invalid character %s in mnemonic"),
5316 output_invalid (*l));
5317 return NULL;
5318 }
5319
5320 /* Check if instruction is supported on specified architecture. */
5321 supported = 0;
5322 for (t = current_templates->start; t < current_templates->end; ++t)
5323 {
5324 supported |= cpu_flags_match (t);
5325 if (supported == CPU_FLAGS_PERFECT_MATCH)
5326 {
5327 if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
5328 as_warn (_("use .code16 to ensure correct addressing mode"));
5329
5330 return l;
5331 }
5332 }
5333
5334 if (!(supported & CPU_FLAGS_64BIT_MATCH))
5335 as_bad (flag_code == CODE_64BIT
5336 ? _("`%s' is not supported in 64-bit mode")
5337 : _("`%s' is only supported in 64-bit mode"),
5338 current_templates->start->name);
5339 else
5340 as_bad (_("`%s' is not supported on `%s%s'"),
5341 current_templates->start->name,
5342 cpu_arch_name ? cpu_arch_name : default_arch,
5343 cpu_sub_arch_name ? cpu_sub_arch_name : "");
5344
5345 return NULL;
5346 }
5347
5348 static char *
5349 parse_operands (char *l, const char *mnemonic)
5350 {
5351 char *token_start;
5352
5353 /* 1 if operand is pending after ','. */
5354 unsigned int expecting_operand = 0;
5355
5356 /* Non-zero if operand parens not balanced. */
5357 unsigned int paren_not_balanced;
5358
5359 while (*l != END_OF_INSN)
5360 {
5361 /* Skip optional white space before operand. */
5362 if (is_space_char (*l))
5363 ++l;
5364 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
5365 {
5366 as_bad (_("invalid character %s before operand %d"),
5367 output_invalid (*l),
5368 i.operands + 1);
5369 return NULL;
5370 }
5371 token_start = l; /* After white space. */
5372 paren_not_balanced = 0;
5373 while (paren_not_balanced || *l != ',')
5374 {
5375 if (*l == END_OF_INSN)
5376 {
5377 if (paren_not_balanced)
5378 {
5379 if (!intel_syntax)
5380 as_bad (_("unbalanced parenthesis in operand %d."),
5381 i.operands + 1);
5382 else
5383 as_bad (_("unbalanced brackets in operand %d."),
5384 i.operands + 1);
5385 return NULL;
5386 }
5387 else
5388 break; /* we are done */
5389 }
5390 else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
5391 {
5392 as_bad (_("invalid character %s in operand %d"),
5393 output_invalid (*l),
5394 i.operands + 1);
5395 return NULL;
5396 }
5397 if (!intel_syntax)
5398 {
5399 if (*l == '(')
5400 ++paren_not_balanced;
5401 if (*l == ')')
5402 --paren_not_balanced;
5403 }
5404 else
5405 {
5406 if (*l == '[')
5407 ++paren_not_balanced;
5408 if (*l == ']')
5409 --paren_not_balanced;
5410 }
5411 l++;
5412 }
5413 if (l != token_start)
5414 { /* Yes, we've read in another operand. */
5415 unsigned int operand_ok;
5416 this_operand = i.operands++;
5417 if (i.operands > MAX_OPERANDS)
5418 {
5419 as_bad (_("spurious operands; (%d operands/instruction max)"),
5420 MAX_OPERANDS);
5421 return NULL;
5422 }
5423 i.types[this_operand].bitfield.unspecified = 1;
5424 /* Now parse operand adding info to 'i' as we go along. */
5425 END_STRING_AND_SAVE (l);
5426
5427 if (i.mem_operands > 1)
5428 {
5429 as_bad (_("too many memory references for `%s'"),
5430 mnemonic);
5431 return 0;
5432 }
5433
5434 if (intel_syntax)
5435 operand_ok =
5436 i386_intel_operand (token_start,
5437 intel_float_operand (mnemonic));
5438 else
5439 operand_ok = i386_att_operand (token_start);
5440
5441 RESTORE_END_STRING (l);
5442 if (!operand_ok)
5443 return NULL;
5444 }
5445 else
5446 {
5447 if (expecting_operand)
5448 {
5449 expecting_operand_after_comma:
5450 as_bad (_("expecting operand after ','; got nothing"));
5451 return NULL;
5452 }
5453 if (*l == ',')
5454 {
5455 as_bad (_("expecting operand before ','; got nothing"));
5456 return NULL;
5457 }
5458 }
5459
5460 /* Now *l must be either ',' or END_OF_INSN. */
5461 if (*l == ',')
5462 {
5463 if (*++l == END_OF_INSN)
5464 {
5465 /* The comma was the last thing on the line; complain. */
5466 goto expecting_operand_after_comma;
5467 }
5468 expecting_operand = 1;
5469 }
5470 }
5471 return l;
5472 }
5473
5474 static void
5475 swap_2_operands (int xchg1, int xchg2)
5476 {
5477 union i386_op temp_op;
5478 i386_operand_type temp_type;
5479 unsigned int temp_flags;
5480 enum bfd_reloc_code_real temp_reloc;
5481
5482 temp_type = i.types[xchg2];
5483 i.types[xchg2] = i.types[xchg1];
5484 i.types[xchg1] = temp_type;
5485
5486 temp_flags = i.flags[xchg2];
5487 i.flags[xchg2] = i.flags[xchg1];
5488 i.flags[xchg1] = temp_flags;
5489
5490 temp_op = i.op[xchg2];
5491 i.op[xchg2] = i.op[xchg1];
5492 i.op[xchg1] = temp_op;
5493
5494 temp_reloc = i.reloc[xchg2];
5495 i.reloc[xchg2] = i.reloc[xchg1];
5496 i.reloc[xchg1] = temp_reloc;
5497
5498 if (i.mask)
5499 {
5500 if (i.mask->operand == xchg1)
5501 i.mask->operand = xchg2;
5502 else if (i.mask->operand == xchg2)
5503 i.mask->operand = xchg1;
5504 }
5505 if (i.broadcast)
5506 {
5507 if (i.broadcast->operand == xchg1)
5508 i.broadcast->operand = xchg2;
5509 else if (i.broadcast->operand == xchg2)
5510 i.broadcast->operand = xchg1;
5511 }
5512 if (i.rounding)
5513 {
5514 if (i.rounding->operand == xchg1)
5515 i.rounding->operand = xchg2;
5516 else if (i.rounding->operand == xchg2)
5517 i.rounding->operand = xchg1;
5518 }
5519 }
5520
5521 static void
5522 swap_operands (void)
5523 {
5524 switch (i.operands)
5525 {
5526 case 5:
5527 case 4:
5528 swap_2_operands (1, i.operands - 2);
5529 /* Fall through. */
5530 case 3:
5531 case 2:
5532 swap_2_operands (0, i.operands - 1);
5533 break;
5534 default:
5535 abort ();
5536 }
5537
5538 if (i.mem_operands == 2)
5539 {
5540 const seg_entry *temp_seg;
5541 temp_seg = i.seg[0];
5542 i.seg[0] = i.seg[1];
5543 i.seg[1] = temp_seg;
5544 }
5545 }
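/* Example (illustrative): Intel-syntax `mov eax, ebx' is parsed as
   (eax, ebx) and swapped here to the AT&T-internal source-first
   order (ebx, eax) before template matching. */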
5546
5547 /* Try to ensure constant immediates are represented in the smallest
5548 opcode possible. */
5549 static void
5550 optimize_imm (void)
5551 {
5552 char guess_suffix = 0;
5553 int op;
5554
5555 if (i.suffix)
5556 guess_suffix = i.suffix;
5557 else if (i.reg_operands)
5558 {
5559 /* Figure out a suffix from the last register operand specified.
5560 We can't do this properly yet, i.e. excluding special register
5561 instances, but the following works for instructions with
5562 immediates. In any case, we can't set i.suffix yet. */
5563 for (op = i.operands; --op >= 0;)
5564 if (i.types[op].bitfield.class != Reg)
5565 continue;
5566 else if (i.types[op].bitfield.byte)
5567 {
5568 guess_suffix = BYTE_MNEM_SUFFIX;
5569 break;
5570 }
5571 else if (i.types[op].bitfield.word)
5572 {
5573 guess_suffix = WORD_MNEM_SUFFIX;
5574 break;
5575 }
5576 else if (i.types[op].bitfield.dword)
5577 {
5578 guess_suffix = LONG_MNEM_SUFFIX;
5579 break;
5580 }
5581 else if (i.types[op].bitfield.qword)
5582 {
5583 guess_suffix = QWORD_MNEM_SUFFIX;
5584 break;
5585 }
5586 }
5587 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5588 guess_suffix = WORD_MNEM_SUFFIX;
5589
5590 for (op = i.operands; --op >= 0;)
5591 if (operand_type_check (i.types[op], imm))
5592 {
5593 switch (i.op[op].imms->X_op)
5594 {
5595 case O_constant:
5596 /* If a suffix is given, this operand may be shortened. */
5597 switch (guess_suffix)
5598 {
5599 case LONG_MNEM_SUFFIX:
5600 i.types[op].bitfield.imm32 = 1;
5601 i.types[op].bitfield.imm64 = 1;
5602 break;
5603 case WORD_MNEM_SUFFIX:
5604 i.types[op].bitfield.imm16 = 1;
5605 i.types[op].bitfield.imm32 = 1;
5606 i.types[op].bitfield.imm32s = 1;
5607 i.types[op].bitfield.imm64 = 1;
5608 break;
5609 case BYTE_MNEM_SUFFIX:
5610 i.types[op].bitfield.imm8 = 1;
5611 i.types[op].bitfield.imm8s = 1;
5612 i.types[op].bitfield.imm16 = 1;
5613 i.types[op].bitfield.imm32 = 1;
5614 i.types[op].bitfield.imm32s = 1;
5615 i.types[op].bitfield.imm64 = 1;
5616 break;
5617 }
5618
5619 /* If this operand is at most 16 bits, convert it
5620 to a signed 16 bit number before trying to see
5621 whether it will fit in an even smaller size.
5622 This allows a 16-bit operand such as $0xffe0 to
5623 be recognised as within Imm8S range. */
5624 if ((i.types[op].bitfield.imm16)
5625 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
5626 {
5627 i.op[op].imms->X_add_number =
5628 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5629 }
5630 #ifdef BFD64
5631 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
5632 if ((i.types[op].bitfield.imm32)
5633 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5634 == 0))
5635 {
5636 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5637 ^ ((offsetT) 1 << 31))
5638 - ((offsetT) 1 << 31));
5639 }
5640 #endif
5641 i.types[op]
5642 = operand_type_or (i.types[op],
5643 smallest_imm_type (i.op[op].imms->X_add_number));
5644
5645 /* We must avoid matching of Imm32 templates when 64bit
5646 only immediate is available. */
5647 if (guess_suffix == QWORD_MNEM_SUFFIX)
5648 i.types[op].bitfield.imm32 = 0;
5649 break;
5650
5651 case O_absent:
5652 case O_register:
5653 abort ();
5654
5655 /* Symbols and expressions. */
5656 default:
5657 /* Convert symbolic operand to proper sizes for matching, but don't
5658 prevent matching a set of insns that only supports sizes other
5659 than those matching the insn suffix. */
5660 {
5661 i386_operand_type mask, allowed;
5662 const insn_template *t;
5663
5664 operand_type_set (&mask, 0);
5665 operand_type_set (&allowed, 0);
5666
5667 for (t = current_templates->start;
5668 t < current_templates->end;
5669 ++t)
5670 {
5671 allowed = operand_type_or (allowed, t->operand_types[op]);
5672 allowed = operand_type_and (allowed, anyimm);
5673 }
5674 switch (guess_suffix)
5675 {
5676 case QWORD_MNEM_SUFFIX:
5677 mask.bitfield.imm64 = 1;
5678 mask.bitfield.imm32s = 1;
5679 break;
5680 case LONG_MNEM_SUFFIX:
5681 mask.bitfield.imm32 = 1;
5682 break;
5683 case WORD_MNEM_SUFFIX:
5684 mask.bitfield.imm16 = 1;
5685 break;
5686 case BYTE_MNEM_SUFFIX:
5687 mask.bitfield.imm8 = 1;
5688 break;
5689 default:
5690 break;
5691 }
5692 allowed = operand_type_and (mask, allowed);
5693 if (!operand_type_all_zero (&allowed))
5694 i.types[op] = operand_type_and (i.types[op], mask);
5695 }
5696 break;
5697 }
5698 }
5699 }
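/* Worked example (illustrative): in 16-bit code, the immediate of
   `addw $0xffe0, %bx' is first narrowed to the signed value -32,
   which then matches Imm8S, so the 3-byte 83 C3 E0 encoding is used
   instead of the 4-byte 81 C3 E0 FF one. */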
5700
5701 /* Try to use the smallest displacement type too. */
5702 static void
5703 optimize_disp (void)
5704 {
5705 int op;
5706
5707 for (op = i.operands; --op >= 0;)
5708 if (operand_type_check (i.types[op], disp))
5709 {
5710 if (i.op[op].disps->X_op == O_constant)
5711 {
5712 offsetT op_disp = i.op[op].disps->X_add_number;
5713
5714 if (i.types[op].bitfield.disp16
5715 && (op_disp & ~(offsetT) 0xffff) == 0)
5716 {
5717 /* If this operand is at most 16 bits, convert
5718 to a signed 16 bit number and don't use 64bit
5719 displacement. */
5720 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5721 i.types[op].bitfield.disp64 = 0;
5722 }
5723 #ifdef BFD64
5724 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
5725 if (i.types[op].bitfield.disp32
5726 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5727 {
5728 /* If this operand is at most 32 bits, convert
5729 to a signed 32 bit number and don't use 64bit
5730 displacement. */
5731 op_disp &= (((offsetT) 2 << 31) - 1);
5732 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5733 i.types[op].bitfield.disp64 = 0;
5734 }
5735 #endif
5736 if (!op_disp && i.types[op].bitfield.baseindex)
5737 {
5738 i.types[op].bitfield.disp8 = 0;
5739 i.types[op].bitfield.disp16 = 0;
5740 i.types[op].bitfield.disp32 = 0;
5741 i.types[op].bitfield.disp32s = 0;
5742 i.types[op].bitfield.disp64 = 0;
5743 i.op[op].disps = 0;
5744 i.disp_operands--;
5745 }
5746 else if (flag_code == CODE_64BIT)
5747 {
5748 if (fits_in_signed_long (op_disp))
5749 {
5750 i.types[op].bitfield.disp64 = 0;
5751 i.types[op].bitfield.disp32s = 1;
5752 }
5753 if (i.prefix[ADDR_PREFIX]
5754 && fits_in_unsigned_long (op_disp))
5755 i.types[op].bitfield.disp32 = 1;
5756 }
5757 if ((i.types[op].bitfield.disp32
5758 || i.types[op].bitfield.disp32s
5759 || i.types[op].bitfield.disp16)
5760 && fits_in_disp8 (op_disp))
5761 i.types[op].bitfield.disp8 = 1;
5762 }
5763 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5764 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5765 {
5766 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5767 i.op[op].disps, 0, i.reloc[op]);
5768 i.types[op].bitfield.disp8 = 0;
5769 i.types[op].bitfield.disp16 = 0;
5770 i.types[op].bitfield.disp32 = 0;
5771 i.types[op].bitfield.disp32s = 0;
5772 i.types[op].bitfield.disp64 = 0;
5773 }
5774 else
5775 /* We only support 64bit displacement on constants. */
5776 i.types[op].bitfield.disp64 = 0;
5777 }
5778 }
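/* Worked example (illustrative): `movl 0(%eax), %ebx' drops the
   zero displacement entirely (8B 18, mod=00), and `movl 64(%eax),
   %ebx' keeps a disp8 (8B 58 40) rather than the disp32 form. */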
5779
5780 /* Return 1 if there is a match in broadcast bytes between operand
5781 GIVEN and instruction template T. */
5782
5783 static INLINE int
5784 match_broadcast_size (const insn_template *t, unsigned int given)
5785 {
5786 return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5787 && i.types[given].bitfield.byte)
5788 || (t->opcode_modifier.broadcast == WORD_BROADCAST
5789 && i.types[given].bitfield.word)
5790 || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5791 && i.types[given].bitfield.dword)
5792 || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5793 && i.types[given].bitfield.qword));
5794 }
5795
5796 /* Check if operands are valid for the instruction. */
5797
5798 static int
5799 check_VecOperands (const insn_template *t)
5800 {
5801 unsigned int op;
5802 i386_cpu_flags cpu;
5803
5804 /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5805 any one operand are implicity requiring AVX512VL support if the actual
5806 operand size is YMMword or XMMword. Since this function runs after
5807 template matching, there's no need to check for YMMword/XMMword in
5808 the template. */
5809 cpu = cpu_flags_and (t->cpu_flags, avx512);
5810 if (!cpu_flags_all_zero (&cpu)
5811 && !t->cpu_flags.bitfield.cpuavx512vl
5812 && !cpu_arch_flags.bitfield.cpuavx512vl)
5813 {
5814 for (op = 0; op < t->operands; ++op)
5815 {
5816 if (t->operand_types[op].bitfield.zmmword
5817 && (i.types[op].bitfield.ymmword
5818 || i.types[op].bitfield.xmmword))
5819 {
5820 i.error = unsupported;
5821 return 1;
5822 }
5823 }
5824 }
5825
5826 /* Without VSIB byte, we can't have a vector register for index. */
5827 if (!t->opcode_modifier.sib
5828 && i.index_reg
5829 && (i.index_reg->reg_type.bitfield.xmmword
5830 || i.index_reg->reg_type.bitfield.ymmword
5831 || i.index_reg->reg_type.bitfield.zmmword))
5832 {
5833 i.error = unsupported_vector_index_register;
5834 return 1;
5835 }
5836
5837 /* Check if default mask is allowed. */
5838 if (t->opcode_modifier.nodefmask
5839 && (!i.mask || i.mask->mask->reg_num == 0))
5840 {
5841 i.error = no_default_mask;
5842 return 1;
5843 }
5844
5845 /* For VSIB byte, we need a vector register for index, and all vector
5846 registers must be distinct. */
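/* E.g. a VECSIB128 gather such as VEX-encoded vgatherdps takes an
   %xmm index register; the checks below also diagnose mask, index,
   and destination registers that are not pairwise distinct.  */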
5847 if (t->opcode_modifier.sib && t->opcode_modifier.sib != SIBMEM)
5848 {
5849 if (!i.index_reg
5850 || !((t->opcode_modifier.sib == VECSIB128
5851 && i.index_reg->reg_type.bitfield.xmmword)
5852 || (t->opcode_modifier.sib == VECSIB256
5853 && i.index_reg->reg_type.bitfield.ymmword)
5854 || (t->opcode_modifier.sib == VECSIB512
5855 && i.index_reg->reg_type.bitfield.zmmword)))
5856 {
5857 i.error = invalid_vsib_address;
5858 return 1;
5859 }
5860
5861 gas_assert (i.reg_operands == 2 || i.mask);
5862 if (i.reg_operands == 2 && !i.mask)
5863 {
5864 gas_assert (i.types[0].bitfield.class == RegSIMD);
5865 gas_assert (i.types[0].bitfield.xmmword
5866 || i.types[0].bitfield.ymmword);
5867 gas_assert (i.types[2].bitfield.class == RegSIMD);
5868 gas_assert (i.types[2].bitfield.xmmword
5869 || i.types[2].bitfield.ymmword);
5870 if (operand_check == check_none)
5871 return 0;
5872 if (register_number (i.op[0].regs)
5873 != register_number (i.index_reg)
5874 && register_number (i.op[2].regs)
5875 != register_number (i.index_reg)
5876 && register_number (i.op[0].regs)
5877 != register_number (i.op[2].regs))
5878 return 0;
5879 if (operand_check == check_error)
5880 {
5881 i.error = invalid_vector_register_set;
5882 return 1;
5883 }
5884 as_warn (_("mask, index, and destination registers should be distinct"));
5885 }
5886 else if (i.reg_operands == 1 && i.mask)
5887 {
5888 if (i.types[1].bitfield.class == RegSIMD
5889 && (i.types[1].bitfield.xmmword
5890 || i.types[1].bitfield.ymmword
5891 || i.types[1].bitfield.zmmword)
5892 && (register_number (i.op[1].regs)
5893 == register_number (i.index_reg)))
5894 {
5895 if (operand_check == check_error)
5896 {
5897 i.error = invalid_vector_register_set;
5898 return 1;
5899 }
5900 if (operand_check != check_none)
5901 as_warn (_("index and destination registers should be distinct"));
5902 }
5903 }
5904 }
5905
5906 /* For AMX instructions with three tmmword operands, all tmmword
5907 operands must be distinct.  */
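/* E.g. AMX-INT8's "tdpbssd %tmm1, %tmm2, %tmm3" is accepted here,
   while "tdpbssd %tmm1, %tmm2, %tmm2" is rejected with
   invalid_tmm_register_set.  */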
5908 if (t->operand_types[0].bitfield.tmmword
5909 && i.reg_operands == 3)
5910 {
5911 if (register_number (i.op[0].regs)
5912 == register_number (i.op[1].regs)
5913 || register_number (i.op[0].regs)
5914 == register_number (i.op[2].regs)
5915 || register_number (i.op[1].regs)
5916 == register_number (i.op[2].regs))
5917 {
5918 i.error = invalid_tmm_register_set;
5919 return 1;
5920 }
5921 }
5922
5923 /* Check if broadcast is supported by the instruction and is applied
5924 to the memory operand. */
5925 if (i.broadcast)
5926 {
5927 i386_operand_type type, overlap;
5928
5929 /* Check if specified broadcast is supported in this instruction,
5930 and that its broadcast bytes match the memory operand. */
5931 op = i.broadcast->operand;
5932 if (!t->opcode_modifier.broadcast
5933 || !(i.flags[op] & Operand_Mem)
5934 || (!i.types[op].bitfield.unspecified
5935 && !match_broadcast_size (t, op)))
5936 {
5937 bad_broadcast:
5938 i.error = unsupported_broadcast;
5939 return 1;
5940 }
5941
5942 i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5943 * i.broadcast->type);
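/* E.g. for a dword-element broadcast ({1to16} on a 512-bit insn):
   1 << (DWORD_BROADCAST - 1) is 4 bytes per element, and a broadcast
   type of 16 elements then yields 64 bytes, which the switch below
   classifies as zmmword.  */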
5944 operand_type_set (&type, 0);
5945 switch (i.broadcast->bytes)
5946 {
5947 case 2:
5948 type.bitfield.word = 1;
5949 break;
5950 case 4:
5951 type.bitfield.dword = 1;
5952 break;
5953 case 8:
5954 type.bitfield.qword = 1;
5955 break;
5956 case 16:
5957 type.bitfield.xmmword = 1;
5958 break;
5959 case 32:
5960 type.bitfield.ymmword = 1;
5961 break;
5962 case 64:
5963 type.bitfield.zmmword = 1;
5964 break;
5965 default:
5966 goto bad_broadcast;
5967 }
5968
5969 overlap = operand_type_and (type, t->operand_types[op]);
5970 if (t->operand_types[op].bitfield.class == RegSIMD
5971 && t->operand_types[op].bitfield.byte
5972 + t->operand_types[op].bitfield.word
5973 + t->operand_types[op].bitfield.dword
5974 + t->operand_types[op].bitfield.qword > 1)
5975 {
5976 overlap.bitfield.xmmword = 0;
5977 overlap.bitfield.ymmword = 0;
5978 overlap.bitfield.zmmword = 0;
5979 }
5980 if (operand_type_all_zero (&overlap))
5981 goto bad_broadcast;
5982
5983 if (t->opcode_modifier.checkregsize)
5984 {
5985 unsigned int j;
5986
5987 type.bitfield.baseindex = 1;
5988 for (j = 0; j < i.operands; ++j)
5989 {
5990 if (j != op
5991 && !operand_type_register_match(i.types[j],
5992 t->operand_types[j],
5993 type,
5994 t->operand_types[op]))
5995 goto bad_broadcast;
5996 }
5997 }
5998 }
5999 /* If the instruction supports broadcast, we need to check that an
6000 operand of one-element size isn't specified without broadcast. */
6001 else if (t->opcode_modifier.broadcast && i.mem_operands)
6002 {
6003 /* Find memory operand. */
6004 for (op = 0; op < i.operands; op++)
6005 if (i.flags[op] & Operand_Mem)
6006 break;
6007 gas_assert (op < i.operands);
6008 /* Check size of the memory operand. */
6009 if (match_broadcast_size (t, op))
6010 {
6011 i.error = broadcast_needed;
6012 return 1;
6013 }
6014 }
6015 else
6016 op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning. */
6017
6018 /* Check if requested masking is supported. */
6019 if (i.mask)
6020 {
6021 switch (t->opcode_modifier.masking)
6022 {
6023 case BOTH_MASKING:
6024 break;
6025 case MERGING_MASKING:
6026 if (i.mask->zeroing)
6027 {
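/* NB: the "case 0:" label below is entered directly from the switch
   header when the template supports no masking at all, sharing this
   error path with zeroing-masking used on a merging-only template.  */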
6028 case 0:
6029 i.error = unsupported_masking;
6030 return 1;
6031 }
6032 break;
6033 case DYNAMIC_MASKING:
6034 /* Memory destinations allow only merging masking. */
6035 if (i.mask->zeroing && i.mem_operands)
6036 {
6037 /* Find memory operand. */
6038 for (op = 0; op < i.operands; op++)
6039 if (i.flags[op] & Operand_Mem)
6040 break;
6041 gas_assert (op < i.operands);
6042 if (op == i.operands - 1)
6043 {
6044 i.error = unsupported_masking;
6045 return 1;
6046 }
6047 }
6048 break;
6049 default:
6050 abort ();
6051 }
6052 }
6053
6054 /* Check if masking is applied to dest operand. */
6055 if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
6056 {
6057 i.error = mask_not_on_destination;
6058 return 1;
6059 }
6060
6061 /* Check RC/SAE. */
6062 if (i.rounding)
6063 {
6064 if (!t->opcode_modifier.sae
6065 || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
6066 {
6067 i.error = unsupported_rc_sae;
6068 return 1;
6069 }
6070 /* If the instruction has several immediate operands and one of
6071 them is rounding, the rounding operand should be the last
6072 immediate operand. */
6073 if (i.imm_operands > 1
6074 && i.rounding->operand != (int) (i.imm_operands - 1))
6075 {
6076 i.error = rc_sae_operand_not_last_imm;
6077 return 1;
6078 }
6079 }
6080
6081 /* Check the special Imm4 cases; must be the first operand. */
6082 if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
6083 {
6084 if (i.op[0].imms->X_op != O_constant
6085 || !fits_in_imm4 (i.op[0].imms->X_add_number))
6086 {
6087 i.error = bad_imm4;
6088 return 1;
6089 }
6090
6091 /* Turn off Imm<N> so that update_imm won't complain. */
6092 operand_type_set (&i.types[0], 0);
6093 }
6094
6095 /* Check vector Disp8 operand. */
6096 if (t->opcode_modifier.disp8memshift
6097 && i.disp_encoding != disp_encoding_32bit)
6098 {
6099 if (i.broadcast)
6100 i.memshift = t->opcode_modifier.broadcast - 1;
6101 else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
6102 i.memshift = t->opcode_modifier.disp8memshift;
6103 else
6104 {
6105 const i386_operand_type *type = NULL;
6106
6107 i.memshift = 0;
6108 for (op = 0; op < i.operands; op++)
6109 if (i.flags[op] & Operand_Mem)
6110 {
6111 if (t->opcode_modifier.evex == EVEXLIG)
6112 i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
6113 else if (t->operand_types[op].bitfield.xmmword
6114 + t->operand_types[op].bitfield.ymmword
6115 + t->operand_types[op].bitfield.zmmword <= 1)
6116 type = &t->operand_types[op];
6117 else if (!i.types[op].bitfield.unspecified)
6118 type = &i.types[op];
6119 }
6120 else if (i.types[op].bitfield.class == RegSIMD
6121 && t->opcode_modifier.evex != EVEXLIG)
6122 {
6123 if (i.types[op].bitfield.zmmword)
6124 i.memshift = 6;
6125 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
6126 i.memshift = 5;
6127 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
6128 i.memshift = 4;
6129 }
6130
6131 if (type)
6132 {
6133 if (type->bitfield.zmmword)
6134 i.memshift = 6;
6135 else if (type->bitfield.ymmword)
6136 i.memshift = 5;
6137 else if (type->bitfield.xmmword)
6138 i.memshift = 4;
6139 }
6140
6141 /* For the check in fits_in_disp8(). */
6142 if (i.memshift == 0)
6143 i.memshift = -1;
6144 }
6145
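/* E.g. with i.memshift == 6 (a zmmword memory operand), a displacement
   of 0x100 compresses to 0x100 >> 6 == 4, which fits in a signed byte,
   so the EVEX compressed disp8 form is usable.  */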
6146 for (op = 0; op < i.operands; op++)
6147 if (operand_type_check (i.types[op], disp)
6148 && i.op[op].disps->X_op == O_constant)
6149 {
6150 if (fits_in_disp8 (i.op[op].disps->X_add_number))
6151 {
6152 i.types[op].bitfield.disp8 = 1;
6153 return 0;
6154 }
6155 i.types[op].bitfield.disp8 = 0;
6156 }
6157 }
6158
6159 i.memshift = 0;
6160
6161 return 0;
6162 }
6163
6164 /* Check if encoding requirements are met by the instruction. */
6165
6166 static int
6167 VEX_check_encoding (const insn_template *t)
6168 {
6169 if (i.vec_encoding == vex_encoding_error)
6170 {
6171 i.error = unsupported;
6172 return 1;
6173 }
6174
6175 if (i.vec_encoding == vex_encoding_evex)
6176 {
6177 /* This instruction must be encoded with EVEX prefix. */
6178 if (!is_evex_encoding (t))
6179 {
6180 i.error = unsupported;
6181 return 1;
6182 }
6183 return 0;
6184 }
6185
6186 if (!t->opcode_modifier.vex)
6187 {
6188 /* This instruction template doesn't have VEX prefix. */
6189 if (i.vec_encoding != vex_encoding_default)
6190 {
6191 i.error = unsupported;
6192 return 1;
6193 }
6194 return 0;
6195 }
6196
6197 return 0;
6198 }
6199
6200 static const insn_template *
6201 match_template (char mnem_suffix)
6202 {
6203 /* Points to template once we've found it. */
6204 const insn_template *t;
6205 i386_operand_type overlap0, overlap1, overlap2, overlap3;
6206 i386_operand_type overlap4;
6207 unsigned int found_reverse_match;
6208 i386_opcode_modifier suffix_check;
6209 i386_operand_type operand_types [MAX_OPERANDS];
6210 int addr_prefix_disp;
6211 unsigned int j, size_match, check_register;
6212 enum i386_error specific_error = 0;
6213
6214 #if MAX_OPERANDS != 5
6215 # error "MAX_OPERANDS must be 5."
6216 #endif
6217
6218 found_reverse_match = 0;
6219 addr_prefix_disp = -1;
6220
6221 /* Prepare for mnemonic suffix check. */
6222 memset (&suffix_check, 0, sizeof (suffix_check));
6223 switch (mnem_suffix)
6224 {
6225 case BYTE_MNEM_SUFFIX:
6226 suffix_check.no_bsuf = 1;
6227 break;
6228 case WORD_MNEM_SUFFIX:
6229 suffix_check.no_wsuf = 1;
6230 break;
6231 case SHORT_MNEM_SUFFIX:
6232 suffix_check.no_ssuf = 1;
6233 break;
6234 case LONG_MNEM_SUFFIX:
6235 suffix_check.no_lsuf = 1;
6236 break;
6237 case QWORD_MNEM_SUFFIX:
6238 suffix_check.no_qsuf = 1;
6239 break;
6240 default:
6241 /* NB: In Intel syntax, normally we can check for memory operand
6242 size when there is no mnemonic suffix. But jmp and call have
6243 2 different encodings with Dword memory operand size, one with
6244 No_ldSuf and the other without. i.suffix is set to
6245 LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf. */
6246 if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
6247 suffix_check.no_ldsuf = 1;
6248 }
6249
6250 /* Must have right number of operands. */
6251 i.error = number_of_operands_mismatch;
6252
6253 for (t = current_templates->start; t < current_templates->end; t++)
6254 {
6255 addr_prefix_disp = -1;
6256 found_reverse_match = 0;
6257
6258 if (i.operands != t->operands)
6259 continue;
6260
6261 /* Check processor support. */
6262 i.error = unsupported;
6263 if (cpu_flags_match (t) != CPU_FLAGS_PERFECT_MATCH)
6264 continue;
6265
6266 /* Check Pseudo Prefix. */
6267 i.error = unsupported;
6268 if (t->opcode_modifier.pseudovexprefix
6269 && !(i.vec_encoding == vex_encoding_vex
6270 || i.vec_encoding == vex_encoding_vex3))
6271 continue;
6272
6273 /* Check AT&T mnemonic. */
6274 i.error = unsupported_with_intel_mnemonic;
6275 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
6276 continue;
6277
6278 /* Check AT&T/Intel syntax. */
6279 i.error = unsupported_syntax;
6280 if ((intel_syntax && t->opcode_modifier.attsyntax)
6281 || (!intel_syntax && t->opcode_modifier.intelsyntax))
6282 continue;
6283
6284 /* Check Intel64/AMD64 ISA. */
6285 switch (isa64)
6286 {
6287 default:
6288 /* Default: Don't accept Intel64. */
6289 if (t->opcode_modifier.isa64 == INTEL64)
6290 continue;
6291 break;
6292 case amd64:
6293 /* -mamd64: Don't accept Intel64 and Intel64 only. */
6294 if (t->opcode_modifier.isa64 >= INTEL64)
6295 continue;
6296 break;
6297 case intel64:
6298 /* -mintel64: Don't accept AMD64. */
6299 if (t->opcode_modifier.isa64 == AMD64 && flag_code == CODE_64BIT)
6300 continue;
6301 break;
6302 }
6303
6304 /* Check the suffix. */
6305 i.error = invalid_instruction_suffix;
6306 if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
6307 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
6308 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
6309 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
6310 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
6311 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
6312 continue;
6313
6314 size_match = operand_size_match (t);
6315 if (!size_match)
6316 continue;
6317
6318 /* This is intentionally not
6319
6320 if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
6321
6322 as the case of a missing * on the operand is accepted (perhaps with
6323 a warning, issued further down). */
6324 if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
6325 {
6326 i.error = operand_type_mismatch;
6327 continue;
6328 }
6329
6330 for (j = 0; j < MAX_OPERANDS; j++)
6331 operand_types[j] = t->operand_types[j];
6332
6333 /* In general, don't allow
6334 - 64-bit operands outside of 64-bit mode,
6335 - 32-bit operands on pre-386. */
6336 j = i.imm_operands + (t->operands > i.imm_operands + 1);
6337 if (((i.suffix == QWORD_MNEM_SUFFIX
6338 && flag_code != CODE_64BIT
6339 && !(t->base_opcode == 0xfc7
6340 && i.tm.opcode_modifier.opcodeprefix == 0
6341 && t->extension_opcode == 1) /* cmpxchg8b */)
6342 || (i.suffix == LONG_MNEM_SUFFIX
6343 && !cpu_arch_flags.bitfield.cpui386))
6344 && (intel_syntax
6345 ? (t->opcode_modifier.mnemonicsize != IGNORESIZE
6346 && !intel_float_operand (t->name))
6347 : intel_float_operand (t->name) != 2)
6348 && (t->operands == i.imm_operands
6349 || (operand_types[i.imm_operands].bitfield.class != RegMMX
6350 && operand_types[i.imm_operands].bitfield.class != RegSIMD
6351 && operand_types[i.imm_operands].bitfield.class != RegMask)
6352 || (operand_types[j].bitfield.class != RegMMX
6353 && operand_types[j].bitfield.class != RegSIMD
6354 && operand_types[j].bitfield.class != RegMask))
6355 && !t->opcode_modifier.sib)
6356 continue;
6357
6358 /* Do not verify operands when there are none. */
6359 if (!t->operands)
6360 {
6361 if (VEX_check_encoding (t))
6362 {
6363 specific_error = i.error;
6364 continue;
6365 }
6366
6367 /* We've found a match; break out of loop. */
6368 break;
6369 }
6370
6371 if (!t->opcode_modifier.jump
6372 || t->opcode_modifier.jump == JUMP_ABSOLUTE)
6373 {
6374 /* There should be only one Disp operand. */
6375 for (j = 0; j < MAX_OPERANDS; j++)
6376 if (operand_type_check (operand_types[j], disp))
6377 break;
6378 if (j < MAX_OPERANDS)
6379 {
6380 bfd_boolean override = (i.prefix[ADDR_PREFIX] != 0);
6381
6382 addr_prefix_disp = j;
6383
6384 /* Address size prefix will turn Disp64/Disp32S/Disp32/Disp16
6385 operand into Disp32/Disp32/Disp16/Disp32 operand. */
6386 switch (flag_code)
6387 {
6388 case CODE_16BIT:
6389 override = !override;
6390 /* Fall through. */
6391 case CODE_32BIT:
6392 if (operand_types[j].bitfield.disp32
6393 && operand_types[j].bitfield.disp16)
6394 {
6395 operand_types[j].bitfield.disp16 = override;
6396 operand_types[j].bitfield.disp32 = !override;
6397 }
6398 operand_types[j].bitfield.disp32s = 0;
6399 operand_types[j].bitfield.disp64 = 0;
6400 break;
6401
6402 case CODE_64BIT:
6403 if (operand_types[j].bitfield.disp32s
6404 || operand_types[j].bitfield.disp64)
6405 {
6406 operand_types[j].bitfield.disp64 &= !override;
6407 operand_types[j].bitfield.disp32s &= !override;
6408 operand_types[j].bitfield.disp32 = override;
6409 }
6410 operand_types[j].bitfield.disp16 = 0;
6411 break;
6412 }
6413 }
6414 }
6415
6416 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
6417 if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
6418 continue;
6419
6420 /* We check register size if needed. */
6421 if (t->opcode_modifier.checkregsize)
6422 {
6423 check_register = (1 << t->operands) - 1;
6424 if (i.broadcast)
6425 check_register &= ~(1 << i.broadcast->operand);
6426 }
6427 else
6428 check_register = 0;
6429
6430 overlap0 = operand_type_and (i.types[0], operand_types[0]);
6431 switch (t->operands)
6432 {
6433 case 1:
6434 if (!operand_type_match (overlap0, i.types[0]))
6435 continue;
6436 break;
6437 case 2:
6438 /* xchg %eax, %eax is a special case. It is an alias for nop
6439 only in 32bit mode and we can use opcode 0x90. In 64bit
6440 mode, we can't use 0x90 for xchg %eax, %eax since it should
6441 zero-extend %eax to %rax. */
6442 if (flag_code == CODE_64BIT
6443 && t->base_opcode == 0x90
6444 && i.types[0].bitfield.instance == Accum
6445 && i.types[0].bitfield.dword
6446 && i.types[1].bitfield.instance == Accum
6447 && i.types[1].bitfield.dword)
6448 continue;
6449 /* xrelease mov %eax, <disp> is another special case. It must not
6450 match the accumulator-only encoding of mov. */
6451 if (flag_code != CODE_64BIT
6452 && i.hle_prefix
6453 && t->base_opcode == 0xa0
6454 && i.types[0].bitfield.instance == Accum
6455 && (i.flags[1] & Operand_Mem))
6456 continue;
6457 /* Fall through. */
6458
6459 case 3:
6460 if (!(size_match & MATCH_STRAIGHT))
6461 goto check_reverse;
6462 /* Reverse direction of operands if swapping is possible in the first
6463 place (operands need to be symmetric) and
6464 - the load form is requested, and the template is a store form,
6465 - the store form is requested, and the template is a load form,
6466 - the non-default (swapped) form is requested. */
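/* E.g. register-to-register "mov" has a store form (opcode 0x89) and
   a load form (0x8b) differing only in the direction bit; the "{load}"
   and "{store}" pseudo prefixes select between them via i.dir_encoding
   here.  */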
6467 overlap1 = operand_type_and (operand_types[0], operand_types[1]);
6468 if (t->opcode_modifier.d && i.reg_operands == i.operands
6469 && !operand_type_all_zero (&overlap1))
6470 switch (i.dir_encoding)
6471 {
6472 case dir_encoding_load:
6473 if (operand_type_check (operand_types[i.operands - 1], anymem)
6474 || t->opcode_modifier.regmem)
6475 goto check_reverse;
6476 break;
6477
6478 case dir_encoding_store:
6479 if (!operand_type_check (operand_types[i.operands - 1], anymem)
6480 && !t->opcode_modifier.regmem)
6481 goto check_reverse;
6482 break;
6483
6484 case dir_encoding_swap:
6485 goto check_reverse;
6486
6487 case dir_encoding_default:
6488 break;
6489 }
6490 /* If we want store form, we skip the current load. */
6491 if ((i.dir_encoding == dir_encoding_store
6492 || i.dir_encoding == dir_encoding_swap)
6493 && i.mem_operands == 0
6494 && t->opcode_modifier.load)
6495 continue;
6496 /* Fall through. */
6497 case 4:
6498 case 5:
6499 overlap1 = operand_type_and (i.types[1], operand_types[1]);
6500 if (!operand_type_match (overlap0, i.types[0])
6501 || !operand_type_match (overlap1, i.types[1])
6502 || ((check_register & 3) == 3
6503 && !operand_type_register_match (i.types[0],
6504 operand_types[0],
6505 i.types[1],
6506 operand_types[1])))
6507 {
6508 /* Check if other direction is valid ... */
6509 if (!t->opcode_modifier.d)
6510 continue;
6511
6512 check_reverse:
6513 if (!(size_match & MATCH_REVERSE))
6514 continue;
6515 /* Try reversing direction of operands. */
6516 overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
6517 overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
6518 if (!operand_type_match (overlap0, i.types[0])
6519 || !operand_type_match (overlap1, i.types[i.operands - 1])
6520 || (check_register
6521 && !operand_type_register_match (i.types[0],
6522 operand_types[i.operands - 1],
6523 i.types[i.operands - 1],
6524 operand_types[0])))
6525 {
6526 /* Does not match either direction. */
6527 continue;
6528 }
6529 /* found_reverse_match holds which of D or FloatR
6530 we've found. */
6531 if (!t->opcode_modifier.d)
6532 found_reverse_match = 0;
6533 else if (operand_types[0].bitfield.tbyte)
6534 found_reverse_match = Opcode_FloatD;
6535 else if (operand_types[0].bitfield.xmmword
6536 || operand_types[i.operands - 1].bitfield.xmmword
6537 || operand_types[0].bitfield.class == RegMMX
6538 || operand_types[i.operands - 1].bitfield.class == RegMMX
6539 || is_any_vex_encoding(t))
6540 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
6541 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
6542 else
6543 found_reverse_match = Opcode_D;
6544 if (t->opcode_modifier.floatr)
6545 found_reverse_match |= Opcode_FloatR;
6546 }
6547 else
6548 {
6549 /* Found a forward 2 operand match here. */
6550 switch (t->operands)
6551 {
6552 case 5:
6553 overlap4 = operand_type_and (i.types[4],
6554 operand_types[4]);
6555 /* Fall through. */
6556 case 4:
6557 overlap3 = operand_type_and (i.types[3],
6558 operand_types[3]);
6559 /* Fall through. */
6560 case 3:
6561 overlap2 = operand_type_and (i.types[2],
6562 operand_types[2]);
6563 break;
6564 }
6565
6566 switch (t->operands)
6567 {
6568 case 5:
6569 if (!operand_type_match (overlap4, i.types[4])
6570 || !operand_type_register_match (i.types[3],
6571 operand_types[3],
6572 i.types[4],
6573 operand_types[4]))
6574 continue;
6575 /* Fall through. */
6576 case 4:
6577 if (!operand_type_match (overlap3, i.types[3])
6578 || ((check_register & 0xa) == 0xa
6579 && !operand_type_register_match (i.types[1],
6580 operand_types[1],
6581 i.types[3],
6582 operand_types[3]))
6583 || ((check_register & 0xc) == 0xc
6584 && !operand_type_register_match (i.types[2],
6585 operand_types[2],
6586 i.types[3],
6587 operand_types[3])))
6588 continue;
6589 /* Fall through. */
6590 case 3:
6591 /* Here we make use of the fact that there are no
6592 reverse-match 3-operand instructions. */
6593 if (!operand_type_match (overlap2, i.types[2])
6594 || ((check_register & 5) == 5
6595 && !operand_type_register_match (i.types[0],
6596 operand_types[0],
6597 i.types[2],
6598 operand_types[2]))
6599 || ((check_register & 6) == 6
6600 && !operand_type_register_match (i.types[1],
6601 operand_types[1],
6602 i.types[2],
6603 operand_types[2])))
6604 continue;
6605 break;
6606 }
6607 }
6608 /* Found either forward/reverse 2, 3 or 4 operand match here:
6609 slip through to break. */
6610 }
6611
6612 /* Check if vector operands are valid. */
6613 if (check_VecOperands (t))
6614 {
6615 specific_error = i.error;
6616 continue;
6617 }
6618
6619 /* Check if VEX/EVEX encoding requirements can be satisfied. */
6620 if (VEX_check_encoding (t))
6621 {
6622 specific_error = i.error;
6623 continue;
6624 }
6625
6626 /* We've found a match; break out of loop. */
6627 break;
6628 }
6629
6630 if (t == current_templates->end)
6631 {
6632 /* We found no match. */
6633 const char *err_msg;
6634 switch (specific_error ? specific_error : i.error)
6635 {
6636 default:
6637 abort ();
6638 case operand_size_mismatch:
6639 err_msg = _("operand size mismatch");
6640 break;
6641 case operand_type_mismatch:
6642 err_msg = _("operand type mismatch");
6643 break;
6644 case register_type_mismatch:
6645 err_msg = _("register type mismatch");
6646 break;
6647 case number_of_operands_mismatch:
6648 err_msg = _("number of operands mismatch");
6649 break;
6650 case invalid_instruction_suffix:
6651 err_msg = _("invalid instruction suffix");
6652 break;
6653 case bad_imm4:
6654 err_msg = _("constant doesn't fit in 4 bits");
6655 break;
6656 case unsupported_with_intel_mnemonic:
6657 err_msg = _("unsupported with Intel mnemonic");
6658 break;
6659 case unsupported_syntax:
6660 err_msg = _("unsupported syntax");
6661 break;
6662 case unsupported:
6663 as_bad (_("unsupported instruction `%s'"),
6664 current_templates->start->name);
6665 return NULL;
6666 case invalid_sib_address:
6667 err_msg = _("invalid SIB address");
6668 break;
6669 case invalid_vsib_address:
6670 err_msg = _("invalid VSIB address");
6671 break;
6672 case invalid_vector_register_set:
6673 err_msg = _("mask, index, and destination registers must be distinct");
6674 break;
6675 case invalid_tmm_register_set:
6676 err_msg = _("all tmm registers must be distinct");
6677 break;
6678 case unsupported_vector_index_register:
6679 err_msg = _("unsupported vector index register");
6680 break;
6681 case unsupported_broadcast:
6682 err_msg = _("unsupported broadcast");
6683 break;
6684 case broadcast_needed:
6685 err_msg = _("broadcast is needed for operand of such type");
6686 break;
6687 case unsupported_masking:
6688 err_msg = _("unsupported masking");
6689 break;
6690 case mask_not_on_destination:
6691 err_msg = _("mask not on destination operand");
6692 break;
6693 case no_default_mask:
6694 err_msg = _("default mask isn't allowed");
6695 break;
6696 case unsupported_rc_sae:
6697 err_msg = _("unsupported static rounding/sae");
6698 break;
6699 case rc_sae_operand_not_last_imm:
6700 if (intel_syntax)
6701 err_msg = _("RC/SAE operand must precede immediate operands");
6702 else
6703 err_msg = _("RC/SAE operand must follow immediate operands");
6704 break;
6705 case invalid_register_operand:
6706 err_msg = _("invalid register operand");
6707 break;
6708 }
6709 as_bad (_("%s for `%s'"), err_msg,
6710 current_templates->start->name);
6711 return NULL;
6712 }
6713
6714 if (!quiet_warnings)
6715 {
6716 if (!intel_syntax
6717 && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
6718 as_warn (_("indirect %s without `*'"), t->name);
6719
6720 if (t->opcode_modifier.isprefix
6721 && t->opcode_modifier.mnemonicsize == IGNORESIZE)
6722 {
6723 /* Warn them that a data or address size prefix doesn't
6724 affect assembly of the next line of code. */
6725 as_warn (_("stand-alone `%s' prefix"), t->name);
6726 }
6727 }
6728
6729 /* Copy the template we found. */
6730 i.tm = *t;
6731
6732 if (addr_prefix_disp != -1)
6733 i.tm.operand_types[addr_prefix_disp]
6734 = operand_types[addr_prefix_disp];
6735
6736 if (found_reverse_match)
6737 {
6738 /* If we found a reverse match we must alter the opcode direction
6739 bit and clear/flip the regmem modifier bit. found_reverse_match
6740 holds the bits to change (different for int & float insns). */
6741
6742 i.tm.base_opcode ^= found_reverse_match;
6743
6744 i.tm.operand_types[0] = operand_types[i.operands - 1];
6745 i.tm.operand_types[i.operands - 1] = operand_types[0];
6746
6747 /* Certain SIMD insns have their load forms specified in the opcode
6748 table, and hence we need to _set_ RegMem instead of clearing it.
6749 We need to avoid setting the bit though on insns like KMOVW. */
6750 i.tm.opcode_modifier.regmem
6751 = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6752 && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6753 && !i.tm.opcode_modifier.regmem;
6754 }
6755
6756 return t;
6757 }
6758
6759 static int
6760 check_string (void)
6761 {
6762 unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
6763 unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
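/* E.g. the store side of "movs" must use %es: an override such as
   "movsb %ds:(%esi), %fs:(%edi)" is diagnosed here, since hardware
   fixes the destination segment of string stores to %es.  */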
6764
6765 if (i.seg[op] != NULL && i.seg[op] != &es)
6766 {
6767 as_bad (_("`%s' operand %u must use `%ses' segment"),
6768 i.tm.name,
6769 intel_syntax ? i.tm.operands - es_op : es_op + 1,
6770 register_prefix);
6771 return 0;
6772 }
6773
6774 /* There's only ever one segment override allowed per instruction.
6775 This instruction possibly has a legal segment override on the
6776 second operand, so copy the segment to where non-string
6777 instructions store it, allowing common code. */
6778 i.seg[op] = i.seg[1];
6779
6780 return 1;
6781 }
6782
6783 static int
6784 process_suffix (void)
6785 {
6786 bfd_boolean is_crc32 = FALSE;
6787
6788 /* If matched instruction specifies an explicit instruction mnemonic
6789 suffix, use it. */
6790 if (i.tm.opcode_modifier.size == SIZE16)
6791 i.suffix = WORD_MNEM_SUFFIX;
6792 else if (i.tm.opcode_modifier.size == SIZE32)
6793 i.suffix = LONG_MNEM_SUFFIX;
6794 else if (i.tm.opcode_modifier.size == SIZE64)
6795 i.suffix = QWORD_MNEM_SUFFIX;
6796 else if (i.reg_operands
6797 && (i.operands > 1 || i.types[0].bitfield.class == Reg)
6798 && !i.tm.opcode_modifier.addrprefixopreg)
6799 {
6800 unsigned int numop = i.operands;
6801 /* CRC32 */
6802 is_crc32 = (i.tm.base_opcode == 0xf38f0
6803 && i.tm.opcode_modifier.opcodeprefix == PREFIX_0XF2);
6804
6805 /* movsx/movzx want only their source operand considered here, for the
6806 ambiguity checking below. The suffix will be replaced afterwards
6807 to represent the destination (register). */
6808 if (((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w)
6809 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
6810 --i.operands;
6811
6812 /* crc32 needs REX.W set regardless of suffix / source operand size. */
6813 if (is_crc32 && i.tm.operand_types[1].bitfield.qword)
6814 i.rex |= REX_W;
6815
6816 /* If there's no instruction mnemonic suffix we try to invent one
6817 based on GPR operands. */
6818 if (!i.suffix)
6819 {
6820 /* We take i.suffix from the last register operand specified.
6821 The destination register type is more significant than the
6822 source register type. crc32 in SSE4.2 prefers the source
6823 register type. */
6824 unsigned int op = is_crc32 ? 1 : i.operands;
6825
6826 while (op--)
6827 if (i.tm.operand_types[op].bitfield.instance == InstanceNone
6828 || i.tm.operand_types[op].bitfield.instance == Accum)
6829 {
6830 if (i.types[op].bitfield.class != Reg)
6831 continue;
6832 if (i.types[op].bitfield.byte)
6833 i.suffix = BYTE_MNEM_SUFFIX;
6834 else if (i.types[op].bitfield.word)
6835 i.suffix = WORD_MNEM_SUFFIX;
6836 else if (i.types[op].bitfield.dword)
6837 i.suffix = LONG_MNEM_SUFFIX;
6838 else if (i.types[op].bitfield.qword)
6839 i.suffix = QWORD_MNEM_SUFFIX;
6840 else
6841 continue;
6842 break;
6843 }
6844
6845 /* As an exception, movsx/movzx silently default to a byte source
6846 in AT&T mode. */
6847 if ((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w
6848 && !i.suffix && !intel_syntax)
6849 i.suffix = BYTE_MNEM_SUFFIX;
6850 }
6851 else if (i.suffix == BYTE_MNEM_SUFFIX)
6852 {
6853 if (intel_syntax
6854 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6855 && i.tm.opcode_modifier.no_bsuf)
6856 i.suffix = 0;
6857 else if (!check_byte_reg ())
6858 return 0;
6859 }
6860 else if (i.suffix == LONG_MNEM_SUFFIX)
6861 {
6862 if (intel_syntax
6863 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6864 && i.tm.opcode_modifier.no_lsuf
6865 && !i.tm.opcode_modifier.todword
6866 && !i.tm.opcode_modifier.toqword)
6867 i.suffix = 0;
6868 else if (!check_long_reg ())
6869 return 0;
6870 }
6871 else if (i.suffix == QWORD_MNEM_SUFFIX)
6872 {
6873 if (intel_syntax
6874 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6875 && i.tm.opcode_modifier.no_qsuf
6876 && !i.tm.opcode_modifier.todword
6877 && !i.tm.opcode_modifier.toqword)
6878 i.suffix = 0;
6879 else if (!check_qword_reg ())
6880 return 0;
6881 }
6882 else if (i.suffix == WORD_MNEM_SUFFIX)
6883 {
6884 if (intel_syntax
6885 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6886 && i.tm.opcode_modifier.no_wsuf)
6887 i.suffix = 0;
6888 else if (!check_word_reg ())
6889 return 0;
6890 }
6891 else if (intel_syntax
6892 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE)
6893 /* Do nothing if the instruction is going to ignore the prefix. */
6894 ;
6895 else
6896 abort ();
6897
6898 /* Undo the movsx/movzx change done above. */
6899 i.operands = numop;
6900 }
6901 else if (i.tm.opcode_modifier.mnemonicsize == DEFAULTSIZE
6902 && !i.suffix)
6903 {
6904 i.suffix = stackop_size;
6905 if (stackop_size == LONG_MNEM_SUFFIX)
6906 {
6907 /* stackop_size is set to LONG_MNEM_SUFFIX for the
6908 .code16gcc directive to support 16-bit mode with
6909 32-bit addressing. For IRET without a suffix, generate
6910 16-bit IRET (opcode 0xcf) to return from an interrupt
6911 handler. */
6912 if (i.tm.base_opcode == 0xcf)
6913 {
6914 i.suffix = WORD_MNEM_SUFFIX;
6915 as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6916 }
6917 /* Warn about changed behavior for segment register push/pop. */
6918 else if ((i.tm.base_opcode | 1) == 0x07)
6919 as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
6920 i.tm.name);
6921 }
6922 }
6923 else if (!i.suffix
6924 && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
6925 || i.tm.opcode_modifier.jump == JUMP_BYTE
6926 || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
6927 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6928 && i.tm.extension_opcode <= 3)))
6929 {
6930 switch (flag_code)
6931 {
6932 case CODE_64BIT:
6933 if (!i.tm.opcode_modifier.no_qsuf)
6934 {
6935 if (i.tm.opcode_modifier.jump == JUMP_BYTE
6936 || i.tm.opcode_modifier.no_lsuf)
6937 i.suffix = QWORD_MNEM_SUFFIX;
6938 break;
6939 }
6940 /* Fall through. */
6941 case CODE_32BIT:
6942 if (!i.tm.opcode_modifier.no_lsuf)
6943 i.suffix = LONG_MNEM_SUFFIX;
6944 break;
6945 case CODE_16BIT:
6946 if (!i.tm.opcode_modifier.no_wsuf)
6947 i.suffix = WORD_MNEM_SUFFIX;
6948 break;
6949 }
6950 }
6951
6952 if (!i.suffix
6953 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
6954 /* Also cover lret/retf/iret in 64-bit mode. */
6955 || (flag_code == CODE_64BIT
6956 && !i.tm.opcode_modifier.no_lsuf
6957 && !i.tm.opcode_modifier.no_qsuf))
6958 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
6959 /* Explicit sizing prefixes are assumed to disambiguate insns. */
6960 && !i.prefix[DATA_PREFIX] && !(i.prefix[REX_PREFIX] & REX_W)
6961 /* Accept FLDENV et al without suffix. */
6962 && (i.tm.opcode_modifier.no_ssuf || i.tm.opcode_modifier.floatmf))
6963 {
6964 unsigned int suffixes, evex = 0;
6965
6966 suffixes = !i.tm.opcode_modifier.no_bsuf;
6967 if (!i.tm.opcode_modifier.no_wsuf)
6968 suffixes |= 1 << 1;
6969 if (!i.tm.opcode_modifier.no_lsuf)
6970 suffixes |= 1 << 2;
6971 if (!i.tm.opcode_modifier.no_ldsuf)
6972 suffixes |= 1 << 3;
6973 if (!i.tm.opcode_modifier.no_ssuf)
6974 suffixes |= 1 << 4;
6975 if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6976 suffixes |= 1 << 5;
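/* At this point bits 0..5 of SUFFIXES stand for the b/w/l/ld/s/q
   suffixes in that order; bits 6..8 are reserved for the
   xmmword/ymmword/zmmword operand sizes handled below.  */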
6977
6978 /* For [XYZ]MMWORD operands inspect operand sizes. While generally
6979 also suitable for AT&T syntax mode, it was requested that this be
6980 restricted to just Intel syntax. */
6981 if (intel_syntax && is_any_vex_encoding (&i.tm) && !i.broadcast)
6982 {
6983 unsigned int op;
6984
6985 for (op = 0; op < i.tm.operands; ++op)
6986 {
6987 if (is_evex_encoding (&i.tm)
6988 && !cpu_arch_flags.bitfield.cpuavx512vl)
6989 {
6990 if (i.tm.operand_types[op].bitfield.ymmword)
6991 i.tm.operand_types[op].bitfield.xmmword = 0;
6992 if (i.tm.operand_types[op].bitfield.zmmword)
6993 i.tm.operand_types[op].bitfield.ymmword = 0;
6994 if (!i.tm.opcode_modifier.evex
6995 || i.tm.opcode_modifier.evex == EVEXDYN)
6996 i.tm.opcode_modifier.evex = EVEX512;
6997 }
6998
6999 if (i.tm.operand_types[op].bitfield.xmmword
7000 + i.tm.operand_types[op].bitfield.ymmword
7001 + i.tm.operand_types[op].bitfield.zmmword < 2)
7002 continue;
7003
7004 /* Any properly sized operand disambiguates the insn. */
7005 if (i.types[op].bitfield.xmmword
7006 || i.types[op].bitfield.ymmword
7007 || i.types[op].bitfield.zmmword)
7008 {
7009 suffixes &= ~(7 << 6);
7010 evex = 0;
7011 break;
7012 }
7013
7014 if ((i.flags[op] & Operand_Mem)
7015 && i.tm.operand_types[op].bitfield.unspecified)
7016 {
7017 if (i.tm.operand_types[op].bitfield.xmmword)
7018 suffixes |= 1 << 6;
7019 if (i.tm.operand_types[op].bitfield.ymmword)
7020 suffixes |= 1 << 7;
7021 if (i.tm.operand_types[op].bitfield.zmmword)
7022 suffixes |= 1 << 8;
7023 if (is_evex_encoding (&i.tm))
7024 evex = EVEX512;
7025 }
7026 }
7027 }
7028
7029 /* Are multiple suffixes / operand sizes allowed? */
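/* SUFFIXES & (SUFFIXES - 1) is non-zero exactly when more than one
   bit is set, i.e. when more than one size would be acceptable.  */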
7030 if (suffixes & (suffixes - 1))
7031 {
7032 if (intel_syntax
7033 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
7034 || operand_check == check_error))
7035 {
7036 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
7037 return 0;
7038 }
7039 if (operand_check == check_error)
7040 {
7041 as_bad (_("no instruction mnemonic suffix given and "
7042 "no register operands; can't size `%s'"), i.tm.name);
7043 return 0;
7044 }
7045 if (operand_check == check_warning)
7046 as_warn (_("%s; using default for `%s'"),
7047 intel_syntax
7048 ? _("ambiguous operand size")
7049 : _("no instruction mnemonic suffix given and "
7050 "no register operands"),
7051 i.tm.name);
7052
7053 if (i.tm.opcode_modifier.floatmf)
7054 i.suffix = SHORT_MNEM_SUFFIX;
7055 else if ((i.tm.base_opcode | 8) == 0xfbe
7056 || (i.tm.base_opcode == 0x63
7057 && i.tm.cpu_flags.bitfield.cpu64))
7058 /* handled below */;
7059 else if (evex)
7060 i.tm.opcode_modifier.evex = evex;
7061 else if (flag_code == CODE_16BIT)
7062 i.suffix = WORD_MNEM_SUFFIX;
7063 else if (!i.tm.opcode_modifier.no_lsuf)
7064 i.suffix = LONG_MNEM_SUFFIX;
7065 else
7066 i.suffix = QWORD_MNEM_SUFFIX;
7067 }
7068 }
7069
7070 if ((i.tm.base_opcode | 8) == 0xfbe
7071 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
7072 {
7073 /* In Intel syntax, movsx/movzx must have a "suffix" (checked above).
7074 In AT&T syntax, if there is no suffix (warned about above), the default
7075 will be byte extension. */
7076 if (i.tm.opcode_modifier.w && i.suffix && i.suffix != BYTE_MNEM_SUFFIX)
7077 i.tm.base_opcode |= 1;
7078
7079 /* For further processing, the suffix should represent the destination
7080 (register). This is already the case when one was used with
7081 mov[sz][bw]*, but we need to replace it for mov[sz]x, or if there was
7082 no suffix to begin with. */
7083 if (i.tm.opcode_modifier.w || i.tm.base_opcode == 0x63 || !i.suffix)
7084 {
7085 if (i.types[1].bitfield.word)
7086 i.suffix = WORD_MNEM_SUFFIX;
7087 else if (i.types[1].bitfield.qword)
7088 i.suffix = QWORD_MNEM_SUFFIX;
7089 else
7090 i.suffix = LONG_MNEM_SUFFIX;
7091
7092 i.tm.opcode_modifier.w = 0;
7093 }
7094 }
7095
7096 if (!i.tm.opcode_modifier.modrm && i.reg_operands && i.tm.operands < 3)
7097 i.short_form = (i.tm.operand_types[0].bitfield.class == Reg)
7098 != (i.tm.operand_types[1].bitfield.class == Reg);
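/* Short-form encodings place the register number in the low 3 bits of
   the opcode byte instead of using a ModRM byte; e.g. "push %rax" is
   the single byte 0x50, and "push %r8" prepends REX.B to the same
   opcode.  */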
7099
7100 /* Change the opcode based on the operand size given by i.suffix. */
7101 switch (i.suffix)
7102 {
7103 /* Size floating point instruction. */
7104 case LONG_MNEM_SUFFIX:
7105 if (i.tm.opcode_modifier.floatmf)
7106 {
7107 i.tm.base_opcode ^= 4;
7108 break;
7109 }
7110 /* fall through */
7111 case WORD_MNEM_SUFFIX:
7112 case QWORD_MNEM_SUFFIX:
7113 /* It's not a byte, select word/dword operation. */
7114 if (i.tm.opcode_modifier.w)
7115 {
7116 if (i.short_form)
7117 i.tm.base_opcode |= 8;
7118 else
7119 i.tm.base_opcode |= 1;
7120 }
7121 /* fall through */
7122 case SHORT_MNEM_SUFFIX:
7123 /* Now select between word & dword operations via the operand
7124 size prefix, except for instructions that will ignore this
7125 prefix anyway. */
7126 if (i.suffix != QWORD_MNEM_SUFFIX
7127 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
7128 && !i.tm.opcode_modifier.floatmf
7129 && !is_any_vex_encoding (&i.tm)
7130 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
7131 || (flag_code == CODE_64BIT
7132 && i.tm.opcode_modifier.jump == JUMP_BYTE)))
7133 {
7134 unsigned int prefix = DATA_PREFIX_OPCODE;
7135
7136 if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
7137 prefix = ADDR_PREFIX_OPCODE;
7138
7139 if (!add_prefix (prefix))
7140 return 0;
7141 }
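/* E.g. "addw %ax, %bx" assembled for 32-bit code gets the 0x66
   operand size prefix here, while "jcxz" there instead needs 0x67,
   as %cx is an address-sized register for that insn.  */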
7142
7143 /* Set mode64 for an operand. */
7144 if (i.suffix == QWORD_MNEM_SUFFIX
7145 && flag_code == CODE_64BIT
7146 && !i.tm.opcode_modifier.norex64
7147 && !i.tm.opcode_modifier.vexw
7148 /* Special case for xchg %rax,%rax. It is a NOP and doesn't
7149 need rex64. */
7150 && ! (i.operands == 2
7151 && i.tm.base_opcode == 0x90
7152 && i.tm.extension_opcode == None
7153 && i.types[0].bitfield.instance == Accum
7154 && i.types[0].bitfield.qword
7155 && i.types[1].bitfield.instance == Accum
7156 && i.types[1].bitfield.qword))
7157 i.rex |= REX_W;
7158
7159 break;
7160
7161 case 0:
7162 /* Select word/dword/qword operation with explicit data sizing prefix
7163 when there are no suitable register operands. */
7164 if (i.tm.opcode_modifier.w
7165 && (i.prefix[DATA_PREFIX] || (i.prefix[REX_PREFIX] & REX_W))
7166 && (!i.reg_operands
7167 || (i.reg_operands == 1
7168 /* ShiftCount */
7169 && (i.tm.operand_types[0].bitfield.instance == RegC
7170 /* InOutPortReg */
7171 || i.tm.operand_types[0].bitfield.instance == RegD
7172 || i.tm.operand_types[1].bitfield.instance == RegD
7173 /* CRC32 */
7174 || is_crc32))))
7175 i.tm.base_opcode |= 1;
7176 break;
7177 }
7178
7179 if (i.tm.opcode_modifier.addrprefixopreg)
7180 {
7181 gas_assert (!i.suffix);
7182 gas_assert (i.reg_operands);
7183
7184 if (i.tm.operand_types[0].bitfield.instance == Accum
7185 || i.operands == 1)
7186 {
7187 /* The address size override prefix changes the size of the
7188 first operand. */
7189 if (flag_code == CODE_64BIT
7190 && i.op[0].regs->reg_type.bitfield.word)
7191 {
7192 as_bad (_("16-bit addressing unavailable for `%s'"),
7193 i.tm.name);
7194 return 0;
7195 }
7196
7197 if ((flag_code == CODE_32BIT
7198 ? i.op[0].regs->reg_type.bitfield.word
7199 : i.op[0].regs->reg_type.bitfield.dword)
7200 && !add_prefix (ADDR_PREFIX_OPCODE))
7201 return 0;
7202 }
7203 else
7204 {
7205 /* Check invalid register operand when the address size override
7206 prefix changes the size of register operands. */
7207 unsigned int op;
7208 enum { need_word, need_dword, need_qword } need;
7209
7210 /* Check the register operand for the address size prefix if
7211 the memory operand has no real registers, like symbol, DISP
7212 or symbol(%rip). */
7213 if (i.mem_operands == 1
7214 && i.reg_operands == 1
7215 && i.operands == 2
7216 && i.types[1].bitfield.class == Reg
7217 && (flag_code == CODE_32BIT
7218 ? i.op[1].regs->reg_type.bitfield.word
7219 : i.op[1].regs->reg_type.bitfield.dword)
7220 && ((i.base_reg == NULL && i.index_reg == NULL)
7221 || (i.base_reg
7222 && i.base_reg->reg_num == RegIP
7223 && i.base_reg->reg_type.bitfield.qword))
7224 && !add_prefix (ADDR_PREFIX_OPCODE))
7225 return 0;
7226
7227 if (flag_code == CODE_32BIT)
7228 need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
7229 else if (i.prefix[ADDR_PREFIX])
7230 need = need_dword;
7231 else
7232 need = flag_code == CODE_64BIT ? need_qword : need_word;
7233
7234 for (op = 0; op < i.operands; op++)
7235 {
7236 if (i.types[op].bitfield.class != Reg)
7237 continue;
7238
7239 switch (need)
7240 {
7241 case need_word:
7242 if (i.op[op].regs->reg_type.bitfield.word)
7243 continue;
7244 break;
7245 case need_dword:
7246 if (i.op[op].regs->reg_type.bitfield.dword)
7247 continue;
7248 break;
7249 case need_qword:
7250 if (i.op[op].regs->reg_type.bitfield.qword)
7251 continue;
7252 break;
7253 }
7254
7255 as_bad (_("invalid register operand size for `%s'"),
7256 i.tm.name);
7257 return 0;
7258 }
7259 }
7260 }
7261
7262 return 1;
7263 }
7264
7265 static int
7266 check_byte_reg (void)
7267 {
7268 int op;
7269
7270 for (op = i.operands; --op >= 0;)
7271 {
7272 /* Skip non-register operands. */
7273 if (i.types[op].bitfield.class != Reg)
7274 continue;
7275
7276 /* If this is an eight bit register, it's OK. If it's the 16 or
7277 32 bit version of an eight bit register, we will just use the
7278 low portion, and that's OK too. */
7279 if (i.types[op].bitfield.byte)
7280 continue;
7281
7282 /* I/O port address operands are OK too. */
7283 if (i.tm.operand_types[op].bitfield.instance == RegD
7284 && i.tm.operand_types[op].bitfield.word)
7285 continue;
7286
7287 /* crc32 only wants its source operand checked here. */
7288 if (i.tm.base_opcode == 0xf38f0
7289 && i.tm.opcode_modifier.opcodeprefix == PREFIX_0XF2
7290 && op != 0)
7291 continue;
7292
7293 /* Any other register is bad. */
7294 as_bad (_("`%s%s' not allowed with `%s%c'"),
7295 register_prefix, i.op[op].regs->reg_name,
7296 i.tm.name, i.suffix);
7297 return 0;
7298 }
7299 return 1;
7300 }
7301
7302 static int
7303 check_long_reg (void)
7304 {
7305 int op;
7306
7307 for (op = i.operands; --op >= 0;)
7308 /* Skip non-register operands. */
7309 if (i.types[op].bitfield.class != Reg)
7310 continue;
7311 /* Reject eight bit registers, except where the template requires
7312 them. (e.g. movzb) */
7313 else if (i.types[op].bitfield.byte
7314 && (i.tm.operand_types[op].bitfield.class == Reg
7315 || i.tm.operand_types[op].bitfield.instance == Accum)
7316 && (i.tm.operand_types[op].bitfield.word
7317 || i.tm.operand_types[op].bitfield.dword))
7318 {
7319 as_bad (_("`%s%s' not allowed with `%s%c'"),
7320 register_prefix,
7321 i.op[op].regs->reg_name,
7322 i.tm.name,
7323 i.suffix);
7324 return 0;
7325 }
7326 /* Error if the e prefix on a general reg is missing. */
7327 else if (i.types[op].bitfield.word
7328 && (i.tm.operand_types[op].bitfield.class == Reg
7329 || i.tm.operand_types[op].bitfield.instance == Accum)
7330 && i.tm.operand_types[op].bitfield.dword)
7331 {
7332 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7333 register_prefix, i.op[op].regs->reg_name,
7334 i.suffix);
7335 return 0;
7336 }
7337 /* Warn if the r prefix on a general reg is present. */
7338 else if (i.types[op].bitfield.qword
7339 && (i.tm.operand_types[op].bitfield.class == Reg
7340 || i.tm.operand_types[op].bitfield.instance == Accum)
7341 && i.tm.operand_types[op].bitfield.dword)
7342 {
7343 if (intel_syntax
7344 && i.tm.opcode_modifier.toqword
7345 && i.types[0].bitfield.class != RegSIMD)
7346 {
7347 /* Convert to QWORD. We want REX byte. */
7348 i.suffix = QWORD_MNEM_SUFFIX;
7349 }
7350 else
7351 {
7352 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7353 register_prefix, i.op[op].regs->reg_name,
7354 i.suffix);
7355 return 0;
7356 }
7357 }
7358 return 1;
7359 }
7360
7361 static int
7362 check_qword_reg (void)
7363 {
7364 int op;
7365
7366 for (op = i.operands; --op >= 0; )
7367 /* Skip non-register operands. */
7368 if (i.types[op].bitfield.class != Reg)
7369 continue;
7370 /* Reject eight bit registers, except where the template requires
7371 them. (e.g. movzb) */
7372 else if (i.types[op].bitfield.byte
7373 && (i.tm.operand_types[op].bitfield.class == Reg
7374 || i.tm.operand_types[op].bitfield.instance == Accum)
7375 && (i.tm.operand_types[op].bitfield.word
7376 || i.tm.operand_types[op].bitfield.dword))
7377 {
7378 as_bad (_("`%s%s' not allowed with `%s%c'"),
7379 register_prefix,
7380 i.op[op].regs->reg_name,
7381 i.tm.name,
7382 i.suffix);
7383 return 0;
7384 }
7385 /* Warn if the r prefix on a general reg is missing. */
7386 else if ((i.types[op].bitfield.word
7387 || i.types[op].bitfield.dword)
7388 && (i.tm.operand_types[op].bitfield.class == Reg
7389 || i.tm.operand_types[op].bitfield.instance == Accum)
7390 && i.tm.operand_types[op].bitfield.qword)
7391 {
7392 /* Prohibit these changes in 64-bit mode, since the
7393 lowering is more complicated. */
7394 if (intel_syntax
7395 && i.tm.opcode_modifier.todword
7396 && i.types[0].bitfield.class != RegSIMD)
7397 {
7398 /* Convert to DWORD. We don't want REX byte. */
7399 i.suffix = LONG_MNEM_SUFFIX;
7400 }
7401 else
7402 {
7403 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7404 register_prefix, i.op[op].regs->reg_name,
7405 i.suffix);
7406 return 0;
7407 }
7408 }
7409 return 1;
7410 }
7411
7412 static int
7413 check_word_reg (void)
7414 {
7415 int op;
7416 for (op = i.operands; --op >= 0;)
7417 /* Skip non-register operands. */
7418 if (i.types[op].bitfield.class != Reg)
7419 continue;
7420 /* Reject eight bit registers, except where the template requires
7421 them. (eg. movzb) */
7422 else if (i.types[op].bitfield.byte
7423 && (i.tm.operand_types[op].bitfield.class == Reg
7424 || i.tm.operand_types[op].bitfield.instance == Accum)
7425 && (i.tm.operand_types[op].bitfield.word
7426 || i.tm.operand_types[op].bitfield.dword))
7427 {
7428 as_bad (_("`%s%s' not allowed with `%s%c'"),
7429 register_prefix,
7430 i.op[op].regs->reg_name,
7431 i.tm.name,
7432 i.suffix);
7433 return 0;
7434 }
7435 /* Error if the e or r prefix on a general reg is present. */
7436 else if ((i.types[op].bitfield.dword
7437 || i.types[op].bitfield.qword)
7438 && (i.tm.operand_types[op].bitfield.class == Reg
7439 || i.tm.operand_types[op].bitfield.instance == Accum)
7440 && i.tm.operand_types[op].bitfield.word)
7441 {
7442 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7443 register_prefix, i.op[op].regs->reg_name,
7444 i.suffix);
7445 return 0;
7446 }
7447 return 1;
7448 }
7449
7450 static int
7451 update_imm (unsigned int j)
7452 {
7453 i386_operand_type overlap = i.types[j];
7454 if ((overlap.bitfield.imm8
7455 || overlap.bitfield.imm8s
7456 || overlap.bitfield.imm16
7457 || overlap.bitfield.imm32
7458 || overlap.bitfield.imm32s
7459 || overlap.bitfield.imm64)
7460 && !operand_type_equal (&overlap, &imm8)
7461 && !operand_type_equal (&overlap, &imm8s)
7462 && !operand_type_equal (&overlap, &imm16)
7463 && !operand_type_equal (&overlap, &imm32)
7464 && !operand_type_equal (&overlap, &imm32s)
7465 && !operand_type_equal (&overlap, &imm64))
7466 {
7467 if (i.suffix)
7468 {
7469 i386_operand_type temp;
7470
7471 operand_type_set (&temp, 0);
7472 if (i.suffix == BYTE_MNEM_SUFFIX)
7473 {
7474 temp.bitfield.imm8 = overlap.bitfield.imm8;
7475 temp.bitfield.imm8s = overlap.bitfield.imm8s;
7476 }
7477 else if (i.suffix == WORD_MNEM_SUFFIX)
7478 temp.bitfield.imm16 = overlap.bitfield.imm16;
7479 else if (i.suffix == QWORD_MNEM_SUFFIX)
7480 {
7481 temp.bitfield.imm64 = overlap.bitfield.imm64;
7482 temp.bitfield.imm32s = overlap.bitfield.imm32s;
7483 }
7484 else
7485 temp.bitfield.imm32 = overlap.bitfield.imm32;
7486 overlap = temp;
7487 }
7488 else if (operand_type_equal (&overlap, &imm16_32_32s)
7489 || operand_type_equal (&overlap, &imm16_32)
7490 || operand_type_equal (&overlap, &imm16_32s))
7491 {
7492 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
7493 overlap = imm16;
7494 else
7495 overlap = imm32s;
7496 }
7497 else if (i.prefix[REX_PREFIX] & REX_W)
7498 overlap = operand_type_and (overlap, imm32s);
7499 else if (i.prefix[DATA_PREFIX])
7500 overlap = operand_type_and (overlap,
7501 flag_code != CODE_16BIT ? imm16 : imm32);
7502 if (!operand_type_equal (&overlap, &imm8)
7503 && !operand_type_equal (&overlap, &imm8s)
7504 && !operand_type_equal (&overlap, &imm16)
7505 && !operand_type_equal (&overlap, &imm32)
7506 && !operand_type_equal (&overlap, &imm32s)
7507 && !operand_type_equal (&overlap, &imm64))
7508 {
7509 as_bad (_("no instruction mnemonic suffix given; "
7510 "can't determine immediate size"));
7511 return 0;
7512 }
7513 }
7514 i.types[j] = overlap;
7515
7516 return 1;
7517 }
7518
7519 static int
7520 finalize_imm (void)
7521 {
7522 unsigned int j, n;
7523
7524 /* Update the first 2 immediate operands. */
7525 n = i.operands > 2 ? 2 : i.operands;
7526 if (n)
7527 {
7528 for (j = 0; j < n; j++)
7529 if (update_imm (j) == 0)
7530 return 0;
7531
7532 /* The 3rd operand can't be an immediate operand. */
7533 gas_assert (operand_type_check (i.types[2], imm) == 0);
7534 }
7535
7536 return 1;
7537 }
7538
7539 static int
7540 process_operands (void)
7541 {
7542 /* Default segment register this instruction will use for memory
7543 accesses. 0 means unknown. This is only for optimizing out
7544 unnecessary segment overrides. */
7545 const seg_entry *default_seg = 0;
7546
7547 if (i.tm.opcode_modifier.sse2avx)
7548 {
7549 /* Legacy encoded insns allow explicit REX prefixes, so these prefixes
7550 need converting. */
7551 i.rex |= i.prefix[REX_PREFIX] & (REX_W | REX_R | REX_X | REX_B);
7552 i.prefix[REX_PREFIX] = 0;
7553 i.rex_encoding = 0;
7554 }
7555 /* ImmExt should be processed after SSE2AVX. */
7556 else if (i.tm.opcode_modifier.immext)
7557 process_immext ();
7558
7559 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
7560 {
7561 unsigned int dupl = i.operands;
7562 unsigned int dest = dupl - 1;
7563 unsigned int j;
7564
7565 /* The destination must be an xmm register. */
7566 gas_assert (i.reg_operands
7567 && MAX_OPERANDS > dupl
7568 && operand_type_equal (&i.types[dest], &regxmm));
7569
7570 if (i.tm.operand_types[0].bitfield.instance == Accum
7571 && i.tm.operand_types[0].bitfield.xmmword)
7572 {
7573 if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
7574 {
7575 /* Keep xmm0 for instructions with VEX prefix and 3
7576 sources. */
7577 i.tm.operand_types[0].bitfield.instance = InstanceNone;
7578 i.tm.operand_types[0].bitfield.class = RegSIMD;
7579 goto duplicate;
7580 }
7581 else
7582 {
7583 /* We remove the first xmm0 and keep the number of
7584 operands unchanged, which in fact duplicates the
7585 destination. */
7586 for (j = 1; j < i.operands; j++)
7587 {
7588 i.op[j - 1] = i.op[j];
7589 i.types[j - 1] = i.types[j];
7590 i.tm.operand_types[j - 1] = i.tm.operand_types[j];
7591 i.flags[j - 1] = i.flags[j];
7592 }
7593 }
7594 }
7595 else if (i.tm.opcode_modifier.implicit1stxmm0)
7596 {
7597 gas_assert ((MAX_OPERANDS - 1) > dupl
7598 && (i.tm.opcode_modifier.vexsources
7599 == VEX3SOURCES));
7600
7601 /* Add the implicit xmm0 for instructions with VEX prefix
7602 and 3 sources. */
7603 for (j = i.operands; j > 0; j--)
7604 {
7605 i.op[j] = i.op[j - 1];
7606 i.types[j] = i.types[j - 1];
7607 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
7608 i.flags[j] = i.flags[j - 1];
7609 }
7610 i.op[0].regs
7611 = (const reg_entry *) str_hash_find (reg_hash, "xmm0");
7612 i.types[0] = regxmm;
7613 i.tm.operand_types[0] = regxmm;
7614
7615 i.operands += 2;
7616 i.reg_operands += 2;
7617 i.tm.operands += 2;
7618
7619 dupl++;
7620 dest++;
7621 i.op[dupl] = i.op[dest];
7622 i.types[dupl] = i.types[dest];
7623 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7624 i.flags[dupl] = i.flags[dest];
7625 }
7626 else
7627 {
7628 duplicate:
7629 i.operands++;
7630 i.reg_operands++;
7631 i.tm.operands++;
7632
7633 i.op[dupl] = i.op[dest];
7634 i.types[dupl] = i.types[dest];
7635 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7636 i.flags[dupl] = i.flags[dest];
7637 }
7638
7639 if (i.tm.opcode_modifier.immext)
7640 process_immext ();
7641 }
7642 else if (i.tm.operand_types[0].bitfield.instance == Accum
7643 && i.tm.operand_types[0].bitfield.xmmword)
7644 {
7645 unsigned int j;
7646
7647 for (j = 1; j < i.operands; j++)
7648 {
7649 i.op[j - 1] = i.op[j];
7650 i.types[j - 1] = i.types[j];
7651
7652 /* We need to adjust fields in i.tm since they are used by
7653 build_modrm_byte. */
7654 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
7655
7656 i.flags[j - 1] = i.flags[j];
7657 }
7658
7659 i.operands--;
7660 i.reg_operands--;
7661 i.tm.operands--;
7662 }
7663 else if (i.tm.opcode_modifier.implicitquadgroup)
7664 {
7665 unsigned int regnum, first_reg_in_group, last_reg_in_group;
7666
7667 /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
7668 gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
7669 regnum = register_number (i.op[1].regs);
7670 first_reg_in_group = regnum & ~3;
7671 last_reg_in_group = first_reg_in_group + 3;
7672 if (regnum != first_reg_in_group)
7673 as_warn (_("source register `%s%s' implicitly denotes"
7674 " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
7675 register_prefix, i.op[1].regs->reg_name,
7676 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
7677 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
7678 i.tm.name);
7679 }
7680 else if (i.tm.opcode_modifier.regkludge)
7681 {
7682 /* The imul $imm, %reg instruction is converted into
7683 imul $imm, %reg, %reg, and the clr %reg instruction
7684 is converted into xor %reg, %reg. */
7685
7686 unsigned int first_reg_op;
7687
7688 if (operand_type_check (i.types[0], reg))
7689 first_reg_op = 0;
7690 else
7691 first_reg_op = 1;
7692 /* Pretend we saw the extra register operand. */
7693 gas_assert (i.reg_operands == 1
7694 && i.op[first_reg_op + 1].regs == 0);
7695 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7696 i.types[first_reg_op + 1] = i.types[first_reg_op];
7697 i.operands++;
7698 i.reg_operands++;
7699 }
7700
7701 if (i.tm.opcode_modifier.modrm)
7702 {
7703 /* The opcode is completed (modulo i.tm.extension_opcode which
7704 must be put into the modrm byte). Now, we make the modrm and
7705 index base bytes based on all the info we've collected. */
7706
7707 default_seg = build_modrm_byte ();
7708 }
7709 else if (i.types[0].bitfield.class == SReg)
7710 {
7711 if (flag_code != CODE_64BIT
7712 ? i.tm.base_opcode == POP_SEG_SHORT
7713 && i.op[0].regs->reg_num == 1
7714 : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
7715 && i.op[0].regs->reg_num < 4)
7716 {
7717 as_bad (_("you can't `%s %s%s'"),
7718 i.tm.name, register_prefix, i.op[0].regs->reg_name);
7719 return 0;
7720 }
7721 	  if (i.op[0].regs->reg_num > 3 && i.tm.opcode_length == 1)
7722 {
7723 i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
7724 i.tm.opcode_length = 2;
7725 }
7726 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
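	  /* Worked example (assumed byte values): with a base opcode of
	     0x07 this yields 0x07 for "pop %es" (reg 0) and 0x1f for
	     "pop %ds" (reg 3, 0x07 | 3 << 3), while %fs/%gs take the
	     two-byte 0f a1 / 0f a9 forms selected just above.  */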
7727 }
7728 else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
7729 {
7730 default_seg = &ds;
7731 }
7732 else if (i.tm.opcode_modifier.isstring)
7733 {
7734 /* For the string instructions that allow a segment override
7735 on one of their operands, the default segment is ds. */
7736 default_seg = &ds;
7737 }
7738 else if (i.short_form)
7739 {
7740 /* The register or float register operand is in operand
7741 0 or 1. */
7742 unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
7743
7744 /* Register goes in low 3 bits of opcode. */
7745 i.tm.base_opcode |= i.op[op].regs->reg_num;
7746 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7747 i.rex |= REX_B;
7748 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7749 {
7750 /* Warn about some common errors, but press on regardless.
7751 The first case can be generated by gcc (<= 2.8.1). */
7752 if (i.operands == 2)
7753 {
7754 /* Reversed arguments on faddp, fsubp, etc. */
7755 as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7756 register_prefix, i.op[!intel_syntax].regs->reg_name,
7757 register_prefix, i.op[intel_syntax].regs->reg_name);
7758 }
7759 else
7760 {
7761 /* Extraneous `l' suffix on fp insn. */
7762 as_warn (_("translating to `%s %s%s'"), i.tm.name,
7763 register_prefix, i.op[0].regs->reg_name);
7764 }
7765 }
7766 }
7767
7768 if ((i.seg[0] || i.prefix[SEG_PREFIX])
7769 && i.tm.base_opcode == 0x8d /* lea */
7770 	  && !is_any_vex_encoding (&i.tm))
7771 {
7772 if (!quiet_warnings)
7773 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7774 if (optimize)
7775 {
7776 i.seg[0] = NULL;
7777 i.prefix[SEG_PREFIX] = 0;
7778 }
7779 }
7780
7781 /* If a segment was explicitly specified, and the specified segment
7782 is neither the default nor the one already recorded from a prefix,
7783 use an opcode prefix to select it. If we never figured out what
7784 the default segment is, then default_seg will be zero at this
7785 point, and the specified segment prefix will always be used. */
7786 if (i.seg[0]
7787 && i.seg[0] != default_seg
7788 && i.seg[0]->seg_prefix != i.prefix[SEG_PREFIX])
7789 {
7790 if (!add_prefix (i.seg[0]->seg_prefix))
7791 return 0;
7792 }
7793 return 1;
7794 }
7795
7796 static INLINE void set_rex_vrex (const reg_entry *r, unsigned int rex_bit,
7797 bfd_boolean do_sse2avx)
7798 {
7799 if (r->reg_flags & RegRex)
7800 {
7801 if (i.rex & rex_bit)
7802 as_bad (_("same type of prefix used twice"));
7803 i.rex |= rex_bit;
7804 }
7805 else if (do_sse2avx && (i.rex & rex_bit) && i.vex.register_specifier)
7806 {
7807 gas_assert (i.vex.register_specifier == r);
7808 i.vex.register_specifier += 8;
7809 }
7810
7811 if (r->reg_flags & RegVRex)
7812 i.vrex |= rex_bit;
7813 }
7814
7815 static const seg_entry *
7816 build_modrm_byte (void)
7817 {
7818 const seg_entry *default_seg = 0;
7819 unsigned int source, dest;
7820 int vex_3_sources;
7821
7822 vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
7823 if (vex_3_sources)
7824 {
7825 unsigned int nds, reg_slot;
7826 expressionS *exp;
7827
7828 dest = i.operands - 1;
7829 nds = dest - 1;
7830
7831 /* There are 2 kinds of instructions:
7832 1. 5 operands: 4 register operands or 3 register operands
7833 plus 1 memory operand plus one Imm4 operand, VexXDS, and
7834 VexW0 or VexW1. The destination must be either XMM, YMM or
7835 ZMM register.
7836 2. 4 operands: 4 register operands or 3 register operands
7837 plus 1 memory operand, with VexXDS. */
7838 gas_assert ((i.reg_operands == 4
7839 || (i.reg_operands == 3 && i.mem_operands == 1))
7840 && i.tm.opcode_modifier.vexvvvv == VEXXDS
7841 && i.tm.opcode_modifier.vexw
7842 && i.tm.operand_types[dest].bitfield.class == RegSIMD);
7843
7844 /* If VexW1 is set, the first non-immediate operand is the source and
7845 the second non-immediate one is encoded in the immediate operand. */
7846 if (i.tm.opcode_modifier.vexw == VEXW1)
7847 {
7848 source = i.imm_operands;
7849 reg_slot = i.imm_operands + 1;
7850 }
7851 else
7852 {
7853 source = i.imm_operands + 1;
7854 reg_slot = i.imm_operands;
7855 }
7856
7857 if (i.imm_operands == 0)
7858 {
7859 /* When there is no immediate operand, generate an 8bit
7860 immediate operand to encode the first operand. */
7861 exp = &im_expressions[i.imm_operands++];
7862 i.op[i.operands].imms = exp;
7863 i.types[i.operands] = imm8;
7864 i.operands++;
7865
7866 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7867 exp->X_op = O_constant;
7868 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
7869 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7870 }
7871 else
7872 {
7873 gas_assert (i.imm_operands == 1);
7874 gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7875 gas_assert (!i.tm.opcode_modifier.immext);
7876
7877 /* Turn on Imm8 again so that output_imm will generate it. */
7878 i.types[0].bitfield.imm8 = 1;
7879
7880 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7881 i.op[0].imms->X_add_number
7882 |= register_number (i.op[reg_slot].regs) << 4;
7883 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7884 }
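      /* Either way, the extra register number lands in bits 7:4 of the
	 immediate byte -- e.g. (assumed example) %xmm5 there would
	 contribute 5 << 4 == 0x50.  */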
7885
7886 gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
7887 i.vex.register_specifier = i.op[nds].regs;
7888 }
7889 else
7890 source = dest = 0;
7891
7892 /* i.reg_operands MUST be the number of real register operands;
7893 implicit registers do not count. If there are 3 register
7894 	 operands, it must be an instruction with VexNDS. For an
7895 	 instruction with VexNDD, the destination register is encoded
7896 	 in the VEX prefix. If there are 4 register operands, it must
7897 	 be an instruction with a VEX prefix and 3 sources. */
7898 if (i.mem_operands == 0
7899 && ((i.reg_operands == 2
7900 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7901 || (i.reg_operands == 3
7902 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7903 || (i.reg_operands == 4 && vex_3_sources)))
7904 {
7905 switch (i.operands)
7906 {
7907 case 2:
7908 source = 0;
7909 break;
7910 case 3:
7911 	  /* When there are 3 operands, one of them may be immediate,
7912 	     which may be the first or the last operand. Otherwise,
7913 	     the first operand must be the shift count register (%cl)
7914 	     or it is an instruction with VexNDS.
7915 gas_assert (i.imm_operands == 1
7916 || (i.imm_operands == 0
7917 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
7918 || (i.types[0].bitfield.instance == RegC
7919 && i.types[0].bitfield.byte))));
7920 if (operand_type_check (i.types[0], imm)
7921 || (i.types[0].bitfield.instance == RegC
7922 && i.types[0].bitfield.byte))
7923 source = 1;
7924 else
7925 source = 0;
7926 break;
7927 case 4:
7928 /* When there are 4 operands, the first two must be 8bit
7929 immediate operands. The source operand will be the 3rd
7930 one.
7931
7932 	     For instructions with VexNDS, if the first operand is
7933 	     an imm8, the source operand is the 2nd one. If the last
7934 operand is imm8, the source operand is the first one. */
7935 gas_assert ((i.imm_operands == 2
7936 && i.types[0].bitfield.imm8
7937 && i.types[1].bitfield.imm8)
7938 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7939 && i.imm_operands == 1
7940 && (i.types[0].bitfield.imm8
7941 || i.types[i.operands - 1].bitfield.imm8
7942 || i.rounding)));
7943 if (i.imm_operands == 2)
7944 source = 2;
7945 else
7946 {
7947 if (i.types[0].bitfield.imm8)
7948 source = 1;
7949 else
7950 source = 0;
7951 }
7952 break;
7953 case 5:
7954 if (is_evex_encoding (&i.tm))
7955 {
7956 	      /* For EVEX instructions, when there are 5 operands, the
7957 		 first one must be an immediate operand. If the second one
7958 		 is an immediate operand, the source operand is the 3rd
7959 		 one. If the last one is an immediate operand, the source
7960 		 operand is the 2nd one. */
7961 gas_assert (i.imm_operands == 2
7962 && i.tm.opcode_modifier.sae
7963 && operand_type_check (i.types[0], imm));
7964 if (operand_type_check (i.types[1], imm))
7965 source = 2;
7966 else if (operand_type_check (i.types[4], imm))
7967 source = 1;
7968 else
7969 abort ();
7970 }
7971 break;
7972 default:
7973 abort ();
7974 }
7975
7976 if (!vex_3_sources)
7977 {
7978 dest = source + 1;
7979
7980 /* RC/SAE operand could be between DEST and SRC. That happens
7981 when one operand is GPR and the other one is XMM/YMM/ZMM
7982 register. */
7983 if (i.rounding && i.rounding->operand == (int) dest)
7984 dest++;
7985
7986 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7987 {
7988 /* For instructions with VexNDS, the register-only source
7989 operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7990 register. It is encoded in VEX prefix. */
7991
7992 i386_operand_type op;
7993 unsigned int vvvv;
7994
7995 /* Swap two source operands if needed. */
7996 if (i.tm.opcode_modifier.swapsources)
7997 {
7998 vvvv = source;
7999 source = dest;
8000 }
8001 else
8002 vvvv = dest;
8003
8004 op = i.tm.operand_types[vvvv];
8005 if ((dest + 1) >= i.operands
8006 || ((op.bitfield.class != Reg
8007 || (!op.bitfield.dword && !op.bitfield.qword))
8008 && op.bitfield.class != RegSIMD
8009 && !operand_type_equal (&op, &regmask)))
8010 abort ();
8011 i.vex.register_specifier = i.op[vvvv].regs;
8012 dest++;
8013 }
8014 }
8015
8016 i.rm.mode = 3;
8017 /* One of the register operands will be encoded in the i.rm.reg
8018 field, the other in the combined i.rm.mode and i.rm.regmem
8019 fields. If no form of this instruction supports a memory
8020 destination operand, then we assume the source operand may
8021 sometimes be a memory operand and so we need to store the
8022 destination in the i.rm.reg field. */
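      /* Illustrative (assumed) encoding: "movl %eax, %ebx" uses opcode
	 0x89 with ModRM 0xc3 -- mode 3, reg 0 (%eax, the source, since
	 a memory-destination form exists) and regmem 3 (%ebx).  */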
8023 if (!i.tm.opcode_modifier.regmem
8024 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
8025 {
8026 i.rm.reg = i.op[dest].regs->reg_num;
8027 i.rm.regmem = i.op[source].regs->reg_num;
8028 set_rex_vrex (i.op[dest].regs, REX_R, i.tm.opcode_modifier.sse2avx);
8029 set_rex_vrex (i.op[source].regs, REX_B, FALSE);
8030 }
8031 else
8032 {
8033 i.rm.reg = i.op[source].regs->reg_num;
8034 i.rm.regmem = i.op[dest].regs->reg_num;
8035 set_rex_vrex (i.op[dest].regs, REX_B, i.tm.opcode_modifier.sse2avx);
8036 set_rex_vrex (i.op[source].regs, REX_R, FALSE);
8037 }
8038 if (flag_code != CODE_64BIT && (i.rex & REX_R))
8039 {
8040 if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
8041 abort ();
8042 i.rex &= ~REX_R;
8043 add_prefix (LOCK_PREFIX_OPCODE);
8044 }
8045 }
8046 else
8047 { /* If it's not 2 reg operands... */
8048 unsigned int mem;
8049
8050 if (i.mem_operands)
8051 {
8052 unsigned int fake_zero_displacement = 0;
8053 unsigned int op;
8054
8055 for (op = 0; op < i.operands; op++)
8056 if (i.flags[op] & Operand_Mem)
8057 break;
8058 gas_assert (op < i.operands);
8059
8060 if (i.tm.opcode_modifier.sib)
8061 {
8062 /* The index register of VSIB shouldn't be RegIZ. */
8063 if (i.tm.opcode_modifier.sib != SIBMEM
8064 && i.index_reg->reg_num == RegIZ)
8065 abort ();
8066
8067 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8068 if (!i.base_reg)
8069 {
8070 i.sib.base = NO_BASE_REGISTER;
8071 i.sib.scale = i.log2_scale_factor;
8072 i.types[op].bitfield.disp8 = 0;
8073 i.types[op].bitfield.disp16 = 0;
8074 i.types[op].bitfield.disp64 = 0;
8075 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
8076 {
8077 /* Must be 32 bit */
8078 i.types[op].bitfield.disp32 = 1;
8079 i.types[op].bitfield.disp32s = 0;
8080 }
8081 else
8082 {
8083 i.types[op].bitfield.disp32 = 0;
8084 i.types[op].bitfield.disp32s = 1;
8085 }
8086 }
8087
8088 	      /* Since the mandatory SIB always has an index register, the
8089 		 code logic remains unchanged. The non-mandatory SIB
8090 		 without an index register is allowed and will be handled
8091 		 later. */
8092 if (i.index_reg)
8093 {
8094 if (i.index_reg->reg_num == RegIZ)
8095 i.sib.index = NO_INDEX_REGISTER;
8096 else
8097 i.sib.index = i.index_reg->reg_num;
8098 set_rex_vrex (i.index_reg, REX_X, FALSE);
8099 }
8100 }
8101
8102 default_seg = &ds;
8103
8104 if (i.base_reg == 0)
8105 {
8106 i.rm.mode = 0;
8107 if (!i.disp_operands)
8108 fake_zero_displacement = 1;
8109 if (i.index_reg == 0)
8110 {
8111 i386_operand_type newdisp;
8112
8113 		  /* Check for both VSIB and the mandatory non-vector SIB. */
8114 gas_assert (!i.tm.opcode_modifier.sib
8115 || i.tm.opcode_modifier.sib == SIBMEM);
8116 /* Operand is just <disp> */
8117 if (flag_code == CODE_64BIT)
8118 {
8119 		      /* 64bit mode replaces 32bit absolute
8120 			 addressing with RIP relative addressing;
8121 			 absolute addressing is encoded by one of the
8122 			 redundant SIB forms. */
8123 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8124 i.sib.base = NO_BASE_REGISTER;
8125 i.sib.index = NO_INDEX_REGISTER;
8126 newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
8127 }
8128 else if ((flag_code == CODE_16BIT)
8129 ^ (i.prefix[ADDR_PREFIX] != 0))
8130 {
8131 i.rm.regmem = NO_BASE_REGISTER_16;
8132 newdisp = disp16;
8133 }
8134 else
8135 {
8136 i.rm.regmem = NO_BASE_REGISTER;
8137 newdisp = disp32;
8138 }
8139 i.types[op] = operand_type_and_not (i.types[op], anydisp);
8140 i.types[op] = operand_type_or (i.types[op], newdisp);
8141 }
8142 else if (!i.tm.opcode_modifier.sib)
8143 {
8144 /* !i.base_reg && i.index_reg */
8145 if (i.index_reg->reg_num == RegIZ)
8146 i.sib.index = NO_INDEX_REGISTER;
8147 else
8148 i.sib.index = i.index_reg->reg_num;
8149 i.sib.base = NO_BASE_REGISTER;
8150 i.sib.scale = i.log2_scale_factor;
8151 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8152 i.types[op].bitfield.disp8 = 0;
8153 i.types[op].bitfield.disp16 = 0;
8154 i.types[op].bitfield.disp64 = 0;
8155 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
8156 {
8157 /* Must be 32 bit */
8158 i.types[op].bitfield.disp32 = 1;
8159 i.types[op].bitfield.disp32s = 0;
8160 }
8161 else
8162 {
8163 i.types[op].bitfield.disp32 = 0;
8164 i.types[op].bitfield.disp32s = 1;
8165 }
8166 if ((i.index_reg->reg_flags & RegRex) != 0)
8167 i.rex |= REX_X;
8168 }
8169 }
8170 /* RIP addressing for 64bit mode. */
8171 else if (i.base_reg->reg_num == RegIP)
8172 {
8173 gas_assert (!i.tm.opcode_modifier.sib);
8174 i.rm.regmem = NO_BASE_REGISTER;
8175 i.types[op].bitfield.disp8 = 0;
8176 i.types[op].bitfield.disp16 = 0;
8177 i.types[op].bitfield.disp32 = 0;
8178 i.types[op].bitfield.disp32s = 1;
8179 i.types[op].bitfield.disp64 = 0;
8180 i.flags[op] |= Operand_PCrel;
8181 if (! i.disp_operands)
8182 fake_zero_displacement = 1;
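	      /* Illustrative (assumed) example: "movq foo(%rip), %rax"
		 encodes as 48 8b 05 <disp32>, ModRM 0x05 selecting
		 mode 0 / regmem 5, i.e. RIP-relative here.  */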
8183 }
8184 else if (i.base_reg->reg_type.bitfield.word)
8185 {
8186 gas_assert (!i.tm.opcode_modifier.sib);
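	      /* For reference, the 16-bit ModRM regmem encodings are:
		 0 (%bx,%si)  1 (%bx,%di)  2 (%bp,%si)  3 (%bp,%di)
		 4 (%si)  5 (%di)  6 (%bp) (or bare disp16 when mode is 0)
		 7 (%bx) -- which is what the cases below compute.  */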
8187 switch (i.base_reg->reg_num)
8188 {
8189 case 3: /* (%bx) */
8190 if (i.index_reg == 0)
8191 i.rm.regmem = 7;
8192 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
8193 i.rm.regmem = i.index_reg->reg_num - 6;
8194 break;
8195 case 5: /* (%bp) */
8196 default_seg = &ss;
8197 if (i.index_reg == 0)
8198 {
8199 i.rm.regmem = 6;
8200 if (operand_type_check (i.types[op], disp) == 0)
8201 {
8202 /* fake (%bp) into 0(%bp) */
8203 if (i.disp_encoding == disp_encoding_16bit)
8204 i.types[op].bitfield.disp16 = 1;
8205 else
8206 i.types[op].bitfield.disp8 = 1;
8207 fake_zero_displacement = 1;
8208 }
8209 }
8210 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
8211 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
8212 break;
8213 default: /* (%si) -> 4 or (%di) -> 5 */
8214 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
8215 }
8216 if (!fake_zero_displacement
8217 && !i.disp_operands
8218 && i.disp_encoding)
8219 {
8220 fake_zero_displacement = 1;
8221 if (i.disp_encoding == disp_encoding_8bit)
8222 i.types[op].bitfield.disp8 = 1;
8223 else
8224 i.types[op].bitfield.disp16 = 1;
8225 }
8226 i.rm.mode = mode_from_disp_size (i.types[op]);
8227 }
8228 else /* i.base_reg and 32/64 bit mode */
8229 {
8230 if (flag_code == CODE_64BIT
8231 && operand_type_check (i.types[op], disp))
8232 {
8233 i.types[op].bitfield.disp16 = 0;
8234 i.types[op].bitfield.disp64 = 0;
8235 if (i.prefix[ADDR_PREFIX] == 0)
8236 {
8237 i.types[op].bitfield.disp32 = 0;
8238 i.types[op].bitfield.disp32s = 1;
8239 }
8240 else
8241 {
8242 i.types[op].bitfield.disp32 = 1;
8243 i.types[op].bitfield.disp32s = 0;
8244 }
8245 }
8246
8247 if (!i.tm.opcode_modifier.sib)
8248 i.rm.regmem = i.base_reg->reg_num;
8249 if ((i.base_reg->reg_flags & RegRex) != 0)
8250 i.rex |= REX_B;
8251 i.sib.base = i.base_reg->reg_num;
8252 /* x86-64 ignores REX prefix bit here to avoid decoder
8253 complications. */
8254 if (!(i.base_reg->reg_flags & RegRex)
8255 && (i.base_reg->reg_num == EBP_REG_NUM
8256 || i.base_reg->reg_num == ESP_REG_NUM))
8257 default_seg = &ss;
8258 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
8259 {
8260 fake_zero_displacement = 1;
8261 if (i.disp_encoding == disp_encoding_32bit)
8262 i.types[op].bitfield.disp32 = 1;
8263 else
8264 i.types[op].bitfield.disp8 = 1;
8265 }
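	      /* E.g. (assumed example) bare "(%ebp)" -- and "(%r13)" in
		 64-bit mode -- cannot use mode 0, so it is assembled as
		 "0x0(%ebp)" with the one-byte displacement faked here.  */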
8266 i.sib.scale = i.log2_scale_factor;
8267 if (i.index_reg == 0)
8268 {
8269 /* Only check for VSIB. */
8270 gas_assert (i.tm.opcode_modifier.sib != VECSIB128
8271 && i.tm.opcode_modifier.sib != VECSIB256
8272 && i.tm.opcode_modifier.sib != VECSIB512);
8273
8274 /* <disp>(%esp) becomes two byte modrm with no index
8275 register. We've already stored the code for esp
8276 		     in i.rm.regmem, i.e. ESCAPE_TO_TWO_BYTE_ADDRESSING.
8277 Any base register besides %esp will not use the
8278 extra modrm byte. */
8279 i.sib.index = NO_INDEX_REGISTER;
8280 }
8281 else if (!i.tm.opcode_modifier.sib)
8282 {
8283 if (i.index_reg->reg_num == RegIZ)
8284 i.sib.index = NO_INDEX_REGISTER;
8285 else
8286 i.sib.index = i.index_reg->reg_num;
8287 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8288 if ((i.index_reg->reg_flags & RegRex) != 0)
8289 i.rex |= REX_X;
8290 }
8291
8292 if (i.disp_operands
8293 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
8294 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
8295 i.rm.mode = 0;
8296 else
8297 {
8298 if (!fake_zero_displacement
8299 && !i.disp_operands
8300 && i.disp_encoding)
8301 {
8302 fake_zero_displacement = 1;
8303 if (i.disp_encoding == disp_encoding_8bit)
8304 i.types[op].bitfield.disp8 = 1;
8305 else
8306 i.types[op].bitfield.disp32 = 1;
8307 }
8308 i.rm.mode = mode_from_disp_size (i.types[op]);
8309 }
8310 }
8311
8312 if (fake_zero_displacement)
8313 {
8314 /* Fakes a zero displacement assuming that i.types[op]
8315 holds the correct displacement size. */
8316 expressionS *exp;
8317
8318 gas_assert (i.op[op].disps == 0);
8319 exp = &disp_expressions[i.disp_operands++];
8320 i.op[op].disps = exp;
8321 exp->X_op = O_constant;
8322 exp->X_add_number = 0;
8323 exp->X_add_symbol = (symbolS *) 0;
8324 exp->X_op_symbol = (symbolS *) 0;
8325 }
8326
8327 mem = op;
8328 }
8329 else
8330 mem = ~0;
8331
8332 if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
8333 {
8334 if (operand_type_check (i.types[0], imm))
8335 i.vex.register_specifier = NULL;
8336 else
8337 {
8338 /* VEX.vvvv encodes one of the sources when the first
8339 operand is not an immediate. */
8340 if (i.tm.opcode_modifier.vexw == VEXW0)
8341 i.vex.register_specifier = i.op[0].regs;
8342 else
8343 i.vex.register_specifier = i.op[1].regs;
8344 }
8345
8346 /* Destination is a XMM register encoded in the ModRM.reg
8347 and VEX.R bit. */
8348 i.rm.reg = i.op[2].regs->reg_num;
8349 if ((i.op[2].regs->reg_flags & RegRex) != 0)
8350 i.rex |= REX_R;
8351
8352 /* ModRM.rm and VEX.B encodes the other source. */
8353 if (!i.mem_operands)
8354 {
8355 i.rm.mode = 3;
8356
8357 if (i.tm.opcode_modifier.vexw == VEXW0)
8358 i.rm.regmem = i.op[1].regs->reg_num;
8359 else
8360 i.rm.regmem = i.op[0].regs->reg_num;
8361
8362 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8363 i.rex |= REX_B;
8364 }
8365 }
8366 else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
8367 {
8368 i.vex.register_specifier = i.op[2].regs;
8369 if (!i.mem_operands)
8370 {
8371 i.rm.mode = 3;
8372 i.rm.regmem = i.op[1].regs->reg_num;
8373 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8374 i.rex |= REX_B;
8375 }
8376 }
8377 /* Fill in i.rm.reg or i.rm.regmem field with register operand
8378 (if any) based on i.tm.extension_opcode. Again, we must be
8379 careful to make sure that segment/control/debug/test/MMX
8380 registers are coded into the i.rm.reg field. */
8381 else if (i.reg_operands)
8382 {
8383 unsigned int op;
8384 unsigned int vex_reg = ~0;
8385
8386 for (op = 0; op < i.operands; op++)
8387 if (i.types[op].bitfield.class == Reg
8388 || i.types[op].bitfield.class == RegBND
8389 || i.types[op].bitfield.class == RegMask
8390 || i.types[op].bitfield.class == SReg
8391 || i.types[op].bitfield.class == RegCR
8392 || i.types[op].bitfield.class == RegDR
8393 || i.types[op].bitfield.class == RegTR
8394 || i.types[op].bitfield.class == RegSIMD
8395 || i.types[op].bitfield.class == RegMMX)
8396 break;
8397
8398 if (vex_3_sources)
8399 op = dest;
8400 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
8401 {
8402 /* For instructions with VexNDS, the register-only
8403 source operand is encoded in VEX prefix. */
8404 gas_assert (mem != (unsigned int) ~0);
8405
8406 if (op > mem)
8407 {
8408 vex_reg = op++;
8409 gas_assert (op < i.operands);
8410 }
8411 else
8412 {
8413 /* Check register-only source operand when two source
8414 operands are swapped. */
8415 if (!i.tm.operand_types[op].bitfield.baseindex
8416 && i.tm.operand_types[op + 1].bitfield.baseindex)
8417 {
8418 vex_reg = op;
8419 op += 2;
8420 gas_assert (mem == (vex_reg + 1)
8421 && op < i.operands);
8422 }
8423 else
8424 {
8425 vex_reg = op + 1;
8426 gas_assert (vex_reg < i.operands);
8427 }
8428 }
8429 }
8430 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
8431 {
8432 /* For instructions with VexNDD, the register destination
8433 is encoded in VEX prefix. */
8434 if (i.mem_operands == 0)
8435 {
8436 /* There is no memory operand. */
8437 gas_assert ((op + 2) == i.operands);
8438 vex_reg = op + 1;
8439 }
8440 else
8441 {
8442 /* There are only 2 non-immediate operands. */
8443 gas_assert (op < i.imm_operands + 2
8444 && i.operands == i.imm_operands + 2);
8445 vex_reg = i.imm_operands + 1;
8446 }
8447 }
8448 else
8449 gas_assert (op < i.operands);
8450
8451 if (vex_reg != (unsigned int) ~0)
8452 {
8453 i386_operand_type *type = &i.tm.operand_types[vex_reg];
8454
8455 if ((type->bitfield.class != Reg
8456 || (!type->bitfield.dword && !type->bitfield.qword))
8457 && type->bitfield.class != RegSIMD
8458 && !operand_type_equal (type, &regmask))
8459 abort ();
8460
8461 i.vex.register_specifier = i.op[vex_reg].regs;
8462 }
8463
8464 /* Don't set OP operand twice. */
8465 if (vex_reg != op)
8466 {
8467 /* If there is an extension opcode to put here, the
8468 register number must be put into the regmem field. */
8469 if (i.tm.extension_opcode != None)
8470 {
8471 i.rm.regmem = i.op[op].regs->reg_num;
8472 set_rex_vrex (i.op[op].regs, REX_B,
8473 i.tm.opcode_modifier.sse2avx);
8474 }
8475 else
8476 {
8477 i.rm.reg = i.op[op].regs->reg_num;
8478 set_rex_vrex (i.op[op].regs, REX_R,
8479 i.tm.opcode_modifier.sse2avx);
8480 }
8481 }
8482
8483 	  /* Now, if no memory operand has set i.rm.mode to 0, 1, or 2,
8484 	     we must set it to 3 to indicate this is a register operand
8485 	     in the regmem field. */
8486 if (!i.mem_operands)
8487 i.rm.mode = 3;
8488 }
8489
8490 /* Fill in i.rm.reg field with extension opcode (if any). */
8491 if (i.tm.extension_opcode != None)
8492 i.rm.reg = i.tm.extension_opcode;
8493 }
8494 return default_seg;
8495 }
8496
8497 static INLINE void
8498 frag_opcode_byte (unsigned char byte)
8499 {
8500 if (now_seg != absolute_section)
8501 FRAG_APPEND_1_CHAR (byte);
8502 else
8503 ++abs_section_offset;
8504 }
8505
8506 static unsigned int
8507 flip_code16 (unsigned int code16)
8508 {
8509 gas_assert (i.tm.operands == 1);
8510
8511 return !(i.prefix[REX_PREFIX] & REX_W)
8512 && (code16 ? i.tm.operand_types[0].bitfield.disp32
8513 || i.tm.operand_types[0].bitfield.disp32s
8514 : i.tm.operand_types[0].bitfield.disp16)
8515 ? CODE16 : 0;
8516 }
8517
8518 static void
8519 output_branch (void)
8520 {
8521 char *p;
8522 int size;
8523 int code16;
8524 int prefix;
8525 relax_substateT subtype;
8526 symbolS *sym;
8527 offsetT off;
8528
8529 if (now_seg == absolute_section)
8530 {
8531 as_bad (_("relaxable branches not supported in absolute section"));
8532 return;
8533 }
8534
8535 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
8536 size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
8537
8538 prefix = 0;
8539 if (i.prefix[DATA_PREFIX] != 0)
8540 {
8541 prefix = 1;
8542 i.prefixes -= 1;
8543       code16 ^= flip_code16 (code16);
8544 }
8545 /* Pentium4 branch hints. */
8546 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8547 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8548 {
8549 prefix++;
8550 i.prefixes--;
8551 }
8552 if (i.prefix[REX_PREFIX] != 0)
8553 {
8554 prefix++;
8555 i.prefixes--;
8556 }
8557
8558 /* BND prefixed jump. */
8559 if (i.prefix[BND_PREFIX] != 0)
8560 {
8561 prefix++;
8562 i.prefixes--;
8563 }
8564
8565 if (i.prefixes != 0)
8566 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8567
8568   /* It's always a symbol; end frag & set up for relax.
8569 Make sure there is enough room in this frag for the largest
8570 instruction we may generate in md_convert_frag. This is 2
8571 bytes for the opcode and room for the prefix and largest
8572 displacement. */
8573 frag_grow (prefix + 2 + 4);
8574 /* Prefix and 1 opcode byte go in fr_fix. */
8575 p = frag_more (prefix + 1);
8576 if (i.prefix[DATA_PREFIX] != 0)
8577 *p++ = DATA_PREFIX_OPCODE;
8578 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
8579 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
8580 *p++ = i.prefix[SEG_PREFIX];
8581 if (i.prefix[BND_PREFIX] != 0)
8582 *p++ = BND_PREFIX_OPCODE;
8583 if (i.prefix[REX_PREFIX] != 0)
8584 *p++ = i.prefix[REX_PREFIX];
8585 *p = i.tm.base_opcode;
8586
8587 if ((unsigned char) *p == JUMP_PC_RELATIVE)
8588 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
8589 else if (cpu_arch_flags.bitfield.cpui386)
8590 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
8591 else
8592 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
8593 subtype |= code16;
8594
8595 sym = i.op[0].disps->X_add_symbol;
8596 off = i.op[0].disps->X_add_number;
8597
8598 if (i.op[0].disps->X_op != O_constant
8599 && i.op[0].disps->X_op != O_symbol)
8600 {
8601 /* Handle complex expressions. */
8602 sym = make_expr_symbol (i.op[0].disps);
8603 off = 0;
8604 }
8605
8606 /* 1 possible extra opcode + 4 byte displacement go in var part.
8607 Pass reloc in fr_var. */
8608 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
8609 }
8610
8611 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8612 /* Return TRUE iff PLT32 relocation should be used for branching to
8613 symbol S. */
8614
8615 static bfd_boolean
8616 need_plt32_p (symbolS *s)
8617 {
8618 /* PLT32 relocation is ELF only. */
8619 if (!IS_ELF)
8620 return FALSE;
8621
8622 #ifdef TE_SOLARIS
8623 /* Don't emit PLT32 relocation on Solaris: neither native linker nor
8624 krtld support it. */
8625 return FALSE;
8626 #endif
8627
8628   /* Since there is no need to prepare for a PLT branch on x86-64, we
8629      can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
8630      be used as a marker for 32-bit PC-relative branches. */
8631 if (!object_64bit)
8632 return FALSE;
8633
8634 if (s == NULL)
8635 return FALSE;
8636
8637   /* Weak or undefined symbols need a PLT32 relocation. */
8638 if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
8639 return TRUE;
8640
8641   /* A non-global symbol doesn't need a PLT32 relocation. */
8642 if (! S_IS_EXTERNAL (s))
8643 return FALSE;
8644
8645   /* Other global symbols need a PLT32 relocation. NB: Symbols with
8646      non-default visibility are treated as normal global symbols
8647      so that the PLT32 relocation can be used as a marker for 32-bit
8648      PC-relative branches. It is useful for linker relaxation. */
8649 return TRUE;
8650 }
8651 #endif
8652
8653 static void
8654 output_jump (void)
8655 {
8656 char *p;
8657 int size;
8658 fixS *fixP;
8659 bfd_reloc_code_real_type jump_reloc = i.reloc[0];
8660
8661 if (i.tm.opcode_modifier.jump == JUMP_BYTE)
8662 {
8663 /* This is a loop or jecxz type instruction. */
8664 size = 1;
8665 if (i.prefix[ADDR_PREFIX] != 0)
8666 {
8667 frag_opcode_byte (ADDR_PREFIX_OPCODE);
8668 i.prefixes -= 1;
8669 }
8670 /* Pentium4 branch hints. */
8671 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8672 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8673 {
8674 frag_opcode_byte (i.prefix[SEG_PREFIX]);
8675 i.prefixes--;
8676 }
8677 }
8678 else
8679 {
8680 int code16;
8681
8682 code16 = 0;
8683 if (flag_code == CODE_16BIT)
8684 code16 = CODE16;
8685
8686 if (i.prefix[DATA_PREFIX] != 0)
8687 {
8688 frag_opcode_byte (DATA_PREFIX_OPCODE);
8689 i.prefixes -= 1;
8690 	  code16 ^= flip_code16 (code16);
8691 }
8692
8693 size = 4;
8694 if (code16)
8695 size = 2;
8696 }
8697
8698 /* BND prefixed jump. */
8699 if (i.prefix[BND_PREFIX] != 0)
8700 {
8701 frag_opcode_byte (i.prefix[BND_PREFIX]);
8702 i.prefixes -= 1;
8703 }
8704
8705 if (i.prefix[REX_PREFIX] != 0)
8706 {
8707 frag_opcode_byte (i.prefix[REX_PREFIX]);
8708 i.prefixes -= 1;
8709 }
8710
8711 if (i.prefixes != 0)
8712 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8713
8714 if (now_seg == absolute_section)
8715 {
8716 abs_section_offset += i.tm.opcode_length + size;
8717 return;
8718 }
8719
8720 p = frag_more (i.tm.opcode_length + size);
8721 switch (i.tm.opcode_length)
8722 {
8723 case 2:
8724 *p++ = i.tm.base_opcode >> 8;
8725 /* Fall through. */
8726 case 1:
8727 *p++ = i.tm.base_opcode;
8728 break;
8729 default:
8730 abort ();
8731 }
8732
8733 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8734 if (size == 4
8735 && jump_reloc == NO_RELOC
8736 && need_plt32_p (i.op[0].disps->X_add_symbol))
8737 jump_reloc = BFD_RELOC_X86_64_PLT32;
8738 #endif
8739
8740 jump_reloc = reloc (size, 1, 1, jump_reloc);
8741
8742 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8743 i.op[0].disps, 1, jump_reloc);
8744
8745 /* All jumps handled here are signed, but don't use a signed limit
8746 check for 32 and 16 bit jumps as we want to allow wrap around at
8747 4G and 64k respectively. */
8748 if (size == 1)
8749 fixP->fx_signed = 1;
8750 }
8751
8752 static void
8753 output_interseg_jump (void)
8754 {
8755 char *p;
8756 int size;
8757 int prefix;
8758 int code16;
8759
8760 code16 = 0;
8761 if (flag_code == CODE_16BIT)
8762 code16 = CODE16;
8763
8764 prefix = 0;
8765 if (i.prefix[DATA_PREFIX] != 0)
8766 {
8767 prefix = 1;
8768 i.prefixes -= 1;
8769 code16 ^= CODE16;
8770 }
8771
8772 gas_assert (!i.prefix[REX_PREFIX]);
8773
8774 size = 4;
8775 if (code16)
8776 size = 2;
8777
8778 if (i.prefixes != 0)
8779 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8780
8781 if (now_seg == absolute_section)
8782 {
8783 abs_section_offset += prefix + 1 + 2 + size;
8784 return;
8785 }
8786
8787 /* 1 opcode; 2 segment; offset */
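  /* Illustrative (assumed) example: in 32-bit code "ljmp $0x8,$0x1000"
     emits ea 00 10 00 00 08 00 -- opcode, 4-byte offset, then the
     2-byte selector, matching the layout below.  */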
8788 p = frag_more (prefix + 1 + 2 + size);
8789
8790 if (i.prefix[DATA_PREFIX] != 0)
8791 *p++ = DATA_PREFIX_OPCODE;
8792
8793 if (i.prefix[REX_PREFIX] != 0)
8794 *p++ = i.prefix[REX_PREFIX];
8795
8796 *p++ = i.tm.base_opcode;
8797 if (i.op[1].imms->X_op == O_constant)
8798 {
8799 offsetT n = i.op[1].imms->X_add_number;
8800
8801 if (size == 2
8802 && !fits_in_unsigned_word (n)
8803 && !fits_in_signed_word (n))
8804 {
8805 as_bad (_("16-bit jump out of range"));
8806 return;
8807 }
8808 md_number_to_chars (p, n, size);
8809 }
8810 else
8811 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8812 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
8813
8814 p += size;
8815 if (i.op[0].imms->X_op == O_constant)
8816 md_number_to_chars (p, (valueT) i.op[0].imms->X_add_number, 2);
8817 else
8818 fix_new_exp (frag_now, p - frag_now->fr_literal, 2,
8819 i.op[0].imms, 0, reloc (2, 0, 0, i.reloc[0]));
8820 }
8821
8822 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8823 void
8824 x86_cleanup (void)
8825 {
8826 char *p;
8827 asection *seg = now_seg;
8828 subsegT subseg = now_subseg;
8829 asection *sec;
8830 unsigned int alignment, align_size_1;
8831 unsigned int isa_1_descsz, feature_2_descsz, descsz;
8832 unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8833 unsigned int padding;
8834
8835 if (!IS_ELF || !x86_used_note)
8836 return;
8837
8838 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8839
8840 /* The .note.gnu.property section layout:
8841
8842 Field Length Contents
8843 ---- ---- ----
8844 n_namsz 4 4
8845 n_descsz 4 The note descriptor size
8846 n_type 4 NT_GNU_PROPERTY_TYPE_0
8847 n_name 4 "GNU"
8848 n_desc n_descsz The program property array
8849 .... .... ....
8850 */
8851
8852 /* Create the .note.gnu.property section. */
8853 sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
8854 bfd_set_section_flags (sec,
8855 (SEC_ALLOC
8856 | SEC_LOAD
8857 | SEC_DATA
8858 | SEC_HAS_CONTENTS
8859 | SEC_READONLY));
8860
8861 if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8862 {
8863 align_size_1 = 7;
8864 alignment = 3;
8865 }
8866 else
8867 {
8868 align_size_1 = 3;
8869 alignment = 2;
8870 }
8871
8872 bfd_set_section_alignment (sec, alignment);
8873 elf_section_type (sec) = SHT_NOTE;
8874
8875 /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8876 + 4-byte data */
8877 isa_1_descsz_raw = 4 + 4 + 4;
8878 /* Align GNU_PROPERTY_X86_ISA_1_USED. */
8879 isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8880
8881 feature_2_descsz_raw = isa_1_descsz;
8882 /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8883 + 4-byte data */
8884 feature_2_descsz_raw += 4 + 4 + 4;
8885 /* Align GNU_PROPERTY_X86_FEATURE_2_USED. */
8886 feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8887 & ~align_size_1);
8888
8889 descsz = feature_2_descsz;
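  /* Worked example under the ELFCLASS64 assumption (align_size_1 == 7):
     each property is 4 + 4 + 4 == 12 bytes raw and pads to 16, so
     isa_1_descsz == 16, feature_2_descsz == 32 (16 + 12 rounded up to a
     multiple of 8), and the note is 16 bytes of header plus descsz.  */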
8890   /* Section size: n_namsz + n_descsz + n_type + n_name + n_desc. */
8891 p = frag_more (4 + 4 + 4 + 4 + descsz);
8892
8893 /* Write n_namsz. */
8894 md_number_to_chars (p, (valueT) 4, 4);
8895
8896 /* Write n_descsz. */
8897 md_number_to_chars (p + 4, (valueT) descsz, 4);
8898
8899 /* Write n_type. */
8900 md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8901
8902 /* Write n_name. */
8903 memcpy (p + 4 * 3, "GNU", 4);
8904
8905 /* Write 4-byte type. */
8906 md_number_to_chars (p + 4 * 4,
8907 (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8908
8909 /* Write 4-byte data size. */
8910 md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8911
8912 /* Write 4-byte data. */
8913 md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8914
8915   /* Zero out padding. */
8916 padding = isa_1_descsz - isa_1_descsz_raw;
8917 if (padding)
8918 memset (p + 4 * 7, 0, padding);
8919
8920 /* Write 4-byte type. */
8921 md_number_to_chars (p + isa_1_descsz + 4 * 4,
8922 (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8923
8924 /* Write 4-byte data size. */
8925 md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8926
8927 /* Write 4-byte data. */
8928 md_number_to_chars (p + isa_1_descsz + 4 * 6,
8929 (valueT) x86_feature_2_used, 4);
8930
8931   /* Zero out padding. */
8932 padding = feature_2_descsz - feature_2_descsz_raw;
8933 if (padding)
8934 memset (p + isa_1_descsz + 4 * 7, 0, padding);
8935
8936 /* We probably can't restore the current segment, for there likely
8937 isn't one yet... */
8938 if (seg && subseg)
8939 subseg_set (seg, subseg);
8940 }
8941 #endif
8942
8943 static unsigned int
8944 encoding_length (const fragS *start_frag, offsetT start_off,
8945 const char *frag_now_ptr)
8946 {
8947 unsigned int len = 0;
8948
8949 if (start_frag != frag_now)
8950 {
8951 const fragS *fr = start_frag;
8952
8953 do {
8954 len += fr->fr_fix;
8955 fr = fr->fr_next;
8956 } while (fr && fr != frag_now);
8957 }
8958
8959 return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8960 }
8961
8962 /* Return 1 for test, and, cmp, add, sub, inc and dec which may
8963 be macro-fused with conditional jumps.
8964    NB: If TEST/AND/CMP/ADD/SUB/INC/DEC uses a RIP-relative address,
8965    or has one of the following formats:
8966
8967 cmp m, imm
8968 add m, imm
8969 sub m, imm
8970 test m, imm
8971 and m, imm
8972 inc m
8973 dec m
8974
8975    it is not fusible. */
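/* For illustration (assumed examples): "cmp %rax,%rbx; jne label" is a
   candidate for macro-fusion, while "cmpl $1,(%rax); jne label" matches
   the "cmp m, imm" pattern above and is not.  */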
8976
8977 static int
8978 maybe_fused_with_jcc_p (enum mf_cmp_kind* mf_cmp_p)
8979 {
8980 /* No RIP address. */
8981 if (i.base_reg && i.base_reg->reg_num == RegIP)
8982 return 0;
8983
8984 /* No VEX/EVEX encoding. */
8985 if (is_any_vex_encoding (&i.tm))
8986 return 0;
8987
8988 /* add, sub without add/sub m, imm. */
8989 if (i.tm.base_opcode <= 5
8990 || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
8991 || ((i.tm.base_opcode | 3) == 0x83
8992 && (i.tm.extension_opcode == 0x5
8993 || i.tm.extension_opcode == 0x0)))
8994 {
8995 *mf_cmp_p = mf_cmp_alu_cmp;
8996 return !(i.mem_operands && i.imm_operands);
8997 }
8998
8999 /* and without and m, imm. */
9000 if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
9001 || ((i.tm.base_opcode | 3) == 0x83
9002 && i.tm.extension_opcode == 0x4))
9003 {
9004 *mf_cmp_p = mf_cmp_test_and;
9005 return !(i.mem_operands && i.imm_operands);
9006 }
9007
9008 /* test without test m imm. */
9009 if ((i.tm.base_opcode | 1) == 0x85
9010 || (i.tm.base_opcode | 1) == 0xa9
9011 || ((i.tm.base_opcode | 1) == 0xf7
9012 && i.tm.extension_opcode == 0))
9013 {
9014 *mf_cmp_p = mf_cmp_test_and;
9015 return !(i.mem_operands && i.imm_operands);
9016 }
9017
9018 /* cmp without cmp m, imm. */
9019 if ((i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
9020 || ((i.tm.base_opcode | 3) == 0x83
9021 && (i.tm.extension_opcode == 0x7)))
9022 {
9023 *mf_cmp_p = mf_cmp_alu_cmp;
9024 return !(i.mem_operands && i.imm_operands);
9025 }
9026
9027 /* inc, dec without inc/dec m. */
9028 if ((i.tm.cpu_flags.bitfield.cpuno64
9029 && (i.tm.base_opcode | 0xf) == 0x4f)
9030 || ((i.tm.base_opcode | 1) == 0xff
9031 && i.tm.extension_opcode <= 0x1))
9032 {
9033 *mf_cmp_p = mf_cmp_incdec;
9034 return !i.mem_operands;
9035 }
9036
9037 return 0;
9038 }
9039
9040 /* Return 1 if a FUSED_JCC_PADDING frag should be generated. */
9041
9042 static int
9043 add_fused_jcc_padding_frag_p (enum mf_cmp_kind* mf_cmp_p)
9044 {
9045   /* NB: This doesn't work with COND_JUMP86 without i386. */
9046 if (!align_branch_power
9047 || now_seg == absolute_section
9048 || !cpu_arch_flags.bitfield.cpui386
9049 || !(align_branch & align_branch_fused_bit))
9050 return 0;
9051
9052 if (maybe_fused_with_jcc_p (mf_cmp_p))
9053 {
9054 if (last_insn.kind == last_insn_other
9055 || last_insn.seg != now_seg)
9056 return 1;
9057 if (flag_debug)
9058 as_warn_where (last_insn.file, last_insn.line,
9059 _("`%s` skips -malign-branch-boundary on `%s`"),
9060 last_insn.name, i.tm.name);
9061 }
9062
9063 return 0;
9064 }
9065
9066 /* Return 1 if a BRANCH_PREFIX frag should be generated. */
9067
9068 static int
9069 add_branch_prefix_frag_p (void)
9070 {
9071   /* NB: This doesn't work with COND_JUMP86 without i386. Don't add a
9072      prefix to PadLock instructions since they include prefixes in the opcode. */
9073 if (!align_branch_power
9074 || !align_branch_prefix_size
9075 || now_seg == absolute_section
9076 || i.tm.cpu_flags.bitfield.cpupadlock
9077 || !cpu_arch_flags.bitfield.cpui386)
9078 return 0;
9079
9080   /* Don't add a prefix if the insn itself is a prefix, or if there is
9081      no operand, in case the segment prefix is special. */
9082 if (!i.operands || i.tm.opcode_modifier.isprefix)
9083 return 0;
9084
9085 if (last_insn.kind == last_insn_other
9086 || last_insn.seg != now_seg)
9087 return 1;
9088
9089 if (flag_debug)
9090 as_warn_where (last_insn.file, last_insn.line,
9091 _("`%s` skips -malign-branch-boundary on `%s`"),
9092 last_insn.name, i.tm.name);
9093
9094 return 0;
9095 }
9096
9097 /* Return 1 if a BRANCH_PADDING frag should be generated. */
9098
9099 static int
9100 add_branch_padding_frag_p (enum align_branch_kind *branch_p,
9101 enum mf_jcc_kind *mf_jcc_p)
9102 {
9103 int add_padding;
9104
9105   /* NB: This doesn't work with COND_JUMP86 without i386. */
9106 if (!align_branch_power
9107 || now_seg == absolute_section
9108 || !cpu_arch_flags.bitfield.cpui386)
9109 return 0;
9110
9111 add_padding = 0;
9112
9113 /* Check for jcc and direct jmp. */
9114 if (i.tm.opcode_modifier.jump == JUMP)
9115 {
9116 if (i.tm.base_opcode == JUMP_PC_RELATIVE)
9117 {
9118 *branch_p = align_branch_jmp;
9119 add_padding = align_branch & align_branch_jmp_bit;
9120 }
9121 else
9122 {
9123 	  /* Because J<cc> and JN<cc> share the same group in the
9124 	     macro-fusible table, ignore the lowest bit. */
9125 *mf_jcc_p = (i.tm.base_opcode & 0x0e) >> 1;
9126 *branch_p = align_branch_jcc;
9127 if ((align_branch & align_branch_jcc_bit))
9128 add_padding = 1;
9129 }
9130 }
9131 else if (is_any_vex_encoding (&i.tm))
9132 return 0;
9133 else if ((i.tm.base_opcode | 1) == 0xc3)
9134 {
9135 /* Near ret. */
9136 *branch_p = align_branch_ret;
9137 if ((align_branch & align_branch_ret_bit))
9138 add_padding = 1;
9139 }
9140 else
9141 {
9142 /* Check for indirect jmp, direct and indirect calls. */
9143 if (i.tm.base_opcode == 0xe8)
9144 {
9145 /* Direct call. */
9146 *branch_p = align_branch_call;
9147 if ((align_branch & align_branch_call_bit))
9148 add_padding = 1;
9149 }
9150 else if (i.tm.base_opcode == 0xff
9151 && (i.tm.extension_opcode == 2
9152 || i.tm.extension_opcode == 4))
9153 {
9154 /* Indirect call and jmp. */
9155 *branch_p = align_branch_indirect;
9156 if ((align_branch & align_branch_indirect_bit))
9157 add_padding = 1;
9158 }
9159
9160 if (add_padding
9161 && i.disp_operands
9162 && tls_get_addr
9163 && (i.op[0].disps->X_op == O_symbol
9164 || (i.op[0].disps->X_op == O_subtract
9165 && i.op[0].disps->X_op_symbol == GOT_symbol)))
9166 {
9167 symbolS *s = i.op[0].disps->X_add_symbol;
9168 /* No padding to call to global or undefined tls_get_addr. */
9169 if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
9170 && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
9171 return 0;
9172 }
9173 }
9174
9175 if (add_padding
9176 && last_insn.kind != last_insn_other
9177 && last_insn.seg == now_seg)
9178 {
9179 if (flag_debug)
9180 as_warn_where (last_insn.file, last_insn.line,
9181 _("`%s` skips -malign-branch-boundary on `%s`"),
9182 last_insn.name, i.tm.name);
9183 return 0;
9184 }
9185
9186 return add_padding;
9187 }
9188
9189 static void
9190 output_insn (void)
9191 {
9192 fragS *insn_start_frag;
9193 offsetT insn_start_off;
9194 fragS *fragP = NULL;
9195 enum align_branch_kind branch = align_branch_none;
9196   /* The initializer is arbitrary, just to avoid an uninitialized-use
9197      warning. It's actually either assigned in add_branch_padding_frag_p
9198      or never used. */
9199 enum mf_jcc_kind mf_jcc = mf_jcc_jo;
9200
9201 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9202 if (IS_ELF && x86_used_note && now_seg != absolute_section)
9203 {
9204 if ((i.xstate & xstate_tmm) == xstate_tmm
9205 || i.tm.cpu_flags.bitfield.cpuamx_tile)
9206 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_TMM;
9207
9208 if (i.tm.cpu_flags.bitfield.cpu8087
9209 || i.tm.cpu_flags.bitfield.cpu287
9210 || i.tm.cpu_flags.bitfield.cpu387
9211 || i.tm.cpu_flags.bitfield.cpu687
9212 || i.tm.cpu_flags.bitfield.cpufisttp)
9213 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
9214
9215 if ((i.xstate & xstate_mmx)
9216 || i.tm.base_opcode == 0xf77 /* emms */
9217 || i.tm.base_opcode == 0xf0e /* femms */)
9218 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
9219
9220 if (i.index_reg)
9221 {
9222 if (i.index_reg->reg_type.bitfield.zmmword)
9223 i.xstate |= xstate_zmm;
9224 else if (i.index_reg->reg_type.bitfield.ymmword)
9225 i.xstate |= xstate_ymm;
9226 else if (i.index_reg->reg_type.bitfield.xmmword)
9227 i.xstate |= xstate_xmm;
9228 }
9229
9230 /* vzeroall / vzeroupper */
9231 if (i.tm.base_opcode == 0x77 && i.tm.cpu_flags.bitfield.cpuavx)
9232 i.xstate |= xstate_ymm;
9233
9234 if ((i.xstate & xstate_xmm)
9235 /* ldmxcsr / stmxcsr */
9236 || (i.tm.base_opcode == 0xfae && i.tm.cpu_flags.bitfield.cpusse)
9237 /* vldmxcsr / vstmxcsr */
9238 || (i.tm.base_opcode == 0xae && i.tm.cpu_flags.bitfield.cpuavx)
9239 || i.tm.cpu_flags.bitfield.cpuwidekl
9240 || i.tm.cpu_flags.bitfield.cpukl)
9241 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
9242
9243 if ((i.xstate & xstate_ymm) == xstate_ymm)
9244 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
9245 if ((i.xstate & xstate_zmm) == xstate_zmm)
9246 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
9247 if (i.mask || (i.xstate & xstate_mask) == xstate_mask)
9248 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MASK;
9249 if (i.tm.cpu_flags.bitfield.cpufxsr)
9250 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
9251 if (i.tm.cpu_flags.bitfield.cpuxsave)
9252 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
9253 if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
9254 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
9255 if (i.tm.cpu_flags.bitfield.cpuxsavec)
9256 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
9257
9258 if (x86_feature_2_used
9259 || i.tm.cpu_flags.bitfield.cpucmov
9260 || i.tm.cpu_flags.bitfield.cpusyscall
9261 || (i.tm.base_opcode == 0xfc7
9262 && i.tm.opcode_modifier.opcodeprefix == 0
9263 && i.tm.extension_opcode == 1) /* cmpxchg8b */)
9264 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_BASELINE;
9265 if (i.tm.cpu_flags.bitfield.cpusse3
9266 || i.tm.cpu_flags.bitfield.cpussse3
9267 || i.tm.cpu_flags.bitfield.cpusse4_1
9268 || i.tm.cpu_flags.bitfield.cpusse4_2
9269 || i.tm.cpu_flags.bitfield.cpucx16
9270 || i.tm.cpu_flags.bitfield.cpupopcnt
9271 /* LAHF-SAHF insns in 64-bit mode. */
9272 || (flag_code == CODE_64BIT
9273 && (i.tm.base_opcode | 1) == 0x9f))
9274 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_V2;
9275 if (i.tm.cpu_flags.bitfield.cpuavx
9276 || i.tm.cpu_flags.bitfield.cpuavx2
9277 	  /* Any VEX encoded insns except for CpuAVX512F, CpuAVX512BW,
9278 	     CpuAVX512DQ, LWP, TBM and AMX. */
9279 || (i.tm.opcode_modifier.vex
9280 && !i.tm.cpu_flags.bitfield.cpuavx512f
9281 && !i.tm.cpu_flags.bitfield.cpuavx512bw
9282 && !i.tm.cpu_flags.bitfield.cpuavx512dq
9283 && !i.tm.cpu_flags.bitfield.cpulwp
9284 && !i.tm.cpu_flags.bitfield.cputbm
9285 && !(x86_feature_2_used & GNU_PROPERTY_X86_FEATURE_2_TMM))
9286 || i.tm.cpu_flags.bitfield.cpuf16c
9287 || i.tm.cpu_flags.bitfield.cpufma
9288 || i.tm.cpu_flags.bitfield.cpulzcnt
9289 || i.tm.cpu_flags.bitfield.cpumovbe
9290 || i.tm.cpu_flags.bitfield.cpuxsaves
9291 || (x86_feature_2_used
9292 & (GNU_PROPERTY_X86_FEATURE_2_XSAVE
9293 | GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT
9294 | GNU_PROPERTY_X86_FEATURE_2_XSAVEC)) != 0)
9295 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_V3;
9296 if (i.tm.cpu_flags.bitfield.cpuavx512f
9297 || i.tm.cpu_flags.bitfield.cpuavx512bw
9298 || i.tm.cpu_flags.bitfield.cpuavx512dq
9299 || i.tm.cpu_flags.bitfield.cpuavx512vl
9300 /* Any EVEX encoded insns except for AVX512ER, AVX512PF and
9301 VNNIW. */
9302 || (i.tm.opcode_modifier.evex
9303 && !i.tm.cpu_flags.bitfield.cpuavx512er
9304 && !i.tm.cpu_flags.bitfield.cpuavx512pf
9305 && !i.tm.cpu_flags.bitfield.cpuavx512_4vnniw))
9306 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_V4;
9307 }
9308 #endif
9309
9310 /* Tie dwarf2 debug info to the address at the start of the insn.
9311 We can't do this after the insn has been output as the current
9312      frag may have been closed off, e.g. by frag_var. */
9313 dwarf2_emit_insn (0);
9314
9315 insn_start_frag = frag_now;
9316 insn_start_off = frag_now_fix ();
9317
9318 if (add_branch_padding_frag_p (&branch, &mf_jcc))
9319 {
9320 char *p;
9321 /* Branch can be 8 bytes. Leave some room for prefixes. */
9322 unsigned int max_branch_padding_size = 14;
9323
9324 /* Align section to boundary. */
9325 record_alignment (now_seg, align_branch_power);
9326
9327 /* Make room for padding. */
9328 frag_grow (max_branch_padding_size);
9329
9330 /* Start of the padding. */
9331 p = frag_more (0);
9332
9333 fragP = frag_now;
9334
9335 frag_var (rs_machine_dependent, max_branch_padding_size, 0,
9336 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
9337 NULL, 0, p);
9338
9339 fragP->tc_frag_data.mf_type = mf_jcc;
9340 fragP->tc_frag_data.branch_type = branch;
9341 fragP->tc_frag_data.max_bytes = max_branch_padding_size;
9342 }
9343
9344 /* Output jumps. */
9345 if (i.tm.opcode_modifier.jump == JUMP)
9346 output_branch ();
9347 else if (i.tm.opcode_modifier.jump == JUMP_BYTE
9348 || i.tm.opcode_modifier.jump == JUMP_DWORD)
9349 output_jump ();
9350 else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
9351 output_interseg_jump ();
9352 else
9353 {
9354 /* Output normal instructions here. */
9355 char *p;
9356 unsigned char *q;
9357 unsigned int j;
9358 enum mf_cmp_kind mf_cmp;
9359
9360 if (avoid_fence
9361 && (i.tm.base_opcode == 0xfaee8
9362 || i.tm.base_opcode == 0xfaef0
9363 || i.tm.base_opcode == 0xfaef8))
9364 {
9365 /* Encode lfence, mfence, and sfence as
9366 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
9367 if (now_seg != absolute_section)
9368 {
9369 offsetT val = 0x240483f0ULL;
9370
9371 p = frag_more (5);
9372 md_number_to_chars (p, val, 5);
9373 }
9374 else
9375 abs_section_offset += 5;
9376 return;
9377 }
9378
9379       /* Some processors fail on the LOCK prefix. This option makes the
9380 	 assembler ignore the LOCK prefix and serves as a workaround. */
9381 if (omit_lock_prefix)
9382 {
9383 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
9384 return;
9385 i.prefix[LOCK_PREFIX] = 0;
9386 }
9387
9388 if (branch)
9389 /* Skip if this is a branch. */
9390 ;
9391 else if (add_fused_jcc_padding_frag_p (&mf_cmp))
9392 {
9393 /* Make room for padding. */
9394 frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
9395 p = frag_more (0);
9396
9397 fragP = frag_now;
9398
9399 frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
9400 ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
9401 NULL, 0, p);
9402
9403 fragP->tc_frag_data.mf_type = mf_cmp;
9404 fragP->tc_frag_data.branch_type = align_branch_fused;
9405 fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
9406 }
9407 else if (add_branch_prefix_frag_p ())
9408 {
9409 unsigned int max_prefix_size = align_branch_prefix_size;
9410
9411 /* Make room for padding. */
9412 frag_grow (max_prefix_size);
9413 p = frag_more (0);
9414
9415 fragP = frag_now;
9416
9417 frag_var (rs_machine_dependent, max_prefix_size, 0,
9418 ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
9419 NULL, 0, p);
9420
9421 fragP->tc_frag_data.max_bytes = max_prefix_size;
9422 }
9423
9424 /* Since the VEX/EVEX prefix contains the implicit prefix, we
9425 don't need the explicit prefix. */
9426 if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
9427 {
9428 switch (i.tm.opcode_modifier.opcodeprefix)
9429 {
9430 case PREFIX_0X66:
9431 add_prefix (0x66);
9432 break;
9433 case PREFIX_0XF2:
9434 add_prefix (0xf2);
9435 break;
9436 case PREFIX_0XF3:
9437 if (!i.tm.cpu_flags.bitfield.cpupadlock
9438 || (i.prefix[REP_PREFIX] != 0xf3))
9439 add_prefix (0xf3);
9440 break;
9441 case PREFIX_NONE:
9442 switch (i.tm.opcode_length)
9443 {
9444 case 3:
9445 case 2:
9446 case 1:
9447 break;
9448 case 0:
9449 /* Check for pseudo prefixes. */
9450 as_bad_where (insn_start_frag->fr_file,
9451 insn_start_frag->fr_line,
9452 _("pseudo prefix without instruction"));
9453 return;
9454 default:
9455 abort ();
9456 }
9457 break;
9458 default:
9459 abort ();
9460 }
9461
9462 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
9463 /* For x32, add a dummy REX_OPCODE prefix for mov/add with
9464 R_X86_64_GOTTPOFF relocation so that linker can safely
9465 perform IE->LE optimization. A dummy REX_OPCODE prefix
9466 is also needed for lea with R_X86_64_GOTPC32_TLSDESC
9467 relocation for GDesc -> IE/LE optimization. */
9468 if (x86_elf_abi == X86_64_X32_ABI
9469 && i.operands == 2
9470 && (i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
9471 || i.reloc[0] == BFD_RELOC_X86_64_GOTPC32_TLSDESC)
9472 && i.prefix[REX_PREFIX] == 0)
9473 add_prefix (REX_OPCODE);
9474 #endif
9475
9476 /* The prefix bytes. */
9477 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
9478 if (*q)
9479 frag_opcode_byte (*q);
9480 }
9481 else
9482 {
9483 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
9484 if (*q)
9485 switch (j)
9486 {
9487 case SEG_PREFIX:
9488 case ADDR_PREFIX:
9489 frag_opcode_byte (*q);
9490 break;
9491 default:
9492 /* There should be no other prefixes for instructions
9493 with VEX prefix. */
9494 abort ();
9495 }
9496
9497 /* For EVEX instructions i.vrex should become 0 after
9498 build_evex_prefix. For VEX instructions upper 16 registers
9499 aren't available, so VREX should be 0. */
9500 if (i.vrex)
9501 abort ();
9502 /* Now the VEX prefix. */
9503 if (now_seg != absolute_section)
9504 {
9505 p = frag_more (i.vex.length);
9506 for (j = 0; j < i.vex.length; j++)
9507 p[j] = i.vex.bytes[j];
9508 }
9509 else
9510 abs_section_offset += i.vex.length;
9511 }
9512
9513 /* Now the opcode; be careful about word order here! */
9514 if (now_seg == absolute_section)
9515 abs_section_offset += i.tm.opcode_length;
9516 else if (i.tm.opcode_length == 1)
9517 {
9518 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
9519 }
9520 else
9521 {
9522 switch (i.tm.opcode_length)
9523 {
9524 case 4:
9525 p = frag_more (4);
9526 *p++ = (i.tm.base_opcode >> 24) & 0xff;
9527 *p++ = (i.tm.base_opcode >> 16) & 0xff;
9528 break;
9529 case 3:
9530 p = frag_more (3);
9531 *p++ = (i.tm.base_opcode >> 16) & 0xff;
9532 break;
9533 case 2:
9534 p = frag_more (2);
9535 break;
9536 default:
9537 abort ();
9538 break;
9539 }
9540
9541 /* Put out high byte first: can't use md_number_to_chars! */
9542 *p++ = (i.tm.base_opcode >> 8) & 0xff;
9543 *p = i.tm.base_opcode & 0xff;
9544 }
9545
9546 /* Now the modrm byte and sib byte (if present). */
9547 if (i.tm.opcode_modifier.modrm)
9548 {
9549 frag_opcode_byte ((i.rm.regmem << 0)
9550 | (i.rm.reg << 3)
9551 | (i.rm.mode << 6));
9552 /* If i.rm.regmem == ESP (4)
9553 && i.rm.mode != (Register mode)
9554 && not 16 bit
9555 ==> need second modrm byte. */
9556 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
9557 && i.rm.mode != 3
9558 && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
9559 frag_opcode_byte ((i.sib.base << 0)
9560 | (i.sib.index << 3)
9561 | (i.sib.scale << 6));
9562 }
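      /* Illustrative (assumed) encoding: "movl %eax, 4(%rbx,%rcx,2)"
	 emits 89 44 4b 04 -- ModRM 0x44 (mode 1, reg 0, regmem 4 ==
	 SIB escape) and SIB 0x4b (scale 1, index 1, base 3), followed
	 by the disp8.  */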
9563
9564 if (i.disp_operands)
9565 output_disp (insn_start_frag, insn_start_off);
9566
9567 if (i.imm_operands)
9568 output_imm (insn_start_frag, insn_start_off);
9569
9570 /*
9571 * frag_now_fix () returning plain abs_section_offset when we're in the
9572 * absolute section, and abs_section_offset not getting updated as data
9573 * gets added to the frag breaks the logic below.
9574 */
9575 if (now_seg != absolute_section)
9576 {
9577 j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
9578 if (j > 15)
9579 as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
9580 j);
9581 else if (fragP)
9582 {
9583 /* NB: Don't add prefix with GOTPC relocation since
9584 output_disp() above depends on the fixed encoding
9585 length. Can't add prefix with TLS relocation since
9586 it breaks TLS linker optimization. */
9587 unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
9588 /* Prefix count on the current instruction. */
9589 unsigned int count = i.vex.length;
9590 unsigned int k;
9591 for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
9592 /* REX byte is encoded in VEX/EVEX prefix. */
9593 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
9594 count++;
9595
9596 /* Count prefixes for extended opcode maps. */
9597 if (!i.vex.length)
9598 switch (i.tm.opcode_length)
9599 {
9600 case 3:
9601 if (((i.tm.base_opcode >> 16) & 0xff) == 0xf)
9602 {
9603 count++;
9604 switch ((i.tm.base_opcode >> 8) & 0xff)
9605 {
9606 case 0x38:
9607 case 0x3a:
9608 count++;
9609 break;
9610 default:
9611 break;
9612 }
9613 }
9614 break;
9615 case 2:
9616 if (((i.tm.base_opcode >> 8) & 0xff) == 0xf)
9617 count++;
9618 break;
9619 case 1:
9620 break;
9621 default:
9622 abort ();
9623 }
9624
9625 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
9626 == BRANCH_PREFIX)
9627 {
9628 /* Set the maximum prefix size in BRANCH_PREFIX
9629 frag. */
9630 if (fragP->tc_frag_data.max_bytes > max)
9631 fragP->tc_frag_data.max_bytes = max;
9632 if (fragP->tc_frag_data.max_bytes > count)
9633 fragP->tc_frag_data.max_bytes -= count;
9634 else
9635 fragP->tc_frag_data.max_bytes = 0;
9636 }
9637 else
9638 {
9639 /* Remember the maximum prefix size in FUSED_JCC_PADDING
9640 frag. */
9641 unsigned int max_prefix_size;
9642 if (align_branch_prefix_size > max)
9643 max_prefix_size = max;
9644 else
9645 max_prefix_size = align_branch_prefix_size;
9646 if (max_prefix_size > count)
9647 fragP->tc_frag_data.max_prefix_length
9648 = max_prefix_size - count;
9649 }
9650
9651 /* Use existing segment prefix if possible. Use CS
9652 segment prefix in 64-bit mode. In 32-bit mode, use SS
9653 segment prefix with ESP/EBP base register and use DS
9654 segment prefix without ESP/EBP base register. */
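/* The prefix bytes in question are 0x2e (CS), 0x36 (SS) and 0x3e
(DS).  In 64-bit mode segment prefixes are ignored for memory
addressing, which makes CS a safe one-byte filler.  */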
9655 if (i.prefix[SEG_PREFIX])
9656 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
9657 else if (flag_code == CODE_64BIT)
9658 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
9659 else if (i.base_reg
9660 && (i.base_reg->reg_num == 4
9661 || i.base_reg->reg_num == 5))
9662 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
9663 else
9664 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
9665 }
9666 }
9667 }
9668
9669 /* NB: Doesn't work with COND_JUMP86 without i386. */
9670 if (align_branch_power
9671 && now_seg != absolute_section
9672 && cpu_arch_flags.bitfield.cpui386)
9673 {
9674 /* Terminate each frag so that we can add prefix and check for
9675 fused jcc. */
9676 frag_wane (frag_now);
9677 frag_new (0);
9678 }
9679
9680 #ifdef DEBUG386
9681 if (flag_debug)
9682 {
9683 pi ("" /*line*/, &i);
9684 }
9685 #endif /* DEBUG386 */
9686 }
9687
9688 /* Return the size of the displacement operand N. */
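/* E.g. the 4 in "movl 4(%ebp), %eax" normally ends up as a Disp8
operand, giving a size of 1; an unannotated 32-bit displacement
gives the default of 4.  */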
9689
9690 static int
9691 disp_size (unsigned int n)
9692 {
9693 int size = 4;
9694
9695 if (i.types[n].bitfield.disp64)
9696 size = 8;
9697 else if (i.types[n].bitfield.disp8)
9698 size = 1;
9699 else if (i.types[n].bitfield.disp16)
9700 size = 2;
9701 return size;
9702 }
9703
9704 /* Return the size of the immediate operand N. */
9705
9706 static int
9707 imm_size (unsigned int n)
9708 {
9709 int size = 4;
9710 if (i.types[n].bitfield.imm64)
9711 size = 8;
9712 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
9713 size = 1;
9714 else if (i.types[n].bitfield.imm16)
9715 size = 2;
9716 return size;
9717 }
9718
9719 static void
9720 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
9721 {
9722 char *p;
9723 unsigned int n;
9724
9725 for (n = 0; n < i.operands; n++)
9726 {
9727 if (operand_type_check (i.types[n], disp))
9728 {
9729 int size = disp_size (n);
9730
9731 if (now_seg == absolute_section)
9732 abs_section_offset += size;
9733 else if (i.op[n].disps->X_op == O_constant)
9734 {
9735 offsetT val = i.op[n].disps->X_add_number;
9736
9737 val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
9738 size);
9739 p = frag_more (size);
9740 md_number_to_chars (p, val, size);
9741 }
9742 else
9743 {
9744 enum bfd_reloc_code_real reloc_type;
9745 int sign = i.types[n].bitfield.disp32s;
9746 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
9747 fixS *fixP;
9748
9749 /* We can't have 8 bit displacement here. */
9750 gas_assert (!i.types[n].bitfield.disp8);
9751
9752 /* The PC relative address is computed relative
9753 to the instruction boundary, so in case immediate
9754 fields follow, we need to adjust the value. */
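/* E.g. for "testl $0x12345678, foo(%rip)" the 4-byte immediate
follows the displacement field, so 4 is subtracted below to make
the displacement relative to the end of the instruction.  */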
9755 if (pcrel && i.imm_operands)
9756 {
9757 unsigned int n1;
9758 int sz = 0;
9759
9760 for (n1 = 0; n1 < i.operands; n1++)
9761 if (operand_type_check (i.types[n1], imm))
9762 {
9763 /* Only one immediate is allowed for PC
9764 relative address. */
9765 gas_assert (sz == 0);
9766 sz = imm_size (n1);
9767 i.op[n].disps->X_add_number -= sz;
9768 }
9769 /* We should find the immediate. */
9770 gas_assert (sz != 0);
9771 }
9772
9773 p = frag_more (size);
9774 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
9775 if (GOT_symbol
9776 && GOT_symbol == i.op[n].disps->X_add_symbol
9777 && (((reloc_type == BFD_RELOC_32
9778 || reloc_type == BFD_RELOC_X86_64_32S
9779 || (reloc_type == BFD_RELOC_64
9780 && object_64bit))
9781 && (i.op[n].disps->X_op == O_symbol
9782 || (i.op[n].disps->X_op == O_add
9783 && ((symbol_get_value_expression
9784 (i.op[n].disps->X_op_symbol)->X_op)
9785 == O_subtract))))
9786 || reloc_type == BFD_RELOC_32_PCREL))
9787 {
9788 if (!object_64bit)
9789 {
9790 reloc_type = BFD_RELOC_386_GOTPC;
9791 i.has_gotpc_tls_reloc = TRUE;
9792 i.op[n].imms->X_add_number +=
9793 encoding_length (insn_start_frag, insn_start_off, p);
9794 }
9795 else if (reloc_type == BFD_RELOC_64)
9796 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9797 else
9798 /* Don't do the adjustment for x86-64, as there
9799 the pcrel addressing is relative to the _next_
9800 insn, and that is taken care of in other code. */
9801 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9802 }
9803 else if (align_branch_power)
9804 {
9805 switch (reloc_type)
9806 {
9807 case BFD_RELOC_386_TLS_GD:
9808 case BFD_RELOC_386_TLS_LDM:
9809 case BFD_RELOC_386_TLS_IE:
9810 case BFD_RELOC_386_TLS_IE_32:
9811 case BFD_RELOC_386_TLS_GOTIE:
9812 case BFD_RELOC_386_TLS_GOTDESC:
9813 case BFD_RELOC_386_TLS_DESC_CALL:
9814 case BFD_RELOC_X86_64_TLSGD:
9815 case BFD_RELOC_X86_64_TLSLD:
9816 case BFD_RELOC_X86_64_GOTTPOFF:
9817 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9818 case BFD_RELOC_X86_64_TLSDESC_CALL:
9819 i.has_gotpc_tls_reloc = TRUE;
9820 default:
9821 break;
9822 }
9823 }
9824 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
9825 size, i.op[n].disps, pcrel,
9826 reloc_type);
9827 /* Check for "call/jmp *mem", "mov mem, %reg",
9828 "test %reg, mem" and "binop mem, %reg" where binop
9829 is one of the adc, add, and, cmp, or, sbb, sub or xor
9830 instructions, without a data prefix. Always generate
9831 R_386_GOT32X for "sym*GOT" operand in 32-bit mode. */
9832 if (i.prefix[DATA_PREFIX] == 0
9833 && (generate_relax_relocations
9834 || (!object_64bit
9835 && i.rm.mode == 0
9836 && i.rm.regmem == 5))
9837 && (i.rm.mode == 2
9838 || (i.rm.mode == 0 && i.rm.regmem == 5))
9839 && !is_any_vex_encoding(&i.tm)
9840 && ((i.operands == 1
9841 && i.tm.base_opcode == 0xff
9842 && (i.rm.reg == 2 || i.rm.reg == 4))
9843 || (i.operands == 2
9844 && (i.tm.base_opcode == 0x8b
9845 || i.tm.base_opcode == 0x85
9846 || (i.tm.base_opcode & ~0x38) == 0x03))))
9847 {
9848 if (object_64bit)
9849 {
9850 fixP->fx_tcbit = i.rex != 0;
9851 if (i.base_reg
9852 && (i.base_reg->reg_num == RegIP))
9853 fixP->fx_tcbit2 = 1;
9854 }
9855 else
9856 fixP->fx_tcbit2 = 1;
9857 }
9858 }
9859 }
9860 }
9861 }
9862
9863 static void
9864 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
9865 {
9866 char *p;
9867 unsigned int n;
9868
9869 for (n = 0; n < i.operands; n++)
9870 {
9871 /* Skip the SAE/RC Imm operand in EVEX. It is already handled. */
9872 if (i.rounding && (int) n == i.rounding->operand)
9873 continue;
9874
9875 if (operand_type_check (i.types[n], imm))
9876 {
9877 int size = imm_size (n);
9878
9879 if (now_seg == absolute_section)
9880 abs_section_offset += size;
9881 else if (i.op[n].imms->X_op == O_constant)
9882 {
9883 offsetT val;
9884
9885 val = offset_in_range (i.op[n].imms->X_add_number,
9886 size);
9887 p = frag_more (size);
9888 md_number_to_chars (p, val, size);
9889 }
9890 else
9891 {
9892 /* Not absolute_section.
9893 Need a 32-bit fixup (don't support 8bit
9894 non-absolute imms). Try to support other
9895 sizes ... */
9896 enum bfd_reloc_code_real reloc_type;
9897 int sign;
9898
9899 if (i.types[n].bitfield.imm32s
9900 && (i.suffix == QWORD_MNEM_SUFFIX
9901 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
9902 sign = 1;
9903 else
9904 sign = 0;
9905
9906 p = frag_more (size);
9907 reloc_type = reloc (size, 0, sign, i.reloc[n]);
9908
9909 /* This is tough to explain. We end up with this one if we
9910 * have operands that look like
9911 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
9912 * obtain the absolute address of the GOT, and it is strongly
9913 * preferable from a performance point of view to avoid using
9914 * a runtime relocation for this. The actual sequence of
9915 * instructions often look something like:
9916 *
9917 * call .L66
9918 * .L66:
9919 * popl %ebx
9920 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
9921 *
9922 * The call and pop essentially return the absolute address
9923 * of the label .L66 and store it in %ebx. The linker itself
9924 * will ultimately change the first operand of the addl so
9925 * that %ebx points to the GOT, but to keep things simple, the
9926 * .o file must have this operand set so that it generates not
9927 * the absolute address of .L66, but the absolute address of
9928 * itself. This allows the linker to simply treat a GOTPC
9929 * relocation as asking for a pcrel offset to the GOT to be
9930 * added in, and the addend of the relocation is stored in the
9931 * operand field for the instruction itself.
9932 *
9933 * Our job here is to fix the operand so that it would add
9934 * the correct offset so that %ebx would point to itself. The
9935 * thing that is tricky is that .-.L66 will point to the
9936 * beginning of the instruction, so we need to further modify
9937 * the operand so that it will point to itself. There are
9938 * other cases where you have something like:
9939 *
9940 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
9941 *
9942 * and here no correction would be required. Internally in
9943 * the assembler we treat operands of this form as not being
9944 * pcrel since the '.' is explicitly mentioned, and I wonder
9945 * whether it would simplify matters to do it this way. Who
9946 * knows. In earlier versions of the PIC patches, the
9947 * pcrel_adjust field was used to store the correction, but
9948 * since the expression is not pcrel, I felt it would be
9949 * confusing to do it this way. */
9950
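/* Illustrative bytes: "addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx"
assembles to 81 c3 <imm32>; the immediate starts 2 bytes into the
instruction, so 2 gets added to the addend below and the operand
then describes the address of the immediate field itself rather
than that of .L66.  */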
9951 if ((reloc_type == BFD_RELOC_32
9952 || reloc_type == BFD_RELOC_X86_64_32S
9953 || reloc_type == BFD_RELOC_64)
9954 && GOT_symbol
9955 && GOT_symbol == i.op[n].imms->X_add_symbol
9956 && (i.op[n].imms->X_op == O_symbol
9957 || (i.op[n].imms->X_op == O_add
9958 && ((symbol_get_value_expression
9959 (i.op[n].imms->X_op_symbol)->X_op)
9960 == O_subtract))))
9961 {
9962 if (!object_64bit)
9963 reloc_type = BFD_RELOC_386_GOTPC;
9964 else if (size == 4)
9965 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9966 else if (size == 8)
9967 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9968 i.has_gotpc_tls_reloc = TRUE;
9969 i.op[n].imms->X_add_number +=
9970 encoding_length (insn_start_frag, insn_start_off, p);
9971 }
9972 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9973 i.op[n].imms, 0, reloc_type);
9974 }
9975 }
9976 }
9977 }
9978 \f
9979 /* x86_cons_fix_new is called via the expression parsing code when a
9980 reloc is needed. We use this hook to get the correct .got reloc. */
9981 static int cons_sign = -1;
9982
9983 void
9984 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
9985 expressionS *exp, bfd_reloc_code_real_type r)
9986 {
9987 r = reloc (len, 0, cons_sign, r);
9988
9989 #ifdef TE_PE
9990 if (exp->X_op == O_secrel)
9991 {
9992 exp->X_op = O_symbol;
9993 r = BFD_RELOC_32_SECREL;
9994 }
9995 #endif
9996
9997 fix_new_exp (frag, off, len, exp, 0, r);
9998 }
9999
10000 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
10001 purpose of the `.dc.a' internal pseudo-op. */
10002
10003 int
10004 x86_address_bytes (void)
10005 {
10006 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
10007 return 4;
10008 return stdoutput->arch_info->bits_per_address / 8;
10009 }
10010
10011 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
10012 || defined (LEX_AT)
10013 # define lex_got(reloc, adjust, types) NULL
10014 #else
10015 /* Parse operands of the form
10016 <symbol>@GOTOFF+<nnn>
10017 and similar .plt or .got references.
10018
10019 If we find one, set up the correct relocation in RELOC and copy the
10020 input string, minus the `@GOTOFF' into a malloc'd buffer for
10021 parsing by the calling routine. Return this buffer, and if ADJUST
10022 is non-null set it to the length of the string we removed from the
10023 input line. Otherwise return NULL. */
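/* For instance, "foo@GOTOFF+4" in 32-bit mode sets
BFD_RELOC_386_GOTOFF, returns the buffer "foo +4" (the reloc
token replaced by a blank) and sets *ADJUST to 6.  */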
10024 static char *
10025 lex_got (enum bfd_reloc_code_real *rel,
10026 int *adjust,
10027 i386_operand_type *types)
10028 {
10029 /* Some of the relocations depend on the size of the field that is
10030 to be relocated. But in our callers i386_immediate and i386_displacement
10031 we don't yet know the operand size (this will be set by insn
10032 matching). Hence we record the word32 relocation here,
10033 and adjust the reloc according to the real size in reloc(). */
10034 static const struct {
10035 const char *str;
10036 int len;
10037 const enum bfd_reloc_code_real rel[2];
10038 const i386_operand_type types64;
10039 bfd_boolean need_GOT_symbol;
10040 } gotrel[] = {
10041 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10042 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
10043 BFD_RELOC_SIZE32 },
10044 OPERAND_TYPE_IMM32_64, FALSE },
10045 #endif
10046 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
10047 BFD_RELOC_X86_64_PLTOFF64 },
10048 OPERAND_TYPE_IMM64, TRUE },
10049 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
10050 BFD_RELOC_X86_64_PLT32 },
10051 OPERAND_TYPE_IMM32_32S_DISP32, FALSE },
10052 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
10053 BFD_RELOC_X86_64_GOTPLT64 },
10054 OPERAND_TYPE_IMM64_DISP64, TRUE },
10055 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
10056 BFD_RELOC_X86_64_GOTOFF64 },
10057 OPERAND_TYPE_IMM64_DISP64, TRUE },
10058 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
10059 BFD_RELOC_X86_64_GOTPCREL },
10060 OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10061 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
10062 BFD_RELOC_X86_64_TLSGD },
10063 OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10064 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
10065 _dummy_first_bfd_reloc_code_real },
10066 OPERAND_TYPE_NONE, TRUE },
10067 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
10068 BFD_RELOC_X86_64_TLSLD },
10069 OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10070 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
10071 BFD_RELOC_X86_64_GOTTPOFF },
10072 OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10073 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
10074 BFD_RELOC_X86_64_TPOFF32 },
10075 OPERAND_TYPE_IMM32_32S_64_DISP32_64, TRUE },
10076 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
10077 _dummy_first_bfd_reloc_code_real },
10078 OPERAND_TYPE_NONE, TRUE },
10079 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
10080 BFD_RELOC_X86_64_DTPOFF32 },
10081 OPERAND_TYPE_IMM32_32S_64_DISP32_64, TRUE },
10082 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
10083 _dummy_first_bfd_reloc_code_real },
10084 OPERAND_TYPE_NONE, TRUE },
10085 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
10086 _dummy_first_bfd_reloc_code_real },
10087 OPERAND_TYPE_NONE, TRUE },
10088 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
10089 BFD_RELOC_X86_64_GOT32 },
10090 OPERAND_TYPE_IMM32_32S_64_DISP32, TRUE },
10091 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
10092 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
10093 OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10094 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
10095 BFD_RELOC_X86_64_TLSDESC_CALL },
10096 OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10097 };
10098 char *cp;
10099 unsigned int j;
10100
10101 #if defined (OBJ_MAYBE_ELF)
10102 if (!IS_ELF)
10103 return NULL;
10104 #endif
10105
10106 for (cp = input_line_pointer; *cp != '@'; cp++)
10107 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
10108 return NULL;
10109
10110 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
10111 {
10112 int len = gotrel[j].len;
10113 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
10114 {
10115 if (gotrel[j].rel[object_64bit] != 0)
10116 {
10117 int first, second;
10118 char *tmpbuf, *past_reloc;
10119
10120 *rel = gotrel[j].rel[object_64bit];
10121
10122 if (types)
10123 {
10124 if (flag_code != CODE_64BIT)
10125 {
10126 types->bitfield.imm32 = 1;
10127 types->bitfield.disp32 = 1;
10128 }
10129 else
10130 *types = gotrel[j].types64;
10131 }
10132
10133 if (gotrel[j].need_GOT_symbol && GOT_symbol == NULL)
10134 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
10135
10136 /* The length of the first part of our input line. */
10137 first = cp - input_line_pointer;
10138
10139 /* The second part goes from after the reloc token until
10140 (and including) an end_of_line char or comma. */
10141 past_reloc = cp + 1 + len;
10142 cp = past_reloc;
10143 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10144 ++cp;
10145 second = cp + 1 - past_reloc;
10146
10147 /* Allocate and copy string. The trailing NUL shouldn't
10148 be necessary, but be safe. */
10149 tmpbuf = XNEWVEC (char, first + second + 2);
10150 memcpy (tmpbuf, input_line_pointer, first);
10151 if (second != 0 && *past_reloc != ' ')
10152 /* Replace the relocation token with ' ', so that
10153 errors like foo@GOTOFF1 will be detected. */
10154 tmpbuf[first++] = ' ';
10155 else
10156 /* Increment length by 1 if the relocation token is
10157 removed. */
10158 len++;
10159 if (adjust)
10160 *adjust = len;
10161 memcpy (tmpbuf + first, past_reloc, second);
10162 tmpbuf[first + second] = '\0';
10163 return tmpbuf;
10164 }
10165
10166 as_bad (_("@%s reloc is not supported with %d-bit output format"),
10167 gotrel[j].str, 1 << (5 + object_64bit));
10168 return NULL;
10169 }
10170 }
10171
10172 /* Might be a symbol version string. Don't as_bad here. */
10173 return NULL;
10174 }
10175 #endif
10176
10177 #ifdef TE_PE
10178 #ifdef lex_got
10179 #undef lex_got
10180 #endif
10181 /* Parse operands of the form
10182 <symbol>@SECREL32+<nnn>
10183
10184 If we find one, set up the correct relocation in RELOC and copy the
10185 input string, minus the `@SECREL32' into a malloc'd buffer for
10186 parsing by the calling routine. Return this buffer, and if ADJUST
10187 is non-null set it to the length of the string we removed from the
10188 input line. Otherwise return NULL.
10189
10190 This function is copied from the ELF version above, adjusted for PE targets. */
10191
10192 static char *
10193 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
10194 int *adjust ATTRIBUTE_UNUSED,
10195 i386_operand_type *types)
10196 {
10197 static const struct
10198 {
10199 const char *str;
10200 int len;
10201 const enum bfd_reloc_code_real rel[2];
10202 const i386_operand_type types64;
10203 }
10204 gotrel[] =
10205 {
10206 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
10207 BFD_RELOC_32_SECREL },
10208 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
10209 };
10210
10211 char *cp;
10212 unsigned j;
10213
10214 for (cp = input_line_pointer; *cp != '@'; cp++)
10215 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
10216 return NULL;
10217
10218 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
10219 {
10220 int len = gotrel[j].len;
10221
10222 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
10223 {
10224 if (gotrel[j].rel[object_64bit] != 0)
10225 {
10226 int first, second;
10227 char *tmpbuf, *past_reloc;
10228
10229 *rel = gotrel[j].rel[object_64bit];
10230 if (adjust)
10231 *adjust = len;
10232
10233 if (types)
10234 {
10235 if (flag_code != CODE_64BIT)
10236 {
10237 types->bitfield.imm32 = 1;
10238 types->bitfield.disp32 = 1;
10239 }
10240 else
10241 *types = gotrel[j].types64;
10242 }
10243
10244 /* The length of the first part of our input line. */
10245 first = cp - input_line_pointer;
10246
10247 /* The second part goes from after the reloc token until
10248 (and including) an end_of_line char or comma. */
10249 past_reloc = cp + 1 + len;
10250 cp = past_reloc;
10251 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10252 ++cp;
10253 second = cp + 1 - past_reloc;
10254
10255 /* Allocate and copy string. The trailing NUL shouldn't
10256 be necessary, but be safe. */
10257 tmpbuf = XNEWVEC (char, first + second + 2);
10258 memcpy (tmpbuf, input_line_pointer, first);
10259 if (second != 0 && *past_reloc != ' ')
10260 /* Replace the relocation token with ' ', so that
10261 errors like foo@SECREL321 will be detected. */
10262 tmpbuf[first++] = ' ';
10263 memcpy (tmpbuf + first, past_reloc, second);
10264 tmpbuf[first + second] = '\0';
10265 return tmpbuf;
10266 }
10267
10268 as_bad (_("@%s reloc is not supported with %d-bit output format"),
10269 gotrel[j].str, 1 << (5 + object_64bit));
10270 return NULL;
10271 }
10272 }
10273
10274 /* Might be a symbol version string. Don't as_bad here. */
10275 return NULL;
10276 }
10277
10278 #endif /* TE_PE */
10279
10280 bfd_reloc_code_real_type
10281 x86_cons (expressionS *exp, int size)
10282 {
10283 bfd_reloc_code_real_type got_reloc = NO_RELOC;
10284
10285 intel_syntax = -intel_syntax;
10286
10287 exp->X_md = 0;
10288 if (size == 4 || (object_64bit && size == 8))
10289 {
10290 /* Handle @GOTOFF and the like in an expression. */
10291 char *save;
10292 char *gotfree_input_line;
10293 int adjust = 0;
10294
10295 save = input_line_pointer;
10296 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
10297 if (gotfree_input_line)
10298 input_line_pointer = gotfree_input_line;
10299
10300 expression (exp);
10301
10302 if (gotfree_input_line)
10303 {
10304 /* expression () has merrily parsed up to the end of line,
10305 or a comma - in the wrong buffer. Transfer how far
10306 input_line_pointer has moved to the right buffer. */
10307 input_line_pointer = (save
10308 + (input_line_pointer - gotfree_input_line)
10309 + adjust);
10310 free (gotfree_input_line);
10311 if (exp->X_op == O_constant
10312 || exp->X_op == O_absent
10313 || exp->X_op == O_illegal
10314 || exp->X_op == O_register
10315 || exp->X_op == O_big)
10316 {
10317 char c = *input_line_pointer;
10318 *input_line_pointer = 0;
10319 as_bad (_("missing or invalid expression `%s'"), save);
10320 *input_line_pointer = c;
10321 }
10322 else if ((got_reloc == BFD_RELOC_386_PLT32
10323 || got_reloc == BFD_RELOC_X86_64_PLT32)
10324 && exp->X_op != O_symbol)
10325 {
10326 char c = *input_line_pointer;
10327 *input_line_pointer = 0;
10328 as_bad (_("invalid PLT expression `%s'"), save);
10329 *input_line_pointer = c;
10330 }
10331 }
10332 }
10333 else
10334 expression (exp);
10335
10336 intel_syntax = -intel_syntax;
10337
10338 if (intel_syntax)
10339 i386_intel_simplify (exp);
10340
10341 return got_reloc;
10342 }
10343
10344 static void
10345 signed_cons (int size)
10346 {
10347 if (flag_code == CODE_64BIT)
10348 cons_sign = 1;
10349 cons (size);
10350 cons_sign = -1;
10351 }
10352
10353 #ifdef TE_PE
10354 static void
10355 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
10356 {
10357 expressionS exp;
10358
10359 do
10360 {
10361 expression (&exp);
10362 if (exp.X_op == O_symbol)
10363 exp.X_op = O_secrel;
10364
10365 emit_expr (&exp, 4);
10366 }
10367 while (*input_line_pointer++ == ',');
10368
10369 input_line_pointer--;
10370 demand_empty_rest_of_line ();
10371 }
10372 #endif
10373
10374 /* Handle Vector operations. */
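/* These are the AVX512-style decorations on an operand, e.g. the
broadcast in "vaddps (%rax){1to16}, %zmm1, %zmm2" or the write
mask plus zeroing in "vmovaps %zmm0, %zmm1{%k1}{z}".  */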
10375
10376 static char *
10377 check_VecOperations (char *op_string, char *op_end)
10378 {
10379 const reg_entry *mask;
10380 const char *saved;
10381 char *end_op;
10382
10383 while (*op_string
10384 && (op_end == NULL || op_string < op_end))
10385 {
10386 saved = op_string;
10387 if (*op_string == '{')
10388 {
10389 op_string++;
10390
10391 /* Check broadcasts. */
10392 if (strncmp (op_string, "1to", 3) == 0)
10393 {
10394 int bcst_type;
10395
10396 if (i.broadcast)
10397 goto duplicated_vec_op;
10398
10399 op_string += 3;
10400 if (*op_string == '8')
10401 bcst_type = 8;
10402 else if (*op_string == '4')
10403 bcst_type = 4;
10404 else if (*op_string == '2')
10405 bcst_type = 2;
10406 else if (*op_string == '1'
10407 && *(op_string+1) == '6')
10408 {
10409 bcst_type = 16;
10410 op_string++;
10411 }
10412 else
10413 {
10414 as_bad (_("Unsupported broadcast: `%s'"), saved);
10415 return NULL;
10416 }
10417 op_string++;
10418
10419 broadcast_op.type = bcst_type;
10420 broadcast_op.operand = this_operand;
10421 broadcast_op.bytes = 0;
10422 i.broadcast = &broadcast_op;
10423 }
10424 /* Check masking operation. */
10425 else if ((mask = parse_register (op_string, &end_op)) != NULL)
10426 {
10427 if (mask == &bad_reg)
10428 return NULL;
10429
10430 /* k0 can't be used for write mask. */
10431 if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
10432 {
10433 as_bad (_("`%s%s' can't be used for write mask"),
10434 register_prefix, mask->reg_name);
10435 return NULL;
10436 }
10437
10438 if (!i.mask)
10439 {
10440 mask_op.mask = mask;
10441 mask_op.zeroing = 0;
10442 mask_op.operand = this_operand;
10443 i.mask = &mask_op;
10444 }
10445 else
10446 {
10447 if (i.mask->mask)
10448 goto duplicated_vec_op;
10449
10450 i.mask->mask = mask;
10451
10452 /* Only "{z}" is allowed here. No need to check
10453 zeroing mask explicitly. */
10454 if (i.mask->operand != this_operand)
10455 {
10456 as_bad (_("invalid write mask `%s'"), saved);
10457 return NULL;
10458 }
10459 }
10460
10461 op_string = end_op;
10462 }
10463 /* Check zeroing-flag for masking operation. */
10464 else if (*op_string == 'z')
10465 {
10466 if (!i.mask)
10467 {
10468 mask_op.mask = NULL;
10469 mask_op.zeroing = 1;
10470 mask_op.operand = this_operand;
10471 i.mask = &mask_op;
10472 }
10473 else
10474 {
10475 if (i.mask->zeroing)
10476 {
10477 duplicated_vec_op:
10478 as_bad (_("duplicated `%s'"), saved);
10479 return NULL;
10480 }
10481
10482 i.mask->zeroing = 1;
10483
10484 /* Only "{%k}" is allowed here. No need to check mask
10485 register explicitly. */
10486 if (i.mask->operand != this_operand)
10487 {
10488 as_bad (_("invalid zeroing-masking `%s'"),
10489 saved);
10490 return NULL;
10491 }
10492 }
10493
10494 op_string++;
10495 }
10496 else
10497 goto unknown_vec_op;
10498
10499 if (*op_string != '}')
10500 {
10501 as_bad (_("missing `}' in `%s'"), saved);
10502 return NULL;
10503 }
10504 op_string++;
10505
10506 /* Strip whitespace since the addition of pseudo prefixes
10507 changed how the scrubber treats '{'. */
10508 if (is_space_char (*op_string))
10509 ++op_string;
10510
10511 continue;
10512 }
10513 unknown_vec_op:
10514 /* We don't know this one. */
10515 as_bad (_("unknown vector operation: `%s'"), saved);
10516 return NULL;
10517 }
10518
10519 if (i.mask && i.mask->zeroing && !i.mask->mask)
10520 {
10521 as_bad (_("zeroing-masking only allowed with write mask"));
10522 return NULL;
10523 }
10524
10525 return op_string;
10526 }
10527
10528 static int
10529 i386_immediate (char *imm_start)
10530 {
10531 char *save_input_line_pointer;
10532 char *gotfree_input_line;
10533 segT exp_seg = 0;
10534 expressionS *exp;
10535 i386_operand_type types;
10536
10537 operand_type_set (&types, ~0);
10538
10539 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
10540 {
10541 as_bad (_("at most %d immediate operands are allowed"),
10542 MAX_IMMEDIATE_OPERANDS);
10543 return 0;
10544 }
10545
10546 exp = &im_expressions[i.imm_operands++];
10547 i.op[this_operand].imms = exp;
10548
10549 if (is_space_char (*imm_start))
10550 ++imm_start;
10551
10552 save_input_line_pointer = input_line_pointer;
10553 input_line_pointer = imm_start;
10554
10555 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10556 if (gotfree_input_line)
10557 input_line_pointer = gotfree_input_line;
10558
10559 exp_seg = expression (exp);
10560
10561 SKIP_WHITESPACE ();
10562
10563 /* Handle vector operations. */
10564 if (*input_line_pointer == '{')
10565 {
10566 input_line_pointer = check_VecOperations (input_line_pointer,
10567 NULL);
10568 if (input_line_pointer == NULL)
10569 return 0;
10570 }
10571
10572 if (*input_line_pointer)
10573 as_bad (_("junk `%s' after expression"), input_line_pointer);
10574
10575 input_line_pointer = save_input_line_pointer;
10576 if (gotfree_input_line)
10577 {
10578 free (gotfree_input_line);
10579
10580 if (exp->X_op == O_constant || exp->X_op == O_register)
10581 exp->X_op = O_illegal;
10582 }
10583
10584 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
10585 }
10586
10587 static int
10588 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10589 i386_operand_type types, const char *imm_start)
10590 {
10591 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
10592 {
10593 if (imm_start)
10594 as_bad (_("missing or invalid immediate expression `%s'"),
10595 imm_start);
10596 return 0;
10597 }
10598 else if (exp->X_op == O_constant)
10599 {
10600 /* Size it properly later. */
10601 i.types[this_operand].bitfield.imm64 = 1;
10602 /* If not 64bit, sign extend val. */
10603 if (flag_code != CODE_64BIT
10604 && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
10605 exp->X_add_number
10606 = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
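/* The XOR/subtract pair sign extends the low 32 bits, e.g.
0xfffffffe -> 0x7ffffffe -> -2.  */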
10607 }
10608 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10609 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
10610 && exp_seg != absolute_section
10611 && exp_seg != text_section
10612 && exp_seg != data_section
10613 && exp_seg != bss_section
10614 && exp_seg != undefined_section
10615 && !bfd_is_com_section (exp_seg))
10616 {
10617 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10618 return 0;
10619 }
10620 #endif
10621 else if (!intel_syntax && exp_seg == reg_section)
10622 {
10623 if (imm_start)
10624 as_bad (_("illegal immediate register operand %s"), imm_start);
10625 return 0;
10626 }
10627 else
10628 {
10629 /* This is an address. The size of the address will be
10630 determined later, depending on destination register,
10631 suffix, or the default for the section. */
10632 i.types[this_operand].bitfield.imm8 = 1;
10633 i.types[this_operand].bitfield.imm16 = 1;
10634 i.types[this_operand].bitfield.imm32 = 1;
10635 i.types[this_operand].bitfield.imm32s = 1;
10636 i.types[this_operand].bitfield.imm64 = 1;
10637 i.types[this_operand] = operand_type_and (i.types[this_operand],
10638 types);
10639 }
10640
10641 return 1;
10642 }
10643
10644 static char *
10645 i386_scale (char *scale)
10646 {
10647 offsetT val;
10648 char *save = input_line_pointer;
10649
10650 input_line_pointer = scale;
10651 val = get_absolute_expression ();
10652
10653 switch (val)
10654 {
10655 case 1:
10656 i.log2_scale_factor = 0;
10657 break;
10658 case 2:
10659 i.log2_scale_factor = 1;
10660 break;
10661 case 4:
10662 i.log2_scale_factor = 2;
10663 break;
10664 case 8:
10665 i.log2_scale_factor = 3;
10666 break;
10667 default:
10668 {
10669 char sep = *input_line_pointer;
10670
10671 *input_line_pointer = '\0';
10672 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
10673 scale);
10674 *input_line_pointer = sep;
10675 input_line_pointer = save;
10676 return NULL;
10677 }
10678 }
10679 if (i.log2_scale_factor != 0 && i.index_reg == 0)
10680 {
10681 as_warn (_("scale factor of %d without an index register"),
10682 1 << i.log2_scale_factor);
10683 i.log2_scale_factor = 0;
10684 }
10685 scale = input_line_pointer;
10686 input_line_pointer = save;
10687 return scale;
10688 }
10689
10690 static int
10691 i386_displacement (char *disp_start, char *disp_end)
10692 {
10693 expressionS *exp;
10694 segT exp_seg = 0;
10695 char *save_input_line_pointer;
10696 char *gotfree_input_line;
10697 int override;
10698 i386_operand_type bigdisp, types = anydisp;
10699 int ret;
10700
10701 if (i.disp_operands == MAX_MEMORY_OPERANDS)
10702 {
10703 as_bad (_("at most %d displacement operands are allowed"),
10704 MAX_MEMORY_OPERANDS);
10705 return 0;
10706 }
10707
10708 operand_type_set (&bigdisp, 0);
10709 if (i.jumpabsolute
10710 || i.types[this_operand].bitfield.baseindex
10711 || (current_templates->start->opcode_modifier.jump != JUMP
10712 && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
10713 {
10714 i386_addressing_mode ();
10715 override = (i.prefix[ADDR_PREFIX] != 0);
10716 if (flag_code == CODE_64BIT)
10717 {
10718 if (!override)
10719 {
10720 bigdisp.bitfield.disp32s = 1;
10721 bigdisp.bitfield.disp64 = 1;
10722 }
10723 else
10724 bigdisp.bitfield.disp32 = 1;
10725 }
10726 else if ((flag_code == CODE_16BIT) ^ override)
10727 bigdisp.bitfield.disp16 = 1;
10728 else
10729 bigdisp.bitfield.disp32 = 1;
10730 }
10731 else
10732 {
10733 /* For PC-relative branches, the width of the displacement may be
10734 dependent upon data size, but is never dependent upon address size.
10735 Also make sure to not unintentionally match against a non-PC-relative
10736 branch template. */
10737 static templates aux_templates;
10738 const insn_template *t = current_templates->start;
10739 bfd_boolean has_intel64 = FALSE;
10740
10741 aux_templates.start = t;
10742 while (++t < current_templates->end)
10743 {
10744 if (t->opcode_modifier.jump
10745 != current_templates->start->opcode_modifier.jump)
10746 break;
10747 if ((t->opcode_modifier.isa64 >= INTEL64))
10748 has_intel64 = TRUE;
10749 }
10750 if (t < current_templates->end)
10751 {
10752 aux_templates.end = t;
10753 current_templates = &aux_templates;
10754 }
10755
10756 override = (i.prefix[DATA_PREFIX] != 0);
10757 if (flag_code == CODE_64BIT)
10758 {
10759 if ((override || i.suffix == WORD_MNEM_SUFFIX)
10760 && (!intel64 || !has_intel64))
10761 bigdisp.bitfield.disp16 = 1;
10762 else
10763 bigdisp.bitfield.disp32s = 1;
10764 }
10765 else
10766 {
10767 if (!override)
10768 override = (i.suffix == (flag_code != CODE_16BIT
10769 ? WORD_MNEM_SUFFIX
10770 : LONG_MNEM_SUFFIX));
10771 bigdisp.bitfield.disp32 = 1;
10772 if ((flag_code == CODE_16BIT) ^ override)
10773 {
10774 bigdisp.bitfield.disp32 = 0;
10775 bigdisp.bitfield.disp16 = 1;
10776 }
10777 }
10778 }
10779 i.types[this_operand] = operand_type_or (i.types[this_operand],
10780 bigdisp);
10781
10782 exp = &disp_expressions[i.disp_operands];
10783 i.op[this_operand].disps = exp;
10784 i.disp_operands++;
10785 save_input_line_pointer = input_line_pointer;
10786 input_line_pointer = disp_start;
10787 END_STRING_AND_SAVE (disp_end);
10788
10789 #ifndef GCC_ASM_O_HACK
10790 #define GCC_ASM_O_HACK 0
10791 #endif
10792 #if GCC_ASM_O_HACK
10793 END_STRING_AND_SAVE (disp_end + 1);
10794 if (i.types[this_operand].bitfield.baseIndex
10795 && displacement_string_end[-1] == '+')
10796 {
10797 /* This hack is to avoid a warning when using the "o"
10798 constraint within gcc asm statements.
10799 For instance:
10800
10801 #define _set_tssldt_desc(n,addr,limit,type) \
10802 __asm__ __volatile__ ( \
10803 "movw %w2,%0\n\t" \
10804 "movw %w1,2+%0\n\t" \
10805 "rorl $16,%1\n\t" \
10806 "movb %b1,4+%0\n\t" \
10807 "movb %4,5+%0\n\t" \
10808 "movb $0,6+%0\n\t" \
10809 "movb %h1,7+%0\n\t" \
10810 "rorl $16,%1" \
10811 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
10812
10813 This works great except that the output assembler ends
10814 up looking a bit weird if it turns out that there is
10815 no offset. You end up producing code that looks like:
10816
10817 #APP
10818 movw $235,(%eax)
10819 movw %dx,2+(%eax)
10820 rorl $16,%edx
10821 movb %dl,4+(%eax)
10822 movb $137,5+(%eax)
10823 movb $0,6+(%eax)
10824 movb %dh,7+(%eax)
10825 rorl $16,%edx
10826 #NO_APP
10827
10828 So here we provide the missing zero. */
10829
10830 *displacement_string_end = '0';
10831 }
10832 #endif
10833 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10834 if (gotfree_input_line)
10835 input_line_pointer = gotfree_input_line;
10836
10837 exp_seg = expression (exp);
10838
10839 SKIP_WHITESPACE ();
10840 if (*input_line_pointer)
10841 as_bad (_("junk `%s' after expression"), input_line_pointer);
10842 #if GCC_ASM_O_HACK
10843 RESTORE_END_STRING (disp_end + 1);
10844 #endif
10845 input_line_pointer = save_input_line_pointer;
10846 if (gotfree_input_line)
10847 {
10848 free (gotfree_input_line);
10849
10850 if (exp->X_op == O_constant || exp->X_op == O_register)
10851 exp->X_op = O_illegal;
10852 }
10853
10854 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
10855
10856 RESTORE_END_STRING (disp_end);
10857
10858 return ret;
10859 }
10860
10861 static int
10862 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10863 i386_operand_type types, const char *disp_start)
10864 {
10865 i386_operand_type bigdisp;
10866 int ret = 1;
10867
10868 /* We do this to make sure that the section symbol is in
10869 the symbol table. We will ultimately change the relocation
10870 to be relative to the beginning of the section. */
10871 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
10872 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
10873 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10874 {
10875 if (exp->X_op != O_symbol)
10876 goto inv_disp;
10877
10878 if (S_IS_LOCAL (exp->X_add_symbol)
10879 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
10880 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
10881 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
10882 exp->X_op = O_subtract;
10883 exp->X_op_symbol = GOT_symbol;
10884 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
10885 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
10886 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10887 i.reloc[this_operand] = BFD_RELOC_64;
10888 else
10889 i.reloc[this_operand] = BFD_RELOC_32;
10890 }
10891
10892 else if (exp->X_op == O_absent
10893 || exp->X_op == O_illegal
10894 || exp->X_op == O_big)
10895 {
10896 inv_disp:
10897 as_bad (_("missing or invalid displacement expression `%s'"),
10898 disp_start);
10899 ret = 0;
10900 }
10901
10902 else if (flag_code == CODE_64BIT
10903 && !i.prefix[ADDR_PREFIX]
10904 && exp->X_op == O_constant)
10905 {
10906 /* Since displacement is sign extended to 64bit, don't allow
10907 disp32 and turn off disp32s if they are out of range. */
10908 i.types[this_operand].bitfield.disp32 = 0;
10909 if (!fits_in_signed_long (exp->X_add_number))
10910 {
10911 i.types[this_operand].bitfield.disp32s = 0;
10912 if (i.types[this_operand].bitfield.baseindex)
10913 {
10914 as_bad (_("0x%lx out range of signed 32bit displacement"),
10915 (long) exp->X_add_number);
10916 ret = 0;
10917 }
10918 }
10919 }
10920
10921 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10922 else if (exp->X_op != O_constant
10923 && OUTPUT_FLAVOR == bfd_target_aout_flavour
10924 && exp_seg != absolute_section
10925 && exp_seg != text_section
10926 && exp_seg != data_section
10927 && exp_seg != bss_section
10928 && exp_seg != undefined_section
10929 && !bfd_is_com_section (exp_seg))
10930 {
10931 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10932 ret = 0;
10933 }
10934 #endif
10935
10936 if (current_templates->start->opcode_modifier.jump == JUMP_BYTE
10937 /* Constants get taken care of by optimize_disp(). */
10938 && exp->X_op != O_constant)
10939 i.types[this_operand].bitfield.disp8 = 1;
10940
10941 /* Check if this is a displacement only operand. */
10942 bigdisp = i.types[this_operand];
10943 bigdisp.bitfield.disp8 = 0;
10944 bigdisp.bitfield.disp16 = 0;
10945 bigdisp.bitfield.disp32 = 0;
10946 bigdisp.bitfield.disp32s = 0;
10947 bigdisp.bitfield.disp64 = 0;
10948 if (operand_type_all_zero (&bigdisp))
10949 i.types[this_operand] = operand_type_and (i.types[this_operand],
10950 types);
10951
10952 return ret;
10953 }
10954
10955 /* Return the active addressing mode, taking address override and
10956 registers forming the address into consideration. Update the
10957 address override prefix if necessary. */
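/* E.g. "movw (%bp,%si), %ax" assembled in 32-bit mode yields
CODE_16BIT here, and a 0x67 address size prefix is emitted.  */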
10958
10959 static enum flag_code
10960 i386_addressing_mode (void)
10961 {
10962 enum flag_code addr_mode;
10963
10964 if (i.prefix[ADDR_PREFIX])
10965 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
10966 else if (flag_code == CODE_16BIT
10967 && current_templates->start->cpu_flags.bitfield.cpumpx
10968 /* Avoid replacing the "16-bit addressing not allowed" diagnostic
10969 from md_assemble() by "is not a valid base/index expression"
10970 when there is a base and/or index. */
10971 && !i.types[this_operand].bitfield.baseindex)
10972 {
10973 /* MPX insn memory operands with neither base nor index must be forced
10974 to use 32-bit addressing in 16-bit mode. */
10975 addr_mode = CODE_32BIT;
10976 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10977 ++i.prefixes;
10978 gas_assert (!i.types[this_operand].bitfield.disp16);
10979 gas_assert (!i.types[this_operand].bitfield.disp32);
10980 }
10981 else
10982 {
10983 addr_mode = flag_code;
10984
10985 #if INFER_ADDR_PREFIX
10986 if (i.mem_operands == 0)
10987 {
10988 /* Infer address prefix from the first memory operand. */
10989 const reg_entry *addr_reg = i.base_reg;
10990
10991 if (addr_reg == NULL)
10992 addr_reg = i.index_reg;
10993
10994 if (addr_reg)
10995 {
10996 if (addr_reg->reg_type.bitfield.dword)
10997 addr_mode = CODE_32BIT;
10998 else if (flag_code != CODE_64BIT
10999 && addr_reg->reg_type.bitfield.word)
11000 addr_mode = CODE_16BIT;
11001
11002 if (addr_mode != flag_code)
11003 {
11004 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
11005 i.prefixes += 1;
11006 /* Change the size of any displacement too. At most one
11007 of Disp16 or Disp32 is set.
11008 FIXME. There doesn't seem to be any real need for
11009 separate Disp16 and Disp32 flags. The same goes for
11010 Imm16 and Imm32. Removing them would probably clean
11011 up the code quite a lot. */
11012 if (flag_code != CODE_64BIT
11013 && (i.types[this_operand].bitfield.disp16
11014 || i.types[this_operand].bitfield.disp32))
11015 i.types[this_operand]
11016 = operand_type_xor (i.types[this_operand], disp16_32);
11017 }
11018 }
11019 }
11020 #endif
11021 }
11022
11023 return addr_mode;
11024 }
11025
11026 /* Make sure the memory operand we've been dealt is valid.
11027 Return 1 on success, 0 on a failure. */
11028
11029 static int
11030 i386_index_check (const char *operand_string)
11031 {
11032 const char *kind = "base/index";
11033 enum flag_code addr_mode = i386_addressing_mode ();
11034
11035 if (current_templates->start->opcode_modifier.isstring
11036 && !current_templates->start->cpu_flags.bitfield.cpupadlock
11037 && (current_templates->end[-1].opcode_modifier.isstring
11038 || i.mem_operands))
11039 {
11040 /* Memory operands of string insns are special in that they only allow
11041 a single register (rDI, rSI, or rBX) as their memory address. */
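/* E.g. "movsb" implicitly uses (%esi) and (%edi) in 32-bit mode,
"stosb" only (%edi), and "xlatb" (%ebx); any other base/index
combination is diagnosed below.  */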
11042 const reg_entry *expected_reg;
11043 static const char *di_si[][2] =
11044 {
11045 { "esi", "edi" },
11046 { "si", "di" },
11047 { "rsi", "rdi" }
11048 };
11049 static const char *bx[] = { "ebx", "bx", "rbx" };
11050
11051 kind = "string address";
11052
11053 if (current_templates->start->opcode_modifier.prefixok == PrefixRep)
11054 {
11055 int es_op = current_templates->end[-1].opcode_modifier.isstring
11056 - IS_STRING_ES_OP0;
11057 int op = 0;
11058
11059 if (!current_templates->end[-1].operand_types[0].bitfield.baseindex
11060 || ((!i.mem_operands != !intel_syntax)
11061 && current_templates->end[-1].operand_types[1]
11062 .bitfield.baseindex))
11063 op = 1;
11064 expected_reg
11065 = (const reg_entry *) str_hash_find (reg_hash,
11066 di_si[addr_mode][op == es_op]);
11067 }
11068 else
11069 expected_reg
11070 = (const reg_entry *)str_hash_find (reg_hash, bx[addr_mode]);
11071
11072 if (i.base_reg != expected_reg
11073 || i.index_reg
11074 || operand_type_check (i.types[this_operand], disp))
11075 {
11076 /* The second memory operand must have the same size as
11077 the first one. */
11078 if (i.mem_operands
11079 && i.base_reg
11080 && !((addr_mode == CODE_64BIT
11081 && i.base_reg->reg_type.bitfield.qword)
11082 || (addr_mode == CODE_32BIT
11083 ? i.base_reg->reg_type.bitfield.dword
11084 : i.base_reg->reg_type.bitfield.word)))
11085 goto bad_address;
11086
11087 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
11088 operand_string,
11089 intel_syntax ? '[' : '(',
11090 register_prefix,
11091 expected_reg->reg_name,
11092 intel_syntax ? ']' : ')');
11093 return 1;
11094 }
11095 else
11096 return 1;
11097
11098 bad_address:
11099 as_bad (_("`%s' is not a valid %s expression"),
11100 operand_string, kind);
11101 return 0;
11102 }
11103 else
11104 {
11105 if (addr_mode != CODE_16BIT)
11106 {
11107 /* 32-bit/64-bit checks. */
11108 if (i.disp_encoding == disp_encoding_16bit)
11109 {
11110 bad_disp:
11111 as_bad (_("invalid `%s' prefix"),
11112 addr_mode == CODE_16BIT ? "{disp32}" : "{disp16}");
11113 return 0;
11114 }
11115
11116 if ((i.base_reg
11117 && ((addr_mode == CODE_64BIT
11118 ? !i.base_reg->reg_type.bitfield.qword
11119 : !i.base_reg->reg_type.bitfield.dword)
11120 || (i.index_reg && i.base_reg->reg_num == RegIP)
11121 || i.base_reg->reg_num == RegIZ))
11122 || (i.index_reg
11123 && !i.index_reg->reg_type.bitfield.xmmword
11124 && !i.index_reg->reg_type.bitfield.ymmword
11125 && !i.index_reg->reg_type.bitfield.zmmword
11126 && ((addr_mode == CODE_64BIT
11127 ? !i.index_reg->reg_type.bitfield.qword
11128 : !i.index_reg->reg_type.bitfield.dword)
11129 || !i.index_reg->reg_type.bitfield.baseindex)))
11130 goto bad_address;
11131
11132 /* bndmk, bndldx, bndstx and mandatory non-vector SIB have special restrictions. */
11133 if (current_templates->start->base_opcode == 0xf30f1b
11134 || (current_templates->start->base_opcode & ~1) == 0x0f1a
11135 || current_templates->start->opcode_modifier.sib == SIBMEM)
11136 {
11137 /* They cannot use RIP-relative addressing. */
11138 if (i.base_reg && i.base_reg->reg_num == RegIP)
11139 {
11140 as_bad (_("`%s' cannot be used here"), operand_string);
11141 return 0;
11142 }
11143
11144 /* bndldx and bndstx ignore their scale factor. */
11145 if ((current_templates->start->base_opcode & ~1) == 0x0f1a
11146 && i.log2_scale_factor)
11147 as_warn (_("register scaling is being ignored here"));
11148 }
11149 }
11150 else
11151 {
11152 /* 16-bit checks. */
11153 if (i.disp_encoding == disp_encoding_32bit)
11154 goto bad_disp;
11155
11156 if ((i.base_reg
11157 && (!i.base_reg->reg_type.bitfield.word
11158 || !i.base_reg->reg_type.bitfield.baseindex))
11159 || (i.index_reg
11160 && (!i.index_reg->reg_type.bitfield.word
11161 || !i.index_reg->reg_type.bitfield.baseindex
11162 || !(i.base_reg
11163 && i.base_reg->reg_num < 6
11164 && i.index_reg->reg_num >= 6
11165 && i.log2_scale_factor == 0))))
11166 goto bad_address;
11167 }
11168 }
11169 return 1;
11170 }
11171
11172 /* Handle vector immediates. */
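/* I.e. the embedded-rounding and suppress-all-exceptions pseudo
operands of AVX512, e.g. "{rn-sae}" in
"vaddps {rn-sae}, %zmm1, %zmm2, %zmm3".  */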
11173
11174 static int
11175 RC_SAE_immediate (const char *imm_start)
11176 {
11177 unsigned int match_found, j;
11178 const char *pstr = imm_start;
11179 expressionS *exp;
11180
11181 if (*pstr != '{')
11182 return 0;
11183
11184 pstr++;
11185 match_found = 0;
11186 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
11187 {
11188 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
11189 {
11190 if (!i.rounding)
11191 {
11192 rc_op.type = RC_NamesTable[j].type;
11193 rc_op.operand = this_operand;
11194 i.rounding = &rc_op;
11195 }
11196 else
11197 {
11198 as_bad (_("duplicated `%s'"), imm_start);
11199 return 0;
11200 }
11201 pstr += RC_NamesTable[j].len;
11202 match_found = 1;
11203 break;
11204 }
11205 }
11206 if (!match_found)
11207 return 0;
11208
11209 if (*pstr++ != '}')
11210 {
11211 as_bad (_("Missing '}': '%s'"), imm_start);
11212 return 0;
11213 }
11214 /* RC/SAE immediate string should contain nothing more. */
11215 if (*pstr != 0)
11216 {
11217 as_bad (_("Junk after '}': '%s'"), imm_start);
11218 return 0;
11219 }
11220
11221 exp = &im_expressions[i.imm_operands++];
11222 i.op[this_operand].imms = exp;
11223
11224 exp->X_op = O_constant;
11225 exp->X_add_number = 0;
11226 exp->X_add_symbol = (symbolS *) 0;
11227 exp->X_op_symbol = (symbolS *) 0;
11228
11229 i.types[this_operand].bitfield.imm8 = 1;
11230 return 1;
11231 }
11232
11233 /* Only string instructions can have a second memory operand, so
11234 reduce current_templates to just those if it contains any. */
11235 static int
11236 maybe_adjust_templates (void)
11237 {
11238 const insn_template *t;
11239
11240 gas_assert (i.mem_operands == 1);
11241
11242 for (t = current_templates->start; t < current_templates->end; ++t)
11243 if (t->opcode_modifier.isstring)
11244 break;
11245
11246 if (t < current_templates->end)
11247 {
11248 static templates aux_templates;
11249 bfd_boolean recheck;
11250
11251 aux_templates.start = t;
11252 for (; t < current_templates->end; ++t)
11253 if (!t->opcode_modifier.isstring)
11254 break;
11255 aux_templates.end = t;
11256
11257 /* Determine whether to re-check the first memory operand. */
11258 recheck = (aux_templates.start != current_templates->start
11259 || t != current_templates->end);
11260
11261 current_templates = &aux_templates;
11262
11263 if (recheck)
11264 {
11265 i.mem_operands = 0;
11266 if (i.memop1_string != NULL
11267 && i386_index_check (i.memop1_string) == 0)
11268 return 0;
11269 i.mem_operands = 1;
11270 }
11271 }
11272
11273 return 1;
11274 }
11275
11276 /* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
11277 on error. */
11278
11279 static int
11280 i386_att_operand (char *operand_string)
11281 {
11282 const reg_entry *r;
11283 char *end_op;
11284 char *op_string = operand_string;
11285
11286 if (is_space_char (*op_string))
11287 ++op_string;
11288
11289 /* We check for an absolute prefix (differentiating,
11290 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'). */
11291 if (*op_string == ABSOLUTE_PREFIX)
11292 {
11293 ++op_string;
11294 if (is_space_char (*op_string))
11295 ++op_string;
11296 i.jumpabsolute = TRUE;
11297 }
11298
11299 /* Check if operand is a register. */
11300 if ((r = parse_register (op_string, &end_op)) != NULL)
11301 {
11302 i386_operand_type temp;
11303
11304 if (r == &bad_reg)
11305 return 0;
11306
11307 /* Check for a segment override by searching for ':' after a
11308 segment register. */
11309 op_string = end_op;
11310 if (is_space_char (*op_string))
11311 ++op_string;
11312 if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
11313 {
11314 switch (r->reg_num)
11315 {
11316 case 0:
11317 i.seg[i.mem_operands] = &es;
11318 break;
11319 case 1:
11320 i.seg[i.mem_operands] = &cs;
11321 break;
11322 case 2:
11323 i.seg[i.mem_operands] = &ss;
11324 break;
11325 case 3:
11326 i.seg[i.mem_operands] = &ds;
11327 break;
11328 case 4:
11329 i.seg[i.mem_operands] = &fs;
11330 break;
11331 case 5:
11332 i.seg[i.mem_operands] = &gs;
11333 break;
11334 }
11335
11336 /* Skip the ':' and whitespace. */
11337 ++op_string;
11338 if (is_space_char (*op_string))
11339 ++op_string;
11340
11341 if (!is_digit_char (*op_string)
11342 && !is_identifier_char (*op_string)
11343 && *op_string != '('
11344 && *op_string != ABSOLUTE_PREFIX)
11345 {
11346 as_bad (_("bad memory operand `%s'"), op_string);
11347 return 0;
11348 }
11349 /* Handle case of %es:*foo. */
11350 if (*op_string == ABSOLUTE_PREFIX)
11351 {
11352 ++op_string;
11353 if (is_space_char (*op_string))
11354 ++op_string;
11355 i.jumpabsolute = TRUE;
11356 }
11357 goto do_memory_reference;
11358 }
11359
11360 /* Handle vector operations. */
11361 if (*op_string == '{')
11362 {
11363 op_string = check_VecOperations (op_string, NULL);
11364 if (op_string == NULL)
11365 return 0;
11366 }
11367
11368 if (*op_string)
11369 {
11370 as_bad (_("junk `%s' after register"), op_string);
11371 return 0;
11372 }
11373 temp = r->reg_type;
11374 temp.bitfield.baseindex = 0;
11375 i.types[this_operand] = operand_type_or (i.types[this_operand],
11376 temp);
11377 i.types[this_operand].bitfield.unspecified = 0;
11378 i.op[this_operand].regs = r;
11379 i.reg_operands++;
11380 }
11381 else if (*op_string == REGISTER_PREFIX)
11382 {
11383 as_bad (_("bad register name `%s'"), op_string);
11384 return 0;
11385 }
11386 else if (*op_string == IMMEDIATE_PREFIX)
11387 {
11388 ++op_string;
11389 if (i.jumpabsolute)
11390 {
11391 as_bad (_("immediate operand illegal with absolute jump"));
11392 return 0;
11393 }
11394 if (!i386_immediate (op_string))
11395 return 0;
11396 }
11397 else if (RC_SAE_immediate (operand_string))
11398 {
11399 /* If it is a RC or SAE immediate, do nothing. */
11400 ;
11401 }
11402 else if (is_digit_char (*op_string)
11403 || is_identifier_char (*op_string)
11404 || *op_string == '"'
11405 || *op_string == '(')
11406 {
11407 /* This is a memory reference of some sort. */
11408 char *base_string;
11409
11410 /* Start and end of displacement string expression (if found). */
11411 char *displacement_string_start;
11412 char *displacement_string_end;
11413 char *vop_start;
11414
11415 do_memory_reference:
11416 if (i.mem_operands == 1 && !maybe_adjust_templates ())
11417 return 0;
11418 if ((i.mem_operands == 1
11419 && !current_templates->start->opcode_modifier.isstring)
11420 || i.mem_operands == 2)
11421 {
11422 as_bad (_("too many memory references for `%s'"),
11423 current_templates->start->name);
11424 return 0;
11425 }
11426
11427 /* Check for base index form. We detect the base index form by
11428 looking for an ')' at the end of the operand, searching
11429 for the '(' matching it, and finding a REGISTER_PREFIX or ','
11430 after the '('. */
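/* E.g. "-4(%ebp,%esi,2)" is split here into the displacement "-4",
base register %ebp, index register %esi and scale factor 2.  */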
11431 base_string = op_string + strlen (op_string);
11432
11433 /* Handle vector operations. */
11434 vop_start = strchr (op_string, '{');
11435 if (vop_start && vop_start < base_string)
11436 {
11437 if (check_VecOperations (vop_start, base_string) == NULL)
11438 return 0;
11439 base_string = vop_start;
11440 }
11441
11442 --base_string;
11443 if (is_space_char (*base_string))
11444 --base_string;
11445
11446 /* If we only have a displacement, set up for it to be parsed later. */
11447 displacement_string_start = op_string;
11448 displacement_string_end = base_string + 1;
11449
11450 if (*base_string == ')')
11451 {
11452 char *temp_string;
11453 unsigned int parens_balanced = 1;
11454 /* We've already checked that the number of left & right ()'s is
11455 equal, so this loop will not be infinite. */
11456 do
11457 {
11458 base_string--;
11459 if (*base_string == ')')
11460 parens_balanced++;
11461 if (*base_string == '(')
11462 parens_balanced--;
11463 }
11464 while (parens_balanced);
11465
11466 temp_string = base_string;
11467
11468 /* Skip past '(' and whitespace. */
11469 ++base_string;
11470 if (is_space_char (*base_string))
11471 ++base_string;
11472
11473 if (*base_string == ','
11474 || ((i.base_reg = parse_register (base_string, &end_op))
11475 != NULL))
11476 {
11477 displacement_string_end = temp_string;
11478
11479 i.types[this_operand].bitfield.baseindex = 1;
11480
11481 if (i.base_reg)
11482 {
11483 if (i.base_reg == &bad_reg)
11484 return 0;
11485 base_string = end_op;
11486 if (is_space_char (*base_string))
11487 ++base_string;
11488 }
11489
11490 /* There may be an index reg or scale factor here. */
11491 if (*base_string == ',')
11492 {
11493 ++base_string;
11494 if (is_space_char (*base_string))
11495 ++base_string;
11496
11497 if ((i.index_reg = parse_register (base_string, &end_op))
11498 != NULL)
11499 {
11500 if (i.index_reg == &bad_reg)
11501 return 0;
11502 base_string = end_op;
11503 if (is_space_char (*base_string))
11504 ++base_string;
11505 if (*base_string == ',')
11506 {
11507 ++base_string;
11508 if (is_space_char (*base_string))
11509 ++base_string;
11510 }
11511 else if (*base_string != ')')
11512 {
11513 as_bad (_("expecting `,' or `)' "
11514 "after index register in `%s'"),
11515 operand_string);
11516 return 0;
11517 }
11518 }
11519 else if (*base_string == REGISTER_PREFIX)
11520 {
11521 end_op = strchr (base_string, ',');
11522 if (end_op)
11523 *end_op = '\0';
11524 as_bad (_("bad register name `%s'"), base_string);
11525 return 0;
11526 }
11527
11528 /* Check for scale factor. */
11529 if (*base_string != ')')
11530 {
11531 char *end_scale = i386_scale (base_string);
11532
11533 if (!end_scale)
11534 return 0;
11535
11536 base_string = end_scale;
11537 if (is_space_char (*base_string))
11538 ++base_string;
11539 if (*base_string != ')')
11540 {
11541 as_bad (_("expecting `)' "
11542 "after scale factor in `%s'"),
11543 operand_string);
11544 return 0;
11545 }
11546 }
11547 else if (!i.index_reg)
11548 {
11549 as_bad (_("expecting index register or scale factor "
11550 "after `,'; got '%c'"),
11551 *base_string);
11552 return 0;
11553 }
11554 }
11555 else if (*base_string != ')')
11556 {
11557 as_bad (_("expecting `,' or `)' "
11558 "after base register in `%s'"),
11559 operand_string);
11560 return 0;
11561 }
11562 }
11563 else if (*base_string == REGISTER_PREFIX)
11564 {
11565 end_op = strchr (base_string, ',');
11566 if (end_op)
11567 *end_op = '\0';
11568 as_bad (_("bad register name `%s'"), base_string);
11569 return 0;
11570 }
11571 }
11572
11573 /* If there's an expression beginning the operand, parse it,
11574 assuming displacement_string_start and
11575 displacement_string_end are meaningful. */
11576 if (displacement_string_start != displacement_string_end)
11577 {
11578 if (!i386_displacement (displacement_string_start,
11579 displacement_string_end))
11580 return 0;
11581 }
11582
11583 /* Special case for (%dx) while doing input/output op. */
11584 if (i.base_reg
11585 && i.base_reg->reg_type.bitfield.instance == RegD
11586 && i.base_reg->reg_type.bitfield.word
11587 && i.index_reg == 0
11588 && i.log2_scale_factor == 0
11589 && i.seg[i.mem_operands] == 0
11590 && !operand_type_check (i.types[this_operand], disp))
11591 {
11592 i.types[this_operand] = i.base_reg->reg_type;
11593 return 1;
11594 }
11595
11596 if (i386_index_check (operand_string) == 0)
11597 return 0;
11598 i.flags[this_operand] |= Operand_Mem;
11599 if (i.mem_operands == 0)
11600 i.memop1_string = xstrdup (operand_string);
11601 i.mem_operands++;
11602 }
11603 else
11604 {
11605 /* It's not a memory operand; argh! */
11606 as_bad (_("invalid char %s beginning operand %d `%s'"),
11607 output_invalid (*op_string),
11608 this_operand + 1,
11609 op_string);
11610 return 0;
11611 }
11612 return 1; /* Normal return. */
11613 }
11614 \f
11615 /* Calculate the maximum variable size (i.e., excluding fr_fix)
11616 that an rs_machine_dependent frag may reach. */
11617
11618 unsigned int
11619 i386_frag_max_var (fragS *frag)
11620 {
11621 /* The only relaxable frags are for jumps.
11622 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
11623 gas_assert (frag->fr_type == rs_machine_dependent);
11624 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
11625 }
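/* Editorial illustration, not from the original source: the variable
   part is everything beyond fr_fix.  An unconditional `jmp' relaxes
   from `EB cb' to `E9 cd', still one opcode byte, so at most the 4
   displacement bytes vary.  A conditional `jcc' relaxes from `7N cb'
   to `0F 8N cd', gaining an extra opcode byte on top of the 4-byte
   displacement, hence 5.  */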
11626
11627 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11628 static int
11629 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
11630 {
11631 /* STT_GNU_IFUNC symbol must go through PLT. */
11632 if ((symbol_get_bfdsym (fr_symbol)->flags
11633 & BSF_GNU_INDIRECT_FUNCTION) != 0)
11634 return 0;
11635
11636 if (!S_IS_EXTERNAL (fr_symbol))
11637 /* Symbol may be weak or local. */
11638 return !S_IS_WEAK (fr_symbol);
11639
11640 /* Global symbols with non-default visibility can't be preempted. */
11641 if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
11642 return 1;
11643
11644 if (fr_var != NO_RELOC)
11645 switch ((enum bfd_reloc_code_real) fr_var)
11646 {
11647 case BFD_RELOC_386_PLT32:
11648 case BFD_RELOC_X86_64_PLT32:
11649 /* Symbol with PLT relocation may be preempted. */
11650 return 0;
11651 default:
11652 abort ();
11653 }
11654
11655 /* Global symbols with default visibility in a shared library may be
11656 preempted by another definition. */
11657 return !shared;
11658 }
11659 #endif
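/* Editorial examples, not from the original source: a jump to a
   non-weak local label in the same section returns 1 (safe to
   relax), while `jmp foo@PLT' carries BFD_RELOC_386_PLT32 or
   BFD_RELOC_X86_64_PLT32 and returns 0, since a PLT-bound symbol
   may be preempted by another definition at runtime.  */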
11660
11661 /* Table 3-2. Macro-Fusible Instructions in Haswell Microarchitecture
11662 Note: this also works for Skylake and Cascadelake.
11663 ---------------------------------------------------------------------
11664 | JCC | ADD/SUB/CMP | INC/DEC | TEST/AND |
11665 | ------ | ----------- | ------- | -------- |
11666 | Jo | N | N | Y |
11667 | Jno | N | N | Y |
11668 | Jc/Jb | Y | N | Y |
11669 | Jae/Jnb | Y | N | Y |
11670 | Je/Jz | Y | Y | Y |
11671 | Jne/Jnz | Y | Y | Y |
11672 | Jna/Jbe | Y | N | Y |
11673 | Ja/Jnbe | Y | N | Y |
11674 | Js | N | N | Y |
11675 | Jns | N | N | Y |
11676 | Jp/Jpe | N | N | Y |
11677 | Jnp/Jpo | N | N | Y |
11678 | Jl/Jnge | Y | Y | Y |
11679 | Jge/Jnl | Y | Y | Y |
11680 | Jle/Jng | Y | Y | Y |
11681 | Jg/Jnle | Y | Y | Y |
11682 --------------------------------------------------------------------- */
11683 static int
11684 i386_macro_fusible_p (enum mf_cmp_kind mf_cmp, enum mf_jcc_kind mf_jcc)
11685 {
11686 if (mf_cmp == mf_cmp_alu_cmp)
11687 return ((mf_jcc >= mf_jcc_jc && mf_jcc <= mf_jcc_jna)
11688 || mf_jcc == mf_jcc_jl || mf_jcc == mf_jcc_jle);
11689 if (mf_cmp == mf_cmp_incdec)
11690 return (mf_jcc == mf_jcc_je || mf_jcc == mf_jcc_jl
11691 || mf_jcc == mf_jcc_jle);
11692 if (mf_cmp == mf_cmp_test_and)
11693 return 1;
11694 return 0;
11695 }
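/* Editorial sketch, not part of the original file: a minimal
   self-check of i386_macro_fusible_p against Table 3-2 above, using
   the mf_* enumerators from tc-i386.h.  The guard macro
   I386_MACRO_FUSION_SELFTEST is hypothetical.  */
#ifdef I386_MACRO_FUSION_SELFTEST
static void
i386_macro_fusion_selftest (void)
{
  /* TEST/AND fuses with every Jcc (last column is all Y).  */
  gas_assert (i386_macro_fusible_p (mf_cmp_test_and, mf_jcc_jo));
  /* INC/DEC fuses only with Je/Jne and the signed compares.  */
  gas_assert (!i386_macro_fusible_p (mf_cmp_incdec, mf_jcc_jc));
  gas_assert (i386_macro_fusible_p (mf_cmp_incdec, mf_jcc_je));
  /* ADD/SUB/CMP does not fuse with Jo/Jno.  */
  gas_assert (!i386_macro_fusible_p (mf_cmp_alu_cmp, mf_jcc_jo));
}
#endif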
11696
11697 /* Return the next non-empty frag. */
11698
11699 static fragS *
11700 i386_next_non_empty_frag (fragS *fragP)
11701 {
11702 /* There may be a frag with a ".fill 0" when there is no room in
11703 the current frag for frag_grow in output_insn. */
11704 for (fragP = fragP->fr_next;
11705 (fragP != NULL
11706 && fragP->fr_type == rs_fill
11707 && fragP->fr_fix == 0);
11708 fragP = fragP->fr_next)
11709 ;
11710 return fragP;
11711 }
11712
11713 /* Return the next jcc frag after BRANCH_PADDING. */
11714
11715 static fragS *
11716 i386_next_fusible_jcc_frag (fragS *maybe_cmp_fragP, fragS *pad_fragP)
11717 {
11718 fragS *branch_fragP;
11719 if (!pad_fragP)
11720 return NULL;
11721
11722 if (pad_fragP->fr_type == rs_machine_dependent
11723 && (TYPE_FROM_RELAX_STATE (pad_fragP->fr_subtype)
11724 == BRANCH_PADDING))
11725 {
11726 branch_fragP = i386_next_non_empty_frag (pad_fragP);
11727 if (branch_fragP->fr_type != rs_machine_dependent)
11728 return NULL;
11729 if (TYPE_FROM_RELAX_STATE (branch_fragP->fr_subtype) == COND_JUMP
11730 && i386_macro_fusible_p (maybe_cmp_fragP->tc_frag_data.mf_type,
11731 pad_fragP->tc_frag_data.mf_type))
11732 return branch_fragP;
11733 }
11734
11735 return NULL;
11736 }
11737
11738 /* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags. */
11739
11740 static void
11741 i386_classify_machine_dependent_frag (fragS *fragP)
11742 {
11743 fragS *cmp_fragP;
11744 fragS *pad_fragP;
11745 fragS *branch_fragP;
11746 fragS *next_fragP;
11747 unsigned int max_prefix_length;
11748
11749 if (fragP->tc_frag_data.classified)
11750 return;
11751
11752 /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING. Convert
11753 FUSED_JCC_PADDING and merge BRANCH_PADDING. */
11754 for (next_fragP = fragP;
11755 next_fragP != NULL;
11756 next_fragP = next_fragP->fr_next)
11757 {
11758 next_fragP->tc_frag_data.classified = 1;
11759 if (next_fragP->fr_type == rs_machine_dependent)
11760 switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
11761 {
11762 case BRANCH_PADDING:
11763 /* The BRANCH_PADDING frag must be followed by a branch
11764 frag. */
11765 branch_fragP = i386_next_non_empty_frag (next_fragP);
11766 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11767 break;
11768 case FUSED_JCC_PADDING:
11769 /* Check if this is a fused jcc:
11770 FUSED_JCC_PADDING
11771 CMP like instruction
11772 BRANCH_PADDING
11773 COND_JUMP
11774 */
11775 cmp_fragP = i386_next_non_empty_frag (next_fragP);
11776 pad_fragP = i386_next_non_empty_frag (cmp_fragP);
11777 branch_fragP = i386_next_fusible_jcc_frag (next_fragP, pad_fragP);
11778 if (branch_fragP)
11779 {
11780 /* The BRANCH_PADDING frag is merged with the
11781 FUSED_JCC_PADDING frag. */
11782 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11783 /* CMP like instruction size. */
11784 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
11785 frag_wane (pad_fragP);
11786 /* Skip to branch_fragP. */
11787 next_fragP = branch_fragP;
11788 }
11789 else if (next_fragP->tc_frag_data.max_prefix_length)
11790 {
11791 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
11792 a fused jcc. */
11793 next_fragP->fr_subtype
11794 = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
11795 next_fragP->tc_frag_data.max_bytes
11796 = next_fragP->tc_frag_data.max_prefix_length;
11797 /* This will be updated in the BRANCH_PREFIX scan. */
11798 next_fragP->tc_frag_data.max_prefix_length = 0;
11799 }
11800 else
11801 frag_wane (next_fragP);
11802 break;
11803 }
11804 }
11805
11806 /* Stop if there is no BRANCH_PREFIX. */
11807 if (!align_branch_prefix_size)
11808 return;
11809
11810 /* Scan for BRANCH_PREFIX. */
11811 for (; fragP != NULL; fragP = fragP->fr_next)
11812 {
11813 if (fragP->fr_type != rs_machine_dependent
11814 || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11815 != BRANCH_PREFIX))
11816 continue;
11817
11818 /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
11819 FUSED_JCC_PADDING. */
11820 max_prefix_length = 0;
11821 for (next_fragP = fragP;
11822 next_fragP != NULL;
11823 next_fragP = next_fragP->fr_next)
11824 {
11825 if (next_fragP->fr_type == rs_fill)
11826 /* Skip rs_fill frags. */
11827 continue;
11828 else if (next_fragP->fr_type != rs_machine_dependent)
11829 /* Stop for all other frags. */
11830 break;
11831
11832 /* rs_machine_dependent frags. */
11833 if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11834 == BRANCH_PREFIX)
11835 {
11836 /* Count BRANCH_PREFIX frags. */
11837 if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
11838 {
11839 max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
11840 frag_wane (next_fragP);
11841 }
11842 else
11843 max_prefix_length
11844 += next_fragP->tc_frag_data.max_bytes;
11845 }
11846 else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11847 == BRANCH_PADDING)
11848 || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11849 == FUSED_JCC_PADDING))
11850 {
11851 /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING. */
11852 fragP->tc_frag_data.u.padding_fragP = next_fragP;
11853 break;
11854 }
11855 else
11856 /* Stop for other rs_machine_dependent frags. */
11857 break;
11858 }
11859
11860 fragP->tc_frag_data.max_prefix_length = max_prefix_length;
11861
11862 /* Skip to the next frag. */
11863 fragP = next_fragP;
11864 }
11865 }
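/* Editorial example, not from the original source: with branch
   alignment enabled (e.g. -mbranches-within-32B-boundaries), a
   fusible pair such as

       cmpl $0, %eax
       je   target

   is emitted as the frag chain
       FUSED_JCC_PADDING -> cmp insn -> BRANCH_PADDING -> jcc insn
   and the scan above wanes the BRANCH_PADDING frag, leaving the
   FUSED_JCC_PADDING frag to pad the cmp+jcc pair as one unit.  */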
11866
11867 /* Compute padding size for
11868
11869 FUSED_JCC_PADDING
11870 CMP like instruction
11871 BRANCH_PADDING
11872 COND_JUMP/UNCOND_JUMP
11873
11874 or
11875
11876 BRANCH_PADDING
11877 COND_JUMP/UNCOND_JUMP
11878 */
11879
11880 static int
11881 i386_branch_padding_size (fragS *fragP, offsetT address)
11882 {
11883 unsigned int offset, size, padding_size;
11884 fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
11885
11886 /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag. */
11887 if (!address)
11888 address = fragP->fr_address;
11889 address += fragP->fr_fix;
11890
11891 /* CMP like instruction size. */
11892 size = fragP->tc_frag_data.cmp_size;
11893
11894 /* The base size of the branch frag. */
11895 size += branch_fragP->fr_fix;
11896
11897 /* Add opcode and displacement bytes for the rs_machine_dependent
11898 branch frag. */
11899 if (branch_fragP->fr_type == rs_machine_dependent)
11900 size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
11901
11902 /* Check that the branch stays within the boundary and doesn't
11903 end at its last byte. */
11904 offset = address & ((1U << align_branch_power) - 1);
11905 if ((offset + size) >= (1U << align_branch_power))
11906 /* Padding needed to avoid crossing boundary. */
11907 padding_size = (1U << align_branch_power) - offset;
11908 else
11909 /* No padding needed. */
11910 padding_size = 0;
11911
11912 /* The return value may be saved in tc_frag_data.length, which is
11913 an unsigned byte. */
11914 if (!fits_in_unsigned_byte (padding_size))
11915 abort ();
11916
11917 return padding_size;
11918 }
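/* Worked example (editorial): with align_branch_power == 5, i.e. a
   32-byte boundary, a 6-byte fused cmp+jcc pair starting at address
   0x3c gives offset = 0x3c & 31 = 28, and 28 + 6 = 34 >= 32, so
   padding_size = 32 - 28 = 4; the pair is pushed to 0x40 instead of
   straddling the boundary.  */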
11919
11920 /* i386_generic_table_relax_frag()
11921
11922 Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
11923 grow/shrink padding to align branch frags. Hand others to
11924 relax_frag(). */
11925
11926 long
11927 i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
11928 {
11929 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11930 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11931 {
11932 long padding_size = i386_branch_padding_size (fragP, 0);
11933 long grow = padding_size - fragP->tc_frag_data.length;
11934
11935 /* When the BRANCH_PREFIX frag is used, the computed address
11936 must match the actual address and there should be no padding. */
11937 if (fragP->tc_frag_data.padding_address
11938 && (fragP->tc_frag_data.padding_address != fragP->fr_address
11939 || padding_size))
11940 abort ();
11941
11942 /* Update the padding size. */
11943 if (grow)
11944 fragP->tc_frag_data.length = padding_size;
11945
11946 return grow;
11947 }
11948 else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11949 {
11950 fragS *padding_fragP, *next_fragP;
11951 long padding_size, left_size, last_size;
11952
11953 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11954 if (!padding_fragP)
11955 /* Use the padding set by the leading BRANCH_PREFIX frag. */
11956 return (fragP->tc_frag_data.length
11957 - fragP->tc_frag_data.last_length);
11958
11959 /* Compute the relative address of the padding frag the very
11960 first time, when the BRANCH_PREFIX frag sizes are all zero. */
11961 if (!fragP->tc_frag_data.padding_address)
11962 fragP->tc_frag_data.padding_address
11963 = padding_fragP->fr_address - (fragP->fr_address - stretch);
11964
11965 /* First update the last length from the previous iteration. */
11966 left_size = fragP->tc_frag_data.prefix_length;
11967 for (next_fragP = fragP;
11968 next_fragP != padding_fragP;
11969 next_fragP = next_fragP->fr_next)
11970 if (next_fragP->fr_type == rs_machine_dependent
11971 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11972 == BRANCH_PREFIX))
11973 {
11974 if (left_size)
11975 {
11976 int max = next_fragP->tc_frag_data.max_bytes;
11977 if (max)
11978 {
11979 int size;
11980 if (max > left_size)
11981 size = left_size;
11982 else
11983 size = max;
11984 left_size -= size;
11985 next_fragP->tc_frag_data.last_length = size;
11986 }
11987 }
11988 else
11989 next_fragP->tc_frag_data.last_length = 0;
11990 }
11991
11992 /* Check the padding size for the padding frag. */
11993 padding_size = i386_branch_padding_size
11994 (padding_fragP, (fragP->fr_address
11995 + fragP->tc_frag_data.padding_address));
11996
11997 last_size = fragP->tc_frag_data.prefix_length;
11998 /* Check if there is any change from the last iteration. */
11999 if (padding_size == last_size)
12000 {
12001 /* Update the expected address of the padding frag. */
12002 padding_fragP->tc_frag_data.padding_address
12003 = (fragP->fr_address + padding_size
12004 + fragP->tc_frag_data.padding_address);
12005 return 0;
12006 }
12007
12008 if (padding_size > fragP->tc_frag_data.max_prefix_length)
12009 {
12010 /* No padding if there is insufficient room. Clear the
12011 expected address of the padding frag. */
12012 padding_fragP->tc_frag_data.padding_address = 0;
12013 padding_size = 0;
12014 }
12015 else
12016 /* Store the expected address of the padding frag. */
12017 padding_fragP->tc_frag_data.padding_address
12018 = (fragP->fr_address + padding_size
12019 + fragP->tc_frag_data.padding_address);
12020
12021 fragP->tc_frag_data.prefix_length = padding_size;
12022
12023 /* Update the length for the current iteration. */
12024 left_size = padding_size;
12025 for (next_fragP = fragP;
12026 next_fragP != padding_fragP;
12027 next_fragP = next_fragP->fr_next)
12028 if (next_fragP->fr_type == rs_machine_dependent
12029 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
12030 == BRANCH_PREFIX))
12031 {
12032 if (left_size)
12033 {
12034 int max = next_fragP->tc_frag_data.max_bytes;
12035 if (max)
12036 {
12037 int size;
12038 if (max > left_size)
12039 size = left_size;
12040 else
12041 size = max;
12042 left_size -= size;
12043 next_fragP->tc_frag_data.length = size;
12044 }
12045 }
12046 else
12047 next_fragP->tc_frag_data.length = 0;
12048 }
12049
12050 return (fragP->tc_frag_data.length
12051 - fragP->tc_frag_data.last_length);
12052 }
12053 return relax_frag (segment, fragP, stretch);
12054 }
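/* Worked example (editorial): if the padding frag needs
   padding_size == 7 and is preceded by three BRANCH_PREFIX frags
   whose max_bytes are 5, 5 and 5, the loop above assigns lengths
   5, 2 and 0; that is, segment prefixes are handed out greedily to
   the earlier instructions until the padding is used up.  */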
12055
12056 /* md_estimate_size_before_relax()
12057
12058 Called just before relax() for rs_machine_dependent frags. The x86
12059 assembler uses these frags to handle variable size jump
12060 instructions.
12061
12062 Any symbol that is now undefined will not become defined.
12063 Return the correct fr_subtype in the frag.
12064 Return the initial "guess for variable size of frag" to caller.
12065 The guess is actually the growth beyond the fixed part. Whatever
12066 we do to grow the fixed or variable part contributes to our
12067 returned value. */
12068
12069 int
12070 md_estimate_size_before_relax (fragS *fragP, segT segment)
12071 {
12072 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12073 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
12074 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
12075 {
12076 i386_classify_machine_dependent_frag (fragP);
12077 return fragP->tc_frag_data.length;
12078 }
12079
12080 /* We've already got fragP->fr_subtype right; all we have to do is
12081 check for un-relaxable symbols. On an ELF system, we can't relax
12082 an externally visible symbol, because it may be overridden by a
12083 shared library. */
12084 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
12085 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12086 || (IS_ELF
12087 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
12088 fragP->fr_var))
12089 #endif
12090 #if defined (OBJ_COFF) && defined (TE_PE)
12091 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
12092 && S_IS_WEAK (fragP->fr_symbol))
12093 #endif
12094 )
12095 {
12096 /* Symbol is undefined in this segment, or we need to keep a
12097 reloc so that weak symbols can be overridden. */
12098 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
12099 enum bfd_reloc_code_real reloc_type;
12100 unsigned char *opcode;
12101 int old_fr_fix;
12102
12103 if (fragP->fr_var != NO_RELOC)
12104 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
12105 else if (size == 2)
12106 reloc_type = BFD_RELOC_16_PCREL;
12107 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12108 else if (need_plt32_p (fragP->fr_symbol))
12109 reloc_type = BFD_RELOC_X86_64_PLT32;
12110 #endif
12111 else
12112 reloc_type = BFD_RELOC_32_PCREL;
12113
12114 old_fr_fix = fragP->fr_fix;
12115 opcode = (unsigned char *) fragP->fr_opcode;
12116
12117 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
12118 {
12119 case UNCOND_JUMP:
12120 /* Make jmp (0xeb) a (d)word displacement jump. */
12121 opcode[0] = 0xe9;
12122 fragP->fr_fix += size;
12123 fix_new (fragP, old_fr_fix, size,
12124 fragP->fr_symbol,
12125 fragP->fr_offset, 1,
12126 reloc_type);
12127 break;
12128
12129 case COND_JUMP86:
12130 if (size == 2
12131 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
12132 {
12133 /* Negate the condition, and branch past an
12134 unconditional jump. */
12135 opcode[0] ^= 1;
12136 opcode[1] = 3;
12137 /* Insert an unconditional jump. */
12138 opcode[2] = 0xe9;
12139 /* We added two extra opcode bytes, and have a two byte
12140 offset. */
12141 fragP->fr_fix += 2 + 2;
12142 fix_new (fragP, old_fr_fix + 2, 2,
12143 fragP->fr_symbol,
12144 fragP->fr_offset, 1,
12145 reloc_type);
12146 break;
12147 }
12148 /* Fall through. */
12149
12150 case COND_JUMP:
12151 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
12152 {
12153 fixS *fixP;
12154
12155 fragP->fr_fix += 1;
12156 fixP = fix_new (fragP, old_fr_fix, 1,
12157 fragP->fr_symbol,
12158 fragP->fr_offset, 1,
12159 BFD_RELOC_8_PCREL);
12160 fixP->fx_signed = 1;
12161 break;
12162 }
12163
12164 /* This changes the byte-displacement jump 0x7N
12165 to the (d)word-displacement jump 0x0f,0x8N. */
12166 opcode[1] = opcode[0] + 0x10;
12167 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12168 /* We've added an opcode byte. */
12169 fragP->fr_fix += 1 + size;
12170 fix_new (fragP, old_fr_fix + 1, size,
12171 fragP->fr_symbol,
12172 fragP->fr_offset, 1,
12173 reloc_type);
12174 break;
12175
12176 default:
12177 BAD_CASE (fragP->fr_subtype);
12178 break;
12179 }
12180 frag_wane (fragP);
12181 return fragP->fr_fix - old_fr_fix;
12182 }
12183
12184 /* Guess size depending on current relax state. Initially the relax
12185 state will correspond to a short jump and we return 1, because
12186 the variable part of the frag (the branch offset) is one byte
12187 long. However, we can relax a section more than once and in that
12188 case we must either set fr_subtype back to the unrelaxed state,
12189 or return the value for the appropriate branch. */
12190 return md_relax_table[fragP->fr_subtype].rlx_length;
12191 }
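/* Editorial byte-level example: a `je' whose target needs more than
   a disp8 and cannot stay relaxable is rewritten above as

       74 cb        je  target     (byte displacement)
   ->  0F 84 cd     je  target     (dword displacement)

   since opcode[1] = 0x74 + 0x10 = 0x84 after the 0x0F escape.  In
   the 16-bit COND_JUMP86 case it instead negates the condition and
   hops over a word-displacement jump:

       75 03        jne .+5        (inverted condition, skip 3 bytes)
       E9 cw        jmp target  */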
12192
12193 /* Called after relax() is finished.
12194
12195 In: Address of frag.
12196 fr_type == rs_machine_dependent.
12197 fr_subtype is what the address relaxed to.
12198
12199 Out: Any fixSs and constants are set up.
12200 Caller will turn frag into a ".space 0". */
12201
12202 void
12203 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
12204 fragS *fragP)
12205 {
12206 unsigned char *opcode;
12207 unsigned char *where_to_put_displacement = NULL;
12208 offsetT target_address;
12209 offsetT opcode_address;
12210 unsigned int extension = 0;
12211 offsetT displacement_from_opcode_start;
12212
12213 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12214 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
12215 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12216 {
12217 /* Generate nop padding. */
12218 unsigned int size = fragP->tc_frag_data.length;
12219 if (size)
12220 {
12221 if (size > fragP->tc_frag_data.max_bytes)
12222 abort ();
12223
12224 if (flag_debug)
12225 {
12226 const char *msg;
12227 const char *branch = "branch";
12228 const char *prefix = "";
12229 fragS *padding_fragP;
12230 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
12231 == BRANCH_PREFIX)
12232 {
12233 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
12234 switch (fragP->tc_frag_data.default_prefix)
12235 {
12236 default:
12237 abort ();
12238 break;
12239 case CS_PREFIX_OPCODE:
12240 prefix = " cs";
12241 break;
12242 case DS_PREFIX_OPCODE:
12243 prefix = " ds";
12244 break;
12245 case ES_PREFIX_OPCODE:
12246 prefix = " es";
12247 break;
12248 case FS_PREFIX_OPCODE:
12249 prefix = " fs";
12250 break;
12251 case GS_PREFIX_OPCODE:
12252 prefix = " gs";
12253 break;
12254 case SS_PREFIX_OPCODE:
12255 prefix = " ss";
12256 break;
12257 }
12258 if (padding_fragP)
12259 msg = _("%s:%u: add %d%s at 0x%llx to align "
12260 "%s within %d-byte boundary\n");
12261 else
12262 msg = _("%s:%u: add additional %d%s at 0x%llx to "
12263 "align %s within %d-byte boundary\n");
12264 }
12265 else
12266 {
12267 padding_fragP = fragP;
12268 msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
12269 "%s within %d-byte boundary\n");
12270 }
12271
12272 if (padding_fragP)
12273 switch (padding_fragP->tc_frag_data.branch_type)
12274 {
12275 case align_branch_jcc:
12276 branch = "jcc";
12277 break;
12278 case align_branch_fused:
12279 branch = "fused jcc";
12280 break;
12281 case align_branch_jmp:
12282 branch = "jmp";
12283 break;
12284 case align_branch_call:
12285 branch = "call";
12286 break;
12287 case align_branch_indirect:
12288 branch = "indiret branch";
12289 break;
12290 case align_branch_ret:
12291 branch = "ret";
12292 break;
12293 default:
12294 break;
12295 }
12296
12297 fprintf (stdout, msg,
12298 fragP->fr_file, fragP->fr_line, size, prefix,
12299 (long long) fragP->fr_address, branch,
12300 1 << align_branch_power);
12301 }
12302 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12303 memset (fragP->fr_opcode,
12304 fragP->tc_frag_data.default_prefix, size);
12305 else
12306 i386_generate_nops (fragP, (char *) fragP->fr_opcode,
12307 size, 0);
12308 fragP->fr_fix += size;
12309 }
12310 return;
12311 }
12312
12313 opcode = (unsigned char *) fragP->fr_opcode;
12314
12315 /* Address we want to reach in file space. */
12316 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
12317
12318 /* Address opcode resides at in file space. */
12319 opcode_address = fragP->fr_address + fragP->fr_fix;
12320
12321 /* Displacement from opcode start to fill into instruction. */
12322 displacement_from_opcode_start = target_address - opcode_address;
12323
12324 if ((fragP->fr_subtype & BIG) == 0)
12325 {
12326 /* Don't have to change opcode. */
12327 extension = 1; /* 1 opcode + 1 displacement */
12328 where_to_put_displacement = &opcode[1];
12329 }
12330 else
12331 {
12332 if (no_cond_jump_promotion
12333 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
12334 as_warn_where (fragP->fr_file, fragP->fr_line,
12335 _("long jump required"));
12336
12337 switch (fragP->fr_subtype)
12338 {
12339 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
12340 extension = 4; /* 1 opcode + 4 displacement */
12341 opcode[0] = 0xe9;
12342 where_to_put_displacement = &opcode[1];
12343 break;
12344
12345 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
12346 extension = 2; /* 1 opcode + 2 displacement */
12347 opcode[0] = 0xe9;
12348 where_to_put_displacement = &opcode[1];
12349 break;
12350
12351 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
12352 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
12353 extension = 5; /* 2 opcode + 4 displacement */
12354 opcode[1] = opcode[0] + 0x10;
12355 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12356 where_to_put_displacement = &opcode[2];
12357 break;
12358
12359 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
12360 extension = 3; /* 2 opcode + 2 displacement */
12361 opcode[1] = opcode[0] + 0x10;
12362 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12363 where_to_put_displacement = &opcode[2];
12364 break;
12365
12366 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
12367 extension = 4;
12368 opcode[0] ^= 1;
12369 opcode[1] = 3;
12370 opcode[2] = 0xe9;
12371 where_to_put_displacement = &opcode[3];
12372 break;
12373
12374 default:
12375 BAD_CASE (fragP->fr_subtype);
12376 break;
12377 }
12378 }
12379
12380 /* If the size is less than four, we are sure that the operand fits,
12381 but if it's 4, then the displacement could be larger
12382 than +/- 2GB. */
12383 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
12384 && object_64bit
12385 && ((addressT) (displacement_from_opcode_start - extension
12386 + ((addressT) 1 << 31))
12387 > (((addressT) 2 << 31) - 1)))
12388 {
12389 as_bad_where (fragP->fr_file, fragP->fr_line,
12390 _("jump target out of range"));
12391 /* Make us emit 0. */
12392 displacement_from_opcode_start = extension;
12393 }
12394 /* Now put displacement after opcode. */
12395 md_number_to_chars ((char *) where_to_put_displacement,
12396 (valueT) (displacement_from_opcode_start - extension),
12397 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
12398 fragP->fr_fix += extension;
12399 }
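/* Worked example (editorial): for a relaxed unconditional jump,
   extension == 4 and opcode_address == fr_address + fr_fix.  With
   opcode_address 0x100 and a target of 0x200:

       displacement_from_opcode_start = 0x100
       stored disp32 = 0x100 - 4 = 0xfc

   and since the instruction ends at 0x104, the CPU computes
   0x104 + 0xfc = 0x200 as intended.  */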
12400 \f
12401 /* Apply a fixup (fixP) to segment data, once it has been determined
12402 by our caller that we have all the info we need to fix it up.
12403
12404 Parameter valP is the pointer to the value of the bits.
12405
12406 On the 386, immediates, displacements, and data pointers are all in
12407 the same (little-endian) format, so we don't need to care about which
12408 we are handling. */
12409
12410 void
12411 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
12412 {
12413 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
12414 valueT value = *valP;
12415
12416 #if !defined (TE_Mach)
12417 if (fixP->fx_pcrel)
12418 {
12419 switch (fixP->fx_r_type)
12420 {
12421 default:
12422 break;
12423
12424 case BFD_RELOC_64:
12425 fixP->fx_r_type = BFD_RELOC_64_PCREL;
12426 break;
12427 case BFD_RELOC_32:
12428 case BFD_RELOC_X86_64_32S:
12429 fixP->fx_r_type = BFD_RELOC_32_PCREL;
12430 break;
12431 case BFD_RELOC_16:
12432 fixP->fx_r_type = BFD_RELOC_16_PCREL;
12433 break;
12434 case BFD_RELOC_8:
12435 fixP->fx_r_type = BFD_RELOC_8_PCREL;
12436 break;
12437 }
12438 }
12439
12440 if (fixP->fx_addsy != NULL
12441 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
12442 || fixP->fx_r_type == BFD_RELOC_64_PCREL
12443 || fixP->fx_r_type == BFD_RELOC_16_PCREL
12444 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
12445 && !use_rela_relocations)
12446 {
12447 /* This is a hack. There should be a better way to handle this.
12448 This covers for the fact that bfd_install_relocation will
12449 subtract the current location (for partial_inplace, PC relative
12450 relocations); see more below. */
12451 #ifndef OBJ_AOUT
12452 if (IS_ELF
12453 #ifdef TE_PE
12454 || OUTPUT_FLAVOR == bfd_target_coff_flavour
12455 #endif
12456 )
12457 value += fixP->fx_where + fixP->fx_frag->fr_address;
12458 #endif
12459 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12460 if (IS_ELF)
12461 {
12462 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
12463
12464 if ((sym_seg == seg
12465 || (symbol_section_p (fixP->fx_addsy)
12466 && sym_seg != absolute_section))
12467 && !generic_force_reloc (fixP))
12468 {
12469 /* Yes, we add the values in twice. This is because
12470 bfd_install_relocation subtracts them out again. I think
12471 bfd_install_relocation is broken, but I don't dare change
12472 it. FIXME. */
12473 value += fixP->fx_where + fixP->fx_frag->fr_address;
12474 }
12475 }
12476 #endif
12477 #if defined (OBJ_COFF) && defined (TE_PE)
12478 /* For some reason, the PE format does not store a
12479 section address offset for a PC relative symbol. */
12480 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
12481 || S_IS_WEAK (fixP->fx_addsy))
12482 value += md_pcrel_from (fixP);
12483 #endif
12484 }
12485 #if defined (OBJ_COFF) && defined (TE_PE)
12486 if (fixP->fx_addsy != NULL
12487 && S_IS_WEAK (fixP->fx_addsy)
12488 /* PR 16858: Do not modify weak function references. */
12489 && ! fixP->fx_pcrel)
12490 {
12491 #if !defined (TE_PEP)
12492 /* For x86 PE weak function symbols are neither PC-relative
12493 nor do they set S_IS_FUNCTION. So the only reliable way
12494 to detect them is to check the flags of their containing
12495 section. */
12496 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
12497 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
12498 ;
12499 else
12500 #endif
12501 value -= S_GET_VALUE (fixP->fx_addsy);
12502 }
12503 #endif
12504
12505 /* Fix a few things - the dynamic linker expects certain values here,
12506 and we must not disappoint it. */
12507 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12508 if (IS_ELF && fixP->fx_addsy)
12509 switch (fixP->fx_r_type)
12510 {
12511 case BFD_RELOC_386_PLT32:
12512 case BFD_RELOC_X86_64_PLT32:
12513 /* Make the jump instruction point to the address of the operand.
12514 At runtime we merely add the offset to the actual PLT entry.
12515 NB: Subtract the offset size only for jump instructions. */
12516 if (fixP->fx_pcrel)
12517 value = -4;
12518 break;
12519
12520 case BFD_RELOC_386_TLS_GD:
12521 case BFD_RELOC_386_TLS_LDM:
12522 case BFD_RELOC_386_TLS_IE_32:
12523 case BFD_RELOC_386_TLS_IE:
12524 case BFD_RELOC_386_TLS_GOTIE:
12525 case BFD_RELOC_386_TLS_GOTDESC:
12526 case BFD_RELOC_X86_64_TLSGD:
12527 case BFD_RELOC_X86_64_TLSLD:
12528 case BFD_RELOC_X86_64_GOTTPOFF:
12529 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
12530 value = 0; /* Fully resolved at runtime. No addend. */
12531 /* Fallthrough */
12532 case BFD_RELOC_386_TLS_LE:
12533 case BFD_RELOC_386_TLS_LDO_32:
12534 case BFD_RELOC_386_TLS_LE_32:
12535 case BFD_RELOC_X86_64_DTPOFF32:
12536 case BFD_RELOC_X86_64_DTPOFF64:
12537 case BFD_RELOC_X86_64_TPOFF32:
12538 case BFD_RELOC_X86_64_TPOFF64:
12539 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12540 break;
12541
12542 case BFD_RELOC_386_TLS_DESC_CALL:
12543 case BFD_RELOC_X86_64_TLSDESC_CALL:
12544 value = 0; /* Fully resolved at runtime. No addend. */
12545 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12546 fixP->fx_done = 0;
12547 return;
12548
12549 case BFD_RELOC_VTABLE_INHERIT:
12550 case BFD_RELOC_VTABLE_ENTRY:
12551 fixP->fx_done = 0;
12552 return;
12553
12554 default:
12555 break;
12556 }
12557 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
12558 *valP = value;
12559 #endif /* !defined (TE_Mach) */
12560
12561 /* Are we finished with this relocation now? */
12562 if (fixP->fx_addsy == NULL)
12563 fixP->fx_done = 1;
12564 #if defined (OBJ_COFF) && defined (TE_PE)
12565 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
12566 {
12567 fixP->fx_done = 0;
12568 /* Remember value for tc_gen_reloc. */
12569 fixP->fx_addnumber = value;
12570 /* Clear out the frag for now. */
12571 value = 0;
12572 }
12573 #endif
12574 else if (use_rela_relocations)
12575 {
12576 fixP->fx_no_overflow = 1;
12577 /* Remember value for tc_gen_reloc. */
12578 fixP->fx_addnumber = value;
12579 value = 0;
12580 }
12581
12582 md_number_to_chars (p, value, fixP->fx_size);
12583 }
12584 \f
12585 const char *
12586 md_atof (int type, char *litP, int *sizeP)
12587 {
12588 /* This outputs the LITTLENUMs in REVERSE order,
12589 in accord with the little-endian 386. */
12590 return ieee_md_atof (type, litP, sizeP, FALSE);
12591 }
12592 \f
12593 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
12594
12595 static char *
12596 output_invalid (int c)
12597 {
12598 if (ISPRINT (c))
12599 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12600 "'%c'", c);
12601 else
12602 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12603 "(0x%x)", (unsigned char) c);
12604 return output_invalid_buf;
12605 }
12606
12607 /* Verify that @r can be used in the current context. */
12608
12609 static bfd_boolean check_register (const reg_entry *r)
12610 {
12611 if (allow_pseudo_reg)
12612 return TRUE;
12613
12614 if (operand_type_all_zero (&r->reg_type))
12615 return FALSE;
12616
12617 if ((r->reg_type.bitfield.dword
12618 || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
12619 || r->reg_type.bitfield.class == RegCR
12620 || r->reg_type.bitfield.class == RegDR)
12621 && !cpu_arch_flags.bitfield.cpui386)
12622 return FALSE;
12623
12624 if (r->reg_type.bitfield.class == RegTR
12625 && (flag_code == CODE_64BIT
12626 || !cpu_arch_flags.bitfield.cpui386
12627 || cpu_arch_isa_flags.bitfield.cpui586
12628 || cpu_arch_isa_flags.bitfield.cpui686))
12629 return FALSE;
12630
12631 if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
12632 return FALSE;
12633
12634 if (!cpu_arch_flags.bitfield.cpuavx512f)
12635 {
12636 if (r->reg_type.bitfield.zmmword
12637 || r->reg_type.bitfield.class == RegMask)
12638 return FALSE;
12639
12640 if (!cpu_arch_flags.bitfield.cpuavx)
12641 {
12642 if (r->reg_type.bitfield.ymmword)
12643 return FALSE;
12644
12645 if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
12646 return FALSE;
12647 }
12648 }
12649
12650 if (r->reg_type.bitfield.tmmword
12651 && (!cpu_arch_flags.bitfield.cpuamx_tile
12652 || flag_code != CODE_64BIT))
12653 return FALSE;
12654
12655 if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
12656 return FALSE;
12657
12658 /* Don't allow the fake index register unless allow_index_reg is non-zero. */
12659 if (!allow_index_reg && r->reg_num == RegIZ)
12660 return FALSE;
12661
12662 /* Upper 16 vector registers are only available with VREX in 64bit
12663 mode, and require EVEX encoding. */
12664 if (r->reg_flags & RegVRex)
12665 {
12666 if (!cpu_arch_flags.bitfield.cpuavx512f
12667 || flag_code != CODE_64BIT)
12668 return FALSE;
12669
12670 if (i.vec_encoding == vex_encoding_default)
12671 i.vec_encoding = vex_encoding_evex;
12672 else if (i.vec_encoding != vex_encoding_evex)
12673 i.vec_encoding = vex_encoding_error;
12674 }
12675
12676 if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
12677 && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
12678 && flag_code != CODE_64BIT)
12679 return FALSE;
12680
12681 if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
12682 && !intel_syntax)
12683 return FALSE;
12684
12685 return TRUE;
12686 }
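/* Editorial sketch, not part of the original file: how the VREX
   rule above plays out for a caller.  Assumes XMM16 is a reg_entry
   with RegVRex set and that i.vec_encoding started out as
   vex_encoding_default; the guard macro is hypothetical.  */
#ifdef CHECK_REGISTER_EXAMPLE
static void
check_register_example (const reg_entry *xmm16)
{
  if (flag_code != CODE_64BIT || !cpu_arch_flags.bitfield.cpuavx512f)
    /* %xmm16..%xmm31 are rejected outside 64-bit AVX512F mode.  */
    gas_assert (!check_register (xmm16));
  else
    {
      /* Accepted, and the default encoding is upgraded to EVEX
	 as a side effect.  */
      gas_assert (check_register (xmm16));
      gas_assert (i.vec_encoding == vex_encoding_evex);
    }
}
#endif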
12687
12688 /* REG_STRING starts *before* REGISTER_PREFIX. */
12689
12690 static const reg_entry *
12691 parse_real_register (char *reg_string, char **end_op)
12692 {
12693 char *s = reg_string;
12694 char *p;
12695 char reg_name_given[MAX_REG_NAME_SIZE + 1];
12696 const reg_entry *r;
12697
12698 /* Skip possible REGISTER_PREFIX and possible whitespace. */
12699 if (*s == REGISTER_PREFIX)
12700 ++s;
12701
12702 if (is_space_char (*s))
12703 ++s;
12704
12705 p = reg_name_given;
12706 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
12707 {
12708 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
12709 return (const reg_entry *) NULL;
12710 s++;
12711 }
12712
12713 /* For naked regs, make sure that we are not dealing with an identifier.
12714 This prevents confusing an identifier like `eax_var' with register
12715 `eax'. */
12716 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
12717 return (const reg_entry *) NULL;
12718
12719 *end_op = s;
12720
12721 r = (const reg_entry *) str_hash_find (reg_hash, reg_name_given);
12722
12723 /* Handle floating point regs, allowing spaces in the (i) part. */
12724 if (r == i386_regtab /* %st is first entry of table */)
12725 {
12726 if (!cpu_arch_flags.bitfield.cpu8087
12727 && !cpu_arch_flags.bitfield.cpu287
12728 && !cpu_arch_flags.bitfield.cpu387
12729 && !allow_pseudo_reg)
12730 return (const reg_entry *) NULL;
12731
12732 if (is_space_char (*s))
12733 ++s;
12734 if (*s == '(')
12735 {
12736 ++s;
12737 if (is_space_char (*s))
12738 ++s;
12739 if (*s >= '0' && *s <= '7')
12740 {
12741 int fpr = *s - '0';
12742 ++s;
12743 if (is_space_char (*s))
12744 ++s;
12745 if (*s == ')')
12746 {
12747 *end_op = s + 1;
12748 r = (const reg_entry *) str_hash_find (reg_hash, "st(0)");
12749 know (r);
12750 return r + fpr;
12751 }
12752 }
12753 /* We have "%st(" then garbage. */
12754 return (const reg_entry *) NULL;
12755 }
12756 }
12757
12758 return r && check_register (r) ? r : NULL;
12759 }
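/* Editorial examples, not from the original source: `%st' alone
   yields the first table entry, while `%st ( 3 )' (spaces are
   allowed around the index) resolves to st(3) by indexing three
   entries past the "st(0)" hash entry.  Malformed forms such as
   `%st(8)' or `%st(x)' take the "garbage" path and return NULL.  */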
12760
12761 /* REG_STRING starts *before* REGISTER_PREFIX. */
12762
12763 static const reg_entry *
12764 parse_register (char *reg_string, char **end_op)
12765 {
12766 const reg_entry *r;
12767
12768 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
12769 r = parse_real_register (reg_string, end_op);
12770 else
12771 r = NULL;
12772 if (!r)
12773 {
12774 char *save = input_line_pointer;
12775 char c;
12776 symbolS *symbolP;
12777
12778 input_line_pointer = reg_string;
12779 c = get_symbol_name (&reg_string);
12780 symbolP = symbol_find (reg_string);
12781 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
12782 {
12783 const expressionS *e = symbol_get_value_expression (symbolP);
12784
12785 know (e->X_op == O_register);
12786 know (e->X_add_number >= 0
12787 && (valueT) e->X_add_number < i386_regtab_size);
12788 r = i386_regtab + e->X_add_number;
12789 if (!check_register (r))
12790 {
12791 as_bad (_("register '%s%s' cannot be used here"),
12792 register_prefix, r->reg_name);
12793 r = &bad_reg;
12794 }
12795 *end_op = input_line_pointer;
12796 }
12797 *input_line_pointer = c;
12798 input_line_pointer = save;
12799 }
12800 return r;
12801 }
12802
12803 int
12804 i386_parse_name (char *name, expressionS *e, char *nextcharP)
12805 {
12806 const reg_entry *r;
12807 char *end = input_line_pointer;
12808
12809 *end = *nextcharP;
12810 r = parse_register (name, &input_line_pointer);
12811 if (r && end <= input_line_pointer)
12812 {
12813 *nextcharP = *input_line_pointer;
12814 *input_line_pointer = 0;
12815 if (r != &bad_reg)
12816 {
12817 e->X_op = O_register;
12818 e->X_add_number = r - i386_regtab;
12819 }
12820 else
12821 e->X_op = O_illegal;
12822 return 1;
12823 }
12824 input_line_pointer = end;
12825 *end = 0;
12826 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
12827 }
12828
12829 void
12830 md_operand (expressionS *e)
12831 {
12832 char *end;
12833 const reg_entry *r;
12834
12835 switch (*input_line_pointer)
12836 {
12837 case REGISTER_PREFIX:
12838 r = parse_real_register (input_line_pointer, &end);
12839 if (r)
12840 {
12841 e->X_op = O_register;
12842 e->X_add_number = r - i386_regtab;
12843 input_line_pointer = end;
12844 }
12845 break;
12846
12847 case '[':
12848 gas_assert (intel_syntax);
12849 end = input_line_pointer++;
12850 expression (e);
12851 if (*input_line_pointer == ']')
12852 {
12853 ++input_line_pointer;
12854 e->X_op_symbol = make_expr_symbol (e);
12855 e->X_add_symbol = NULL;
12856 e->X_add_number = 0;
12857 e->X_op = O_index;
12858 }
12859 else
12860 {
12861 e->X_op = O_absent;
12862 input_line_pointer = end;
12863 }
12864 break;
12865 }
12866 }
12867
12868 \f
12869 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12870 const char *md_shortopts = "kVQ:sqnO::";
12871 #else
12872 const char *md_shortopts = "qnO::";
12873 #endif
12874
12875 #define OPTION_32 (OPTION_MD_BASE + 0)
12876 #define OPTION_64 (OPTION_MD_BASE + 1)
12877 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
12878 #define OPTION_MARCH (OPTION_MD_BASE + 3)
12879 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
12880 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
12881 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
12882 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
12883 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
12884 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
12885 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
12886 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
12887 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
12888 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
12889 #define OPTION_X32 (OPTION_MD_BASE + 14)
12890 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
12891 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
12892 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
12893 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
12894 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
12895 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
12896 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
12897 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
12898 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
12899 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
12900 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
12901 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
12902 #define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
12903 #define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
12904 #define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
12905 #define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
12906 #define OPTION_MLFENCE_AFTER_LOAD (OPTION_MD_BASE + 31)
12907 #define OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH (OPTION_MD_BASE + 32)
12908 #define OPTION_MLFENCE_BEFORE_RET (OPTION_MD_BASE + 33)
12909
12910 struct option md_longopts[] =
12911 {
12912 {"32", no_argument, NULL, OPTION_32},
12913 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12914 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12915 {"64", no_argument, NULL, OPTION_64},
12916 #endif
12917 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12918 {"x32", no_argument, NULL, OPTION_X32},
12919 {"mshared", no_argument, NULL, OPTION_MSHARED},
12920 {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
12921 #endif
12922 {"divide", no_argument, NULL, OPTION_DIVIDE},
12923 {"march", required_argument, NULL, OPTION_MARCH},
12924 {"mtune", required_argument, NULL, OPTION_MTUNE},
12925 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
12926 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
12927 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
12928 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
12929 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
12930 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
12931 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
12932 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
12933 {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
12934 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
12935 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
12936 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
12937 # if defined (TE_PE) || defined (TE_PEP)
12938 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
12939 #endif
12940 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
12941 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
12942 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
12943 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
12944 {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
12945 {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
12946 {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
12947 {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
12948 {"mlfence-after-load", required_argument, NULL, OPTION_MLFENCE_AFTER_LOAD},
12949 {"mlfence-before-indirect-branch", required_argument, NULL,
12950 OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH},
12951 {"mlfence-before-ret", required_argument, NULL, OPTION_MLFENCE_BEFORE_RET},
12952 {"mamd64", no_argument, NULL, OPTION_MAMD64},
12953 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
12954 {NULL, no_argument, NULL, 0}
12955 };
12956 size_t md_longopts_size = sizeof (md_longopts);
12957
12958 int
12959 md_parse_option (int c, const char *arg)
12960 {
12961 unsigned int j;
12962 char *arch, *next, *saved, *type;
12963
12964 switch (c)
12965 {
12966 case 'n':
12967 optimize_align_code = 0;
12968 break;
12969
12970 case 'q':
12971 quiet_warnings = 1;
12972 break;
12973
12974 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12975 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
12976 should be emitted or not. FIXME: Not implemented. */
12977 case 'Q':
12978 if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
12979 return 0;
12980 break;
12981
12982 /* -V: SVR4 argument to print version ID. */
12983 case 'V':
12984 print_version_id ();
12985 break;
12986
12987 /* -k: Ignore for FreeBSD compatibility. */
12988 case 'k':
12989 break;
12990
12991 case 's':
12992 /* -s: On i386 Solaris, this tells the native assembler to use
12993 .stab instead of .stab.excl. We always use .stab anyhow. */
12994 break;
12995
12996 case OPTION_MSHARED:
12997 shared = 1;
12998 break;
12999
13000 case OPTION_X86_USED_NOTE:
13001 if (strcasecmp (arg, "yes") == 0)
13002 x86_used_note = 1;
13003 else if (strcasecmp (arg, "no") == 0)
13004 x86_used_note = 0;
13005 else
13006 as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
13007 break;
13008
13009
13010 #endif
13011 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13012 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
13013 case OPTION_64:
13014 {
13015 const char **list, **l;
13016
13017 list = bfd_target_list ();
13018 for (l = list; *l != NULL; l++)
13019 if (CONST_STRNEQ (*l, "elf64-x86-64")
13020 || strcmp (*l, "coff-x86-64") == 0
13021 || strcmp (*l, "pe-x86-64") == 0
13022 || strcmp (*l, "pei-x86-64") == 0
13023 || strcmp (*l, "mach-o-x86-64") == 0)
13024 {
13025 default_arch = "x86_64";
13026 break;
13027 }
13028 if (*l == NULL)
13029 as_fatal (_("no compiled in support for x86_64"));
13030 free (list);
13031 }
13032 break;
13033 #endif
13034
13035 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13036 case OPTION_X32:
13037 if (IS_ELF)
13038 {
13039 const char **list, **l;
13040
13041 list = bfd_target_list ();
13042 for (l = list; *l != NULL; l++)
13043 if (CONST_STRNEQ (*l, "elf32-x86-64"))
13044 {
13045 default_arch = "x86_64:32";
13046 break;
13047 }
13048 if (*l == NULL)
13049 as_fatal (_("no compiled in support for 32bit x86_64"));
13050 free (list);
13051 }
13052 else
13053 as_fatal (_("32bit x86_64 is only supported for ELF"));
13054 break;
13055 #endif
13056
13057 case OPTION_32:
13058 default_arch = "i386";
13059 break;
13060
13061 case OPTION_DIVIDE:
13062 #ifdef SVR4_COMMENT_CHARS
13063 {
13064 char *n, *t;
13065 const char *s;
13066
13067 n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
13068 t = n;
13069 for (s = i386_comment_chars; *s != '\0'; s++)
13070 if (*s != '/')
13071 *t++ = *s;
13072 *t = '\0';
13073 i386_comment_chars = n;
13074 }
13075 #endif
13076 break;
13077
13078 case OPTION_MARCH:
13079 saved = xstrdup (arg);
13080 arch = saved;
13081 /* Allow -march=+nosse. */
13082 if (*arch == '+')
13083 arch++;
13084 do
13085 {
13086 if (*arch == '.')
13087 as_fatal (_("invalid -march= option: `%s'"), arg);
13088 next = strchr (arch, '+');
13089 if (next)
13090 *next++ = '\0';
13091 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13092 {
13093 if (strcmp (arch, cpu_arch [j].name) == 0)
13094 {
13095 /* Processor. */
13096 if (! cpu_arch[j].flags.bitfield.cpui386)
13097 continue;
13098
13099 cpu_arch_name = cpu_arch[j].name;
13100 cpu_sub_arch_name = NULL;
13101 cpu_arch_flags = cpu_arch[j].flags;
13102 cpu_arch_isa = cpu_arch[j].type;
13103 cpu_arch_isa_flags = cpu_arch[j].flags;
13104 if (!cpu_arch_tune_set)
13105 {
13106 cpu_arch_tune = cpu_arch_isa;
13107 cpu_arch_tune_flags = cpu_arch_isa_flags;
13108 }
13109 break;
13110 }
13111 else if (*cpu_arch [j].name == '.'
13112 && strcmp (arch, cpu_arch [j].name + 1) == 0)
13113 {
13114 /* ISA extension. */
13115 i386_cpu_flags flags;
13116
13117 flags = cpu_flags_or (cpu_arch_flags,
13118 cpu_arch[j].flags);
13119
13120 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
13121 {
13122 if (cpu_sub_arch_name)
13123 {
13124 char *name = cpu_sub_arch_name;
13125 cpu_sub_arch_name = concat (name,
13126 cpu_arch[j].name,
13127 (const char *) NULL);
13128 free (name);
13129 }
13130 else
13131 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
13132 cpu_arch_flags = flags;
13133 cpu_arch_isa_flags = flags;
13134 }
13135 else
13136 cpu_arch_isa_flags
13137 = cpu_flags_or (cpu_arch_isa_flags,
13138 cpu_arch[j].flags);
13139 break;
13140 }
13141 }
13142
13143 if (j >= ARRAY_SIZE (cpu_arch))
13144 {
13145 /* Disable an ISA extension. */
13146 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
13147 if (strcmp (arch, cpu_noarch [j].name) == 0)
13148 {
13149 i386_cpu_flags flags;
13150
13151 flags = cpu_flags_and_not (cpu_arch_flags,
13152 cpu_noarch[j].flags);
13153 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
13154 {
13155 if (cpu_sub_arch_name)
13156 {
13157 char *name = cpu_sub_arch_name;
13158 cpu_sub_arch_name = concat (name, arch,
13159 (const char *) NULL);
13160 free (name);
13161 }
13162 else
13163 cpu_sub_arch_name = xstrdup (arch);
13164 cpu_arch_flags = flags;
13165 cpu_arch_isa_flags = flags;
13166 }
13167 break;
13168 }
13169
13170 if (j >= ARRAY_SIZE (cpu_noarch))
13171 j = ARRAY_SIZE (cpu_arch);
13172 }
13173
13174 if (j >= ARRAY_SIZE (cpu_arch))
13175 as_fatal (_("invalid -march= option: `%s'"), arg);
13176
13177 arch = next;
13178 }
13179 while (next != NULL);
13180 free (saved);
13181 break;
13182
13183 case OPTION_MTUNE:
13184 if (*arg == '.')
13185 as_fatal (_("invalid -mtune= option: `%s'"), arg);
13186 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13187 {
13188 if (strcmp (arg, cpu_arch [j].name) == 0)
13189 {
13190 cpu_arch_tune_set = 1;
13191 cpu_arch_tune = cpu_arch [j].type;
13192 cpu_arch_tune_flags = cpu_arch[j].flags;
13193 break;
13194 }
13195 }
13196 if (j >= ARRAY_SIZE (cpu_arch))
13197 as_fatal (_("invalid -mtune= option: `%s'"), arg);
13198 break;
13199
13200 case OPTION_MMNEMONIC:
13201 if (strcasecmp (arg, "att") == 0)
13202 intel_mnemonic = 0;
13203 else if (strcasecmp (arg, "intel") == 0)
13204 intel_mnemonic = 1;
13205 else
13206 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
13207 break;
13208
13209 case OPTION_MSYNTAX:
13210 if (strcasecmp (arg, "att") == 0)
13211 intel_syntax = 0;
13212 else if (strcasecmp (arg, "intel") == 0)
13213 intel_syntax = 1;
13214 else
13215 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
13216 break;
13217
13218 case OPTION_MINDEX_REG:
13219 allow_index_reg = 1;
13220 break;
13221
13222 case OPTION_MNAKED_REG:
13223 allow_naked_reg = 1;
13224 break;
13225
13226 case OPTION_MSSE2AVX:
13227 sse2avx = 1;
13228 break;
13229
13230 case OPTION_MSSE_CHECK:
13231 if (strcasecmp (arg, "error") == 0)
13232 sse_check = check_error;
13233 else if (strcasecmp (arg, "warning") == 0)
13234 sse_check = check_warning;
13235 else if (strcasecmp (arg, "none") == 0)
13236 sse_check = check_none;
13237 else
13238 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
13239 break;
13240
13241 case OPTION_MOPERAND_CHECK:
13242 if (strcasecmp (arg, "error") == 0)
13243 operand_check = check_error;
13244 else if (strcasecmp (arg, "warning") == 0)
13245 operand_check = check_warning;
13246 else if (strcasecmp (arg, "none") == 0)
13247 operand_check = check_none;
13248 else
13249 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
13250 break;
13251
13252 case OPTION_MAVXSCALAR:
13253 if (strcasecmp (arg, "128") == 0)
13254 avxscalar = vex128;
13255 else if (strcasecmp (arg, "256") == 0)
13256 avxscalar = vex256;
13257 else
13258 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
13259 break;
13260
13261 case OPTION_MVEXWIG:
13262 if (strcmp (arg, "0") == 0)
13263 vexwig = vexw0;
13264 else if (strcmp (arg, "1") == 0)
13265 vexwig = vexw1;
13266 else
13267 as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
13268 break;
13269
13270 case OPTION_MADD_BND_PREFIX:
13271 add_bnd_prefix = 1;
13272 break;
13273
13274 case OPTION_MEVEXLIG:
13275 if (strcmp (arg, "128") == 0)
13276 evexlig = evexl128;
13277 else if (strcmp (arg, "256") == 0)
13278 evexlig = evexl256;
13279 else if (strcmp (arg, "512") == 0)
13280 evexlig = evexl512;
13281 else
13282 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
13283 break;
13284
13285 case OPTION_MEVEXRCIG:
13286 if (strcmp (arg, "rne") == 0)
13287 evexrcig = rne;
13288 else if (strcmp (arg, "rd") == 0)
13289 evexrcig = rd;
13290 else if (strcmp (arg, "ru") == 0)
13291 evexrcig = ru;
13292 else if (strcmp (arg, "rz") == 0)
13293 evexrcig = rz;
13294 else
13295 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
13296 break;
13297
13298 case OPTION_MEVEXWIG:
13299 if (strcmp (arg, "0") == 0)
13300 evexwig = evexw0;
13301 else if (strcmp (arg, "1") == 0)
13302 evexwig = evexw1;
13303 else
13304 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
13305 break;
13306
13307 # if defined (TE_PE) || defined (TE_PEP)
13308 case OPTION_MBIG_OBJ:
13309 use_big_obj = 1;
13310 break;
13311 #endif
13312
13313 case OPTION_MOMIT_LOCK_PREFIX:
13314 if (strcasecmp (arg, "yes") == 0)
13315 omit_lock_prefix = 1;
13316 else if (strcasecmp (arg, "no") == 0)
13317 omit_lock_prefix = 0;
13318 else
13319 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
13320 break;
13321
13322 case OPTION_MFENCE_AS_LOCK_ADD:
13323 if (strcasecmp (arg, "yes") == 0)
13324 avoid_fence = 1;
13325 else if (strcasecmp (arg, "no") == 0)
13326 avoid_fence = 0;
13327 else
13328 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
13329 break;
13330
13331 case OPTION_MLFENCE_AFTER_LOAD:
13332 if (strcasecmp (arg, "yes") == 0)
13333 lfence_after_load = 1;
13334 else if (strcasecmp (arg, "no") == 0)
13335 lfence_after_load = 0;
13336 else
13337 as_fatal (_("invalid -mlfence-after-load= option: `%s'"), arg);
13338 break;
13339
13340 case OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH:
13341 if (strcasecmp (arg, "all") == 0)
13342 {
13343 lfence_before_indirect_branch = lfence_branch_all;
13344 if (lfence_before_ret == lfence_before_ret_none)
13345 lfence_before_ret = lfence_before_ret_shl;
13346 }
13347 else if (strcasecmp (arg, "memory") == 0)
13348 lfence_before_indirect_branch = lfence_branch_memory;
13349 else if (strcasecmp (arg, "register") == 0)
13350 lfence_before_indirect_branch = lfence_branch_register;
13351 else if (strcasecmp (arg, "none") == 0)
13352 lfence_before_indirect_branch = lfence_branch_none;
13353 else
13354 as_fatal (_("invalid -mlfence-before-indirect-branch= option: `%s'"),
13355 arg);
13356 break;
13357
13358 case OPTION_MLFENCE_BEFORE_RET:
13359 if (strcasecmp (arg, "or") == 0)
13360 lfence_before_ret = lfence_before_ret_or;
13361 else if (strcasecmp (arg, "not") == 0)
13362 lfence_before_ret = lfence_before_ret_not;
13363 else if (strcasecmp (arg, "shl") == 0 || strcasecmp (arg, "yes") == 0)
13364 lfence_before_ret = lfence_before_ret_shl;
13365 else if (strcasecmp (arg, "none") == 0)
13366 lfence_before_ret = lfence_before_ret_none;
13367 else
13368 as_fatal (_("invalid -mlfence-before-ret= option: `%s'"),
13369 arg);
13370 break;
13371
13372 case OPTION_MRELAX_RELOCATIONS:
13373 if (strcasecmp (arg, "yes") == 0)
13374 generate_relax_relocations = 1;
13375 else if (strcasecmp (arg, "no") == 0)
13376 generate_relax_relocations = 0;
13377 else
13378 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
13379 break;
13380
13381 case OPTION_MALIGN_BRANCH_BOUNDARY:
13382 {
13383 char *end;
13384 long int align = strtoul (arg, &end, 0);
13385 if (*end == '\0')
13386 {
13387 if (align == 0)
13388 {
13389 align_branch_power = 0;
13390 break;
13391 }
13392 else if (align >= 16)
13393 {
13394 int align_power;
13395 for (align_power = 0;
13396 (align & 1) == 0;
13397 align >>= 1, align_power++)
13398 continue;
13399 /* Limit alignment power to 31. */
13400 if (align == 1 && align_power < 32)
13401 {
13402 align_branch_power = align_power;
13403 break;
13404 }
13405 }
13406 }
13407 as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
13408 }
13409 break;
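/* Worked example (editorial): -malign-branch-boundary=32 shifts 32
   right until the low bit is set (32 -> 16 -> 8 -> 4 -> 2 -> 1),
   ending with align == 1 and align_power == 5, so
   align_branch_power = 5.  A non-power-of-two such as 48 stops at
   align == 3 and is rejected with as_fatal.  */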
13410
13411 case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
13412 {
13413 char *end;
13414 int align = strtoul (arg, &end, 0);
13415 /* Some processors only support 5 prefixes. */
13416 if (*end == '\0' && align >= 0 && align < 6)
13417 {
13418 align_branch_prefix_size = align;
13419 break;
13420 }
13421 as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
13422 arg);
13423 }
13424 break;
13425
13426 case OPTION_MALIGN_BRANCH:
13427 align_branch = 0;
13428 saved = xstrdup (arg);
13429 type = saved;
13430 do
13431 {
13432 next = strchr (type, '+');
13433 if (next)
13434 *next++ = '\0';
13435 if (strcasecmp (type, "jcc") == 0)
13436 align_branch |= align_branch_jcc_bit;
13437 else if (strcasecmp (type, "fused") == 0)
13438 align_branch |= align_branch_fused_bit;
13439 else if (strcasecmp (type, "jmp") == 0)
13440 align_branch |= align_branch_jmp_bit;
13441 else if (strcasecmp (type, "call") == 0)
13442 align_branch |= align_branch_call_bit;
13443 else if (strcasecmp (type, "ret") == 0)
13444 align_branch |= align_branch_ret_bit;
13445 else if (strcasecmp (type, "indirect") == 0)
13446 align_branch |= align_branch_indirect_bit;
13447 else
13448 as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
13449 type = next;
13450 }
13451 while (next != NULL);
13452 free (saved);
13453 break;
13454
13455 case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
13456 align_branch_power = 5;
13457 align_branch_prefix_size = 5;
13458 align_branch = (align_branch_jcc_bit
13459 | align_branch_fused_bit
13460 | align_branch_jmp_bit);
13461 break;
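/* Illustration only: given the three assignments above (2**5 == 32),
   the single option

       -mbranches-within-32B-boundaries

   behaves like the combination
       -malign-branch-boundary=32 -malign-branch=jcc+fused+jmp
       -malign-branch-prefix-size=5.  */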
13462
13463 case OPTION_MAMD64:
13464 isa64 = amd64;
13465 break;
13466
13467 case OPTION_MINTEL64:
13468 isa64 = intel64;
13469 break;
13470
13471 case 'O':
13472 if (arg == NULL)
13473 {
13474 optimize = 1;
13475 /* Turn off -Os. */
13476 optimize_for_space = 0;
13477 }
13478 else if (*arg == 's')
13479 {
13480 optimize_for_space = 1;
13481 /* Turn on all encoding optimizations. */
13482 optimize = INT_MAX;
13483 }
13484 else
13485 {
13486 optimize = atoi (arg);
13487 /* Turn off -Os. */
13488 optimize_for_space = 0;
13489 }
13490 break;
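/* Examples (illustration only): a bare -O sets optimize = 1 with -Os
   turned off; -O2 sets optimize = atoi ("2") == 2; -Os enables every
   encoding optimization (optimize = INT_MAX) and additionally sets
   optimize_for_space so the smaller of equivalent encodings wins.  */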
13491
13492 default:
13493 return 0;
13494 }
13495 return 1;
13496 }
13497
13498 #define MESSAGE_TEMPLATE \
13499 " "
13500
13501 static char *
13502 output_message (FILE *stream, char *p, char *message, char *start,
13503 int *left_p, const char *name, int len)
13504 {
13505 int size = sizeof (MESSAGE_TEMPLATE);
13506 int left = *left_p;
13507
13508 /* Reserve 2 spaces for ", " or ",\0".  */
13509 left -= len + 2;
13510
13511 /* Check if there is any room. */
13512 if (left >= 0)
13513 {
13514 if (p != start)
13515 {
13516 *p++ = ',';
13517 *p++ = ' ';
13518 }
13519 p = mempcpy (p, name, len);
13520 }
13521 else
13522 {
13523 /* Output the current message now and start a new one. */
13524 *p++ = ',';
13525 *p = '\0';
13526 fprintf (stream, "%s\n", message);
13527 p = start;
13528 left = size - (start - message) - len - 2;
13529
13530 gas_assert (left >= 0);
13531
13532 p = mempcpy (p, name, len);
13533 }
13534
13535 *left_p = left;
13536 return p;
13537 }
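/* Sketch of the intended use (hypothetical values): with MESSAGE and
   START set up as in show_arch below, a sequence of calls such as

       p = output_message (stream, p, message, start, &left, "i386", 4);
       p = output_message (stream, p, message, start, &left, "i486", 4);

   appends ", i486" while the current line has room, and otherwise
   flushes the line to STREAM and restarts the message at START.  */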
13538
13539 static void
13540 show_arch (FILE *stream, int ext, int check)
13541 {
13542 static char message[] = MESSAGE_TEMPLATE;
13543 char *start = message + 27;
13544 char *p;
13545 int size = sizeof (MESSAGE_TEMPLATE);
13546 int left;
13547 const char *name;
13548 int len;
13549 unsigned int j;
13550
13551 p = start;
13552 left = size - (start - message);
13553 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13554 {
13555 /* Should it be skipped? */
13556 if (cpu_arch [j].skip)
13557 continue;
13558
13559 name = cpu_arch [j].name;
13560 len = cpu_arch [j].len;
13561 if (*name == '.')
13562 {
13563 /* It is an extension. Skip if we aren't asked to show it. */
13564 if (ext)
13565 {
13566 name++;
13567 len--;
13568 }
13569 else
13570 continue;
13571 }
13572 else if (ext)
13573 {
13574 /* It is a processor.  Skip it if only extensions are to be shown.  */
13575 continue;
13576 }
13577 else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
13578 {
13579 /* It is an impossible processor - skip. */
13580 continue;
13581 }
13582
13583 p = output_message (stream, p, message, start, &left, name, len);
13584 }
13585
13586 /* Display disabled extensions. */
13587 if (ext)
13588 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
13589 {
13590 name = cpu_noarch [j].name;
13591 len = cpu_noarch [j].len;
13592 p = output_message (stream, p, message, start, &left, name,
13593 len);
13594 }
13595
13596 *p = '\0';
13597 fprintf (stream, "%s\n", message);
13598 }
13599
13600 void
13601 md_show_usage (FILE *stream)
13602 {
13603 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13604 fprintf (stream, _("\
13605 -Qy, -Qn ignored\n\
13606 -V print assembler version number\n\
13607 -k ignored\n"));
13608 #endif
13609 fprintf (stream, _("\
13610 -n Do not optimize code alignment\n\
13611 -q quieten some warnings\n"));
13612 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13613 fprintf (stream, _("\
13614 -s ignored\n"));
13615 #endif
13616 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13617 || defined (TE_PE) || defined (TE_PEP))
13618 fprintf (stream, _("\
13619 --32/--64/--x32 generate 32bit/64bit/x32 code\n"));
13620 #endif
13621 #ifdef SVR4_COMMENT_CHARS
13622 fprintf (stream, _("\
13623 --divide do not treat `/' as a comment character\n"));
13624 #else
13625 fprintf (stream, _("\
13626 --divide ignored\n"));
13627 #endif
13628 fprintf (stream, _("\
13629 -march=CPU[,+EXTENSION...]\n\
13630 generate code for CPU and EXTENSION, CPU is one of:\n"));
13631 show_arch (stream, 0, 1);
13632 fprintf (stream, _("\
13633 EXTENSION is combination of:\n"));
13634 show_arch (stream, 1, 0);
13635 fprintf (stream, _("\
13636 -mtune=CPU optimize for CPU, CPU is one of:\n"));
13637 show_arch (stream, 0, 0);
13638 fprintf (stream, _("\
13639 -msse2avx encode SSE instructions with VEX prefix\n"));
13640 fprintf (stream, _("\
13641 -msse-check=[none|error|warning] (default: warning)\n\
13642 check SSE instructions\n"));
13643 fprintf (stream, _("\
13644 -moperand-check=[none|error|warning] (default: warning)\n\
13645 check operand combinations for validity\n"));
13646 fprintf (stream, _("\
13647 -mavxscalar=[128|256] (default: 128)\n\
13648 encode scalar AVX instructions with specific vector\n\
13649 length\n"));
13650 fprintf (stream, _("\
13651 -mvexwig=[0|1] (default: 0)\n\
13652 encode VEX instructions with specific VEX.W value\n\
13653 for VEX.W bit ignored instructions\n"));
13654 fprintf (stream, _("\
13655 -mevexlig=[128|256|512] (default: 128)\n\
13656 encode scalar EVEX instructions with specific vector\n\
13657 length\n"));
13658 fprintf (stream, _("\
13659 -mevexwig=[0|1] (default: 0)\n\
13660 encode EVEX instructions with specific EVEX.W value\n\
13661 for EVEX.W bit ignored instructions\n"));
13662 fprintf (stream, _("\
13663 -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
13664 encode EVEX instructions with specific EVEX.RC value\n\
13665 for SAE-only ignored instructions\n"));
13666 fprintf (stream, _("\
13667 -mmnemonic=[att|intel] "));
13668 if (SYSV386_COMPAT)
13669 fprintf (stream, _("(default: att)\n"));
13670 else
13671 fprintf (stream, _("(default: intel)\n"));
13672 fprintf (stream, _("\
13673 use AT&T/Intel mnemonic\n"));
13674 fprintf (stream, _("\
13675 -msyntax=[att|intel] (default: att)\n\
13676 use AT&T/Intel syntax\n"));
13677 fprintf (stream, _("\
13678 -mindex-reg support pseudo index registers\n"));
13679 fprintf (stream, _("\
13680 -mnaked-reg don't require `%%' prefix for registers\n"));
13681 fprintf (stream, _("\
13682 -madd-bnd-prefix add BND prefix for all valid branches\n"));
13683 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13684 fprintf (stream, _("\
13685 -mshared disable branch optimization for shared code\n"));
13686 fprintf (stream, _("\
13687 -mx86-used-note=[no|yes] "));
13688 if (DEFAULT_X86_USED_NOTE)
13689 fprintf (stream, _("(default: yes)\n"));
13690 else
13691 fprintf (stream, _("(default: no)\n"));
13692 fprintf (stream, _("\
13693 generate x86 used ISA and feature properties\n"));
13694 #endif
13695 #if defined (TE_PE) || defined (TE_PEP)
13696 fprintf (stream, _("\
13697 -mbig-obj generate big object files\n"));
13698 #endif
13699 fprintf (stream, _("\
13700 -momit-lock-prefix=[no|yes] (default: no)\n\
13701 strip all lock prefixes\n"));
13702 fprintf (stream, _("\
13703 -mfence-as-lock-add=[no|yes] (default: no)\n\
13704 encode lfence, mfence and sfence as\n\
13705 lock addl $0x0, (%%{re}sp)\n"));
13706 fprintf (stream, _("\
13707 -mrelax-relocations=[no|yes] "));
13708 if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
13709 fprintf (stream, _("(default: yes)\n"));
13710 else
13711 fprintf (stream, _("(default: no)\n"));
13712 fprintf (stream, _("\
13713 generate relax relocations\n"));
13714 fprintf (stream, _("\
13715 -malign-branch-boundary=NUM (default: 0)\n\
13716 align branches within NUM byte boundary\n"));
13717 fprintf (stream, _("\
13718 -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
13719 TYPE is combination of jcc, fused, jmp, call, ret,\n\
13720 indirect\n\
13721 specify types of branches to align\n"));
13722 fprintf (stream, _("\
13723 -malign-branch-prefix-size=NUM (default: 5)\n\
13724 align branches with NUM prefixes per instruction\n"));
13725 fprintf (stream, _("\
13726 -mbranches-within-32B-boundaries\n\
13727 align branches within 32 byte boundary\n"));
13728 fprintf (stream, _("\
13729 -mlfence-after-load=[no|yes] (default: no)\n\
13730 generate lfence after load\n"));
13731 fprintf (stream, _("\
13732 -mlfence-before-indirect-branch=[none|all|register|memory] (default: none)\n\
13733 generate lfence before indirect near branch\n"));
13734 fprintf (stream, _("\
13735 -mlfence-before-ret=[none|or|not|shl|yes] (default: none)\n\
13736 generate lfence before ret\n"));
13737 fprintf (stream, _("\
13738 -mamd64 accept only AMD64 ISA [default]\n"));
13739 fprintf (stream, _("\
13740 -mintel64 accept only Intel64 ISA\n"));
13741 }
13742
13743 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
13744 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13745 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
13746
13747 /* Pick the target format to use. */
13748
13749 const char *
13750 i386_target_format (void)
13751 {
13752 if (!strncmp (default_arch, "x86_64", 6))
13753 {
13754 update_code_flag (CODE_64BIT, 1);
13755 if (default_arch[6] == '\0')
13756 x86_elf_abi = X86_64_ABI;
13757 else
13758 x86_elf_abi = X86_64_X32_ABI;
13759 }
13760 else if (!strcmp (default_arch, "i386"))
13761 update_code_flag (CODE_32BIT, 1);
13762 else if (!strcmp (default_arch, "iamcu"))
13763 {
13764 update_code_flag (CODE_32BIT, 1);
13765 if (cpu_arch_isa == PROCESSOR_UNKNOWN)
13766 {
13767 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
13768 cpu_arch_name = "iamcu";
13769 cpu_sub_arch_name = NULL;
13770 cpu_arch_flags = iamcu_flags;
13771 cpu_arch_isa = PROCESSOR_IAMCU;
13772 cpu_arch_isa_flags = iamcu_flags;
13773 if (!cpu_arch_tune_set)
13774 {
13775 cpu_arch_tune = cpu_arch_isa;
13776 cpu_arch_tune_flags = cpu_arch_isa_flags;
13777 }
13778 }
13779 else if (cpu_arch_isa != PROCESSOR_IAMCU)
13780 as_fatal (_("Intel MCU doesn't support `%s' architecture"),
13781 cpu_arch_name);
13782 }
13783 else
13784 as_fatal (_("unknown architecture"));
13785
13786 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
13787 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13788 if (cpu_flags_all_zero (&cpu_arch_tune_flags))
13789 cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13790
13791 switch (OUTPUT_FLAVOR)
13792 {
13793 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
13794 case bfd_target_aout_flavour:
13795 return AOUT_TARGET_FORMAT;
13796 #endif
13797 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
13798 # if defined (TE_PE) || defined (TE_PEP)
13799 case bfd_target_coff_flavour:
13800 if (flag_code == CODE_64BIT)
13801 return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
13802 else
13803 return use_big_obj ? "pe-bigobj-i386" : "pe-i386";
13804 # elif defined (TE_GO32)
13805 case bfd_target_coff_flavour:
13806 return "coff-go32";
13807 # else
13808 case bfd_target_coff_flavour:
13809 return "coff-i386";
13810 # endif
13811 #endif
13812 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
13813 case bfd_target_elf_flavour:
13814 {
13815 const char *format;
13816
13817 switch (x86_elf_abi)
13818 {
13819 default:
13820 format = ELF_TARGET_FORMAT;
13821 #ifndef TE_SOLARIS
13822 tls_get_addr = "___tls_get_addr";
13823 #endif
13824 break;
13825 case X86_64_ABI:
13826 use_rela_relocations = 1;
13827 object_64bit = 1;
13828 #ifndef TE_SOLARIS
13829 tls_get_addr = "__tls_get_addr";
13830 #endif
13831 format = ELF_TARGET_FORMAT64;
13832 break;
13833 case X86_64_X32_ABI:
13834 use_rela_relocations = 1;
13835 object_64bit = 1;
13836 #ifndef TE_SOLARIS
13837 tls_get_addr = "__tls_get_addr";
13838 #endif
13839 disallow_64bit_reloc = 1;
13840 format = ELF_TARGET_FORMAT32;
13841 break;
13842 }
13843 if (cpu_arch_isa == PROCESSOR_L1OM)
13844 {
13845 if (x86_elf_abi != X86_64_ABI)
13846 as_fatal (_("Intel L1OM is 64bit only"));
13847 return ELF_TARGET_L1OM_FORMAT;
13848 }
13849 else if (cpu_arch_isa == PROCESSOR_K1OM)
13850 {
13851 if (x86_elf_abi != X86_64_ABI)
13852 as_fatal (_("Intel K1OM is 64bit only"));
13853 return ELF_TARGET_K1OM_FORMAT;
13854 }
13855 else if (cpu_arch_isa == PROCESSOR_IAMCU)
13856 {
13857 if (x86_elf_abi != I386_ABI)
13858 as_fatal (_("Intel MCU is 32bit only"));
13859 return ELF_TARGET_IAMCU_FORMAT;
13860 }
13861 else
13862 return format;
13863 }
13864 #endif
13865 #if defined (OBJ_MACH_O)
13866 case bfd_target_mach_o_flavour:
13867 if (flag_code == CODE_64BIT)
13868 {
13869 use_rela_relocations = 1;
13870 object_64bit = 1;
13871 return "mach-o-x86-64";
13872 }
13873 else
13874 return "mach-o-i386";
13875 #endif
13876 default:
13877 abort ();
13878 return NULL;
13879 }
13880 }
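/* Illustration: the strings returned depend on how the assembler was
   configured; on a typical GNU/Linux configuration the ELF branch above
   resolves to "elf32-i386" for --32, "elf64-x86-64" for --64 and
   "elf32-x86-64" for --x32.  */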
13881
13882 #endif /* OBJ_MAYBE_ more than one */
13883 \f
13884 symbolS *
13885 md_undefined_symbol (char *name)
13886 {
13887 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
13888 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
13889 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
13890 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
13891 {
13892 if (!GOT_symbol)
13893 {
13894 if (symbol_find (name))
13895 as_bad (_("GOT already in symbol table"));
13896 GOT_symbol = symbol_new (name, undefined_section,
13897 &zero_address_frag, 0);
13898 }
13899 return GOT_symbol;
13900 }
13901 return 0;
13902 }
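/* Example: the first reference to _GLOBAL_OFFSET_TABLE_, e.g. in a
   32-bit PIC prologue such as

       addl $_GLOBAL_OFFSET_TABLE_, %ebx

   lands here and creates GOT_symbol on demand; every later reference
   yields that same symbol.  */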
13903
13904 /* Round up a section size to the appropriate boundary. */
13905
13906 valueT
13907 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
13908 {
13909 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
13910 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
13911 {
13912 /* For a.out, force the section size to be aligned. If we don't do
13913 this, BFD will align it for us, but it will not write out the
13914 final bytes of the section. This may be a bug in BFD, but it is
13915 easier to fix it here since that is how the other a.out targets
13916 work. */
13917 int align;
13918
13919 align = bfd_section_alignment (segment);
13920 size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
13921 }
13922 #endif
13923
13924 return size;
13925 }
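/* Worked example for the a.out rounding above: with a section alignment
   of 2 (i.e. 4 bytes), a size of 10 becomes (10 + 4 - 1) & -4 == 12,
   while an already aligned size is returned unchanged.  */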
13926
13927 /* On the i386, PC-relative offsets are relative to the start of the
13928 next instruction. That is, the address of the offset, plus its
13929 size, since the offset is always the last part of the insn. */
13930
13931 long
13932 md_pcrel_from (fixS *fixP)
13933 {
13934 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
13935 }
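/* Example: assuming a frag at address 0x100 holding "call foo" (opcode
   0xe8 followed by a 4-byte displacement), the fixup has fx_where == 1
   and fx_size == 4, so this returns 0x105 -- the address of the next
   instruction, to which the CPU adds the displacement.  */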
13936
13937 #ifndef I386COFF
13938
13939 static void
13940 s_bss (int ignore ATTRIBUTE_UNUSED)
13941 {
13942 int temp;
13943
13944 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13945 if (IS_ELF)
13946 obj_elf_section_change_hook ();
13947 #endif
13948 temp = get_absolute_expression ();
13949 subseg_set (bss_section, (subsegT) temp);
13950 demand_empty_rest_of_line ();
13951 }
13952
13953 #endif
13954
13955 /* Remember constant directive. */
13956
13957 void
13958 i386_cons_align (int ignore ATTRIBUTE_UNUSED)
13959 {
13960 if (last_insn.kind != last_insn_directive
13961 && (bfd_section_flags (now_seg) & SEC_CODE))
13962 {
13963 last_insn.seg = now_seg;
13964 last_insn.kind = last_insn_directive;
13965 last_insn.name = "constant directive";
13966 last_insn.file = as_where (&last_insn.line);
13967 if (lfence_before_ret != lfence_before_ret_none)
13968 {
13969 if (lfence_before_indirect_branch != lfence_branch_none)
13970 as_warn (_("constant directive skips -mlfence-before-ret "
13971 "and -mlfence-before-indirect-branch"));
13972 else
13973 as_warn (_("constant directive skips -mlfence-before-ret"));
13974 }
13975 else if (lfence_before_indirect_branch != lfence_branch_none)
13976 as_warn (_("constant directive skips -mlfence-before-indirect-branch"));
13977 }
13978 }
13979
13980 void
13981 i386_validate_fix (fixS *fixp)
13982 {
13983 if (fixp->fx_subsy)
13984 {
13985 if (fixp->fx_subsy == GOT_symbol)
13986 {
13987 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
13988 {
13989 if (!object_64bit)
13990 abort ();
13991 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13992 if (fixp->fx_tcbit2)
13993 fixp->fx_r_type = (fixp->fx_tcbit
13994 ? BFD_RELOC_X86_64_REX_GOTPCRELX
13995 : BFD_RELOC_X86_64_GOTPCRELX);
13996 else
13997 #endif
13998 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
13999 }
14000 else
14001 {
14002 if (!object_64bit)
14003 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
14004 else
14005 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
14006 }
14007 fixp->fx_subsy = 0;
14008 }
14009 }
14010 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14011 else
14012 {
14013 /* NB: Commit 292676c1 resolved PLT32 relocations against local
14014 symbols to sections.  Since a PLT32 relocation must be against a
14015 symbol, turn such a PLT32 relocation into a PC32 relocation.  */
14016 if (fixp->fx_addsy
14017 && (fixp->fx_r_type == BFD_RELOC_386_PLT32
14018 || fixp->fx_r_type == BFD_RELOC_X86_64_PLT32)
14019 && symbol_section_p (fixp->fx_addsy))
14020 fixp->fx_r_type = BFD_RELOC_32_PCREL;
14021 if (!object_64bit)
14022 {
14023 if (fixp->fx_r_type == BFD_RELOC_386_GOT32
14024 && fixp->fx_tcbit2)
14025 fixp->fx_r_type = BFD_RELOC_386_GOT32X;
14026 }
14027 }
14028 #endif
14029 }
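/* Example for the PLT32 rewrite above: a "call foo@PLT" whose target
   got resolved to a local section symbol means the same thing as a
   direct pc-relative call, so its relocation is demoted to
   BFD_RELOC_32_PCREL instead of leaving a PLT32 against a section.  */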
14030
14031 arelent *
14032 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
14033 {
14034 arelent *rel;
14035 bfd_reloc_code_real_type code;
14036
14037 switch (fixp->fx_r_type)
14038 {
14039 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14040 case BFD_RELOC_SIZE32:
14041 case BFD_RELOC_SIZE64:
14042 if (S_IS_DEFINED (fixp->fx_addsy)
14043 && !S_IS_EXTERNAL (fixp->fx_addsy))
14044 {
14045 /* Resolve a size relocation against a local symbol to the
14046 symbol's size plus the addend.  */
14047 valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
14048 if (fixp->fx_r_type == BFD_RELOC_SIZE32
14049 && !fits_in_unsigned_long (value))
14050 as_bad_where (fixp->fx_file, fixp->fx_line,
14051 _("symbol size computation overflow"));
14052 fixp->fx_addsy = NULL;
14053 fixp->fx_subsy = NULL;
14054 md_apply_fix (fixp, (valueT *) &value, NULL);
14055 return NULL;
14056 }
14057 #endif
14058 /* Fall through. */
14059
14060 case BFD_RELOC_X86_64_PLT32:
14061 case BFD_RELOC_X86_64_GOT32:
14062 case BFD_RELOC_X86_64_GOTPCREL:
14063 case BFD_RELOC_X86_64_GOTPCRELX:
14064 case BFD_RELOC_X86_64_REX_GOTPCRELX:
14065 case BFD_RELOC_386_PLT32:
14066 case BFD_RELOC_386_GOT32:
14067 case BFD_RELOC_386_GOT32X:
14068 case BFD_RELOC_386_GOTOFF:
14069 case BFD_RELOC_386_GOTPC:
14070 case BFD_RELOC_386_TLS_GD:
14071 case BFD_RELOC_386_TLS_LDM:
14072 case BFD_RELOC_386_TLS_LDO_32:
14073 case BFD_RELOC_386_TLS_IE_32:
14074 case BFD_RELOC_386_TLS_IE:
14075 case BFD_RELOC_386_TLS_GOTIE:
14076 case BFD_RELOC_386_TLS_LE_32:
14077 case BFD_RELOC_386_TLS_LE:
14078 case BFD_RELOC_386_TLS_GOTDESC:
14079 case BFD_RELOC_386_TLS_DESC_CALL:
14080 case BFD_RELOC_X86_64_TLSGD:
14081 case BFD_RELOC_X86_64_TLSLD:
14082 case BFD_RELOC_X86_64_DTPOFF32:
14083 case BFD_RELOC_X86_64_DTPOFF64:
14084 case BFD_RELOC_X86_64_GOTTPOFF:
14085 case BFD_RELOC_X86_64_TPOFF32:
14086 case BFD_RELOC_X86_64_TPOFF64:
14087 case BFD_RELOC_X86_64_GOTOFF64:
14088 case BFD_RELOC_X86_64_GOTPC32:
14089 case BFD_RELOC_X86_64_GOT64:
14090 case BFD_RELOC_X86_64_GOTPCREL64:
14091 case BFD_RELOC_X86_64_GOTPC64:
14092 case BFD_RELOC_X86_64_GOTPLT64:
14093 case BFD_RELOC_X86_64_PLTOFF64:
14094 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
14095 case BFD_RELOC_X86_64_TLSDESC_CALL:
14096 case BFD_RELOC_RVA:
14097 case BFD_RELOC_VTABLE_ENTRY:
14098 case BFD_RELOC_VTABLE_INHERIT:
14099 #ifdef TE_PE
14100 case BFD_RELOC_32_SECREL:
14101 #endif
14102 code = fixp->fx_r_type;
14103 break;
14104 case BFD_RELOC_X86_64_32S:
14105 if (!fixp->fx_pcrel)
14106 {
14107 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
14108 code = fixp->fx_r_type;
14109 break;
14110 }
14111 /* Fall through. */
14112 default:
14113 if (fixp->fx_pcrel)
14114 {
14115 switch (fixp->fx_size)
14116 {
14117 default:
14118 as_bad_where (fixp->fx_file, fixp->fx_line,
14119 _("can not do %d byte pc-relative relocation"),
14120 fixp->fx_size);
14121 code = BFD_RELOC_32_PCREL;
14122 break;
14123 case 1: code = BFD_RELOC_8_PCREL; break;
14124 case 2: code = BFD_RELOC_16_PCREL; break;
14125 case 4: code = BFD_RELOC_32_PCREL; break;
14126 #ifdef BFD64
14127 case 8: code = BFD_RELOC_64_PCREL; break;
14128 #endif
14129 }
14130 }
14131 else
14132 {
14133 switch (fixp->fx_size)
14134 {
14135 default:
14136 as_bad_where (fixp->fx_file, fixp->fx_line,
14137 _("can not do %d byte relocation"),
14138 fixp->fx_size);
14139 code = BFD_RELOC_32;
14140 break;
14141 case 1: code = BFD_RELOC_8; break;
14142 case 2: code = BFD_RELOC_16; break;
14143 case 4: code = BFD_RELOC_32; break;
14144 #ifdef BFD64
14145 case 8: code = BFD_RELOC_64; break;
14146 #endif
14147 }
14148 }
14149 break;
14150 }
14151
14152 if ((code == BFD_RELOC_32
14153 || code == BFD_RELOC_32_PCREL
14154 || code == BFD_RELOC_X86_64_32S)
14155 && GOT_symbol
14156 && fixp->fx_addsy == GOT_symbol)
14157 {
14158 if (!object_64bit)
14159 code = BFD_RELOC_386_GOTPC;
14160 else
14161 code = BFD_RELOC_X86_64_GOTPC32;
14162 }
14163 if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
14164 && GOT_symbol
14165 && fixp->fx_addsy == GOT_symbol)
14166 {
14167 code = BFD_RELOC_X86_64_GOTPC64;
14168 }
14169
14170 rel = XNEW (arelent);
14171 rel->sym_ptr_ptr = XNEW (asymbol *);
14172 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
14173
14174 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
14175
14176 if (!use_rela_relocations)
14177 {
14178 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
14179 vtable entry to be used in the relocation's section offset. */
14180 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
14181 rel->address = fixp->fx_offset;
14182 #if defined (OBJ_COFF) && defined (TE_PE)
14183 else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
14184 rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
14185 else
14186 #endif
14187 rel->addend = 0;
14188 }
14189 /* Use RELA relocations in 64-bit mode.  */
14190 else
14191 {
14192 if (disallow_64bit_reloc)
14193 switch (code)
14194 {
14195 case BFD_RELOC_X86_64_DTPOFF64:
14196 case BFD_RELOC_X86_64_TPOFF64:
14197 case BFD_RELOC_64_PCREL:
14198 case BFD_RELOC_X86_64_GOTOFF64:
14199 case BFD_RELOC_X86_64_GOT64:
14200 case BFD_RELOC_X86_64_GOTPCREL64:
14201 case BFD_RELOC_X86_64_GOTPC64:
14202 case BFD_RELOC_X86_64_GOTPLT64:
14203 case BFD_RELOC_X86_64_PLTOFF64:
14204 as_bad_where (fixp->fx_file, fixp->fx_line,
14205 _("cannot represent relocation type %s in x32 mode"),
14206 bfd_get_reloc_code_name (code));
14207 break;
14208 default:
14209 break;
14210 }
14211
14212 if (!fixp->fx_pcrel)
14213 rel->addend = fixp->fx_offset;
14214 else
14215 switch (code)
14216 {
14217 case BFD_RELOC_X86_64_PLT32:
14218 case BFD_RELOC_X86_64_GOT32:
14219 case BFD_RELOC_X86_64_GOTPCREL:
14220 case BFD_RELOC_X86_64_GOTPCRELX:
14221 case BFD_RELOC_X86_64_REX_GOTPCRELX:
14222 case BFD_RELOC_X86_64_TLSGD:
14223 case BFD_RELOC_X86_64_TLSLD:
14224 case BFD_RELOC_X86_64_GOTTPOFF:
14225 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
14226 case BFD_RELOC_X86_64_TLSDESC_CALL:
14227 rel->addend = fixp->fx_offset - fixp->fx_size;
14228 break;
14229 default:
14230 rel->addend = (section->vma
14231 - fixp->fx_size
14232 + fixp->fx_addnumber
14233 + md_pcrel_from (fixp));
14234 break;
14235 }
14236 }
14237
14238 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
14239 if (rel->howto == NULL)
14240 {
14241 as_bad_where (fixp->fx_file, fixp->fx_line,
14242 _("cannot represent relocation type %s"),
14243 bfd_get_reloc_code_name (code));
14244 /* Set howto to a garbage value so that we can keep going. */
14245 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
14246 gas_assert (rel->howto != NULL);
14247 }
14248
14249 return rel;
14250 }
14251
14252 #include "tc-i386-intel.c"
14253
14254 void
14255 tc_x86_parse_to_dw2regnum (expressionS *exp)
14256 {
14257 int saved_naked_reg;
14258 char saved_register_dot;
14259
14260 saved_naked_reg = allow_naked_reg;
14261 allow_naked_reg = 1;
14262 saved_register_dot = register_chars['.'];
14263 register_chars['.'] = '.';
14264 allow_pseudo_reg = 1;
14265 expression_and_evaluate (exp);
14266 allow_pseudo_reg = 0;
14267 register_chars['.'] = saved_register_dot;
14268 allow_naked_reg = saved_naked_reg;
14269
14270 if (exp->X_op == O_register && exp->X_add_number >= 0)
14271 {
14272 if ((addressT) exp->X_add_number < i386_regtab_size)
14273 {
14274 exp->X_op = O_constant;
14275 exp->X_add_number = i386_regtab[exp->X_add_number]
14276 .dw2_regnum[flag_code >> 1];
14277 }
14278 else
14279 exp->X_op = O_illegal;
14280 }
14281 }
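/* Examples (standard psABI DWARF numbering): "esp" resolves to register
   number 4 when assembling 32-bit code and "rsp" to 7 in 64-bit code; a
   register index at or beyond i386_regtab_size is marked O_illegal.  */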
14282
14283 void
14284 tc_x86_frame_initial_instructions (void)
14285 {
14286 static unsigned int sp_regno[2];
14287
14288 if (!sp_regno[flag_code >> 1])
14289 {
14290 char *saved_input = input_line_pointer;
14291 char sp[][4] = {"esp", "rsp"};
14292 expressionS exp;
14293
14294 input_line_pointer = sp[flag_code >> 1];
14295 tc_x86_parse_to_dw2regnum (&exp);
14296 gas_assert (exp.X_op == O_constant);
14297 sp_regno[flag_code >> 1] = exp.X_add_number;
14298 input_line_pointer = saved_input;
14299 }
14300
14301 cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
14302 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
14303 }
14304
14305 int
14306 x86_dwarf2_addr_size (void)
14307 {
14308 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
14309 if (x86_elf_abi == X86_64_X32_ABI)
14310 return 4;
14311 #endif
14312 return bfd_arch_bits_per_address (stdoutput) / 8;
14313 }
14314
14315 int
14316 i386_elf_section_type (const char *str, size_t len)
14317 {
14318 if (flag_code == CODE_64BIT
14319 && len == sizeof ("unwind") - 1
14320 && strncmp (str, "unwind", 6) == 0)
14321 return SHT_X86_64_UNWIND;
14322
14323 return -1;
14324 }
14325
14326 #ifdef TE_SOLARIS
14327 void
14328 i386_solaris_fix_up_eh_frame (segT sec)
14329 {
14330 if (flag_code == CODE_64BIT)
14331 elf_section_type (sec) = SHT_X86_64_UNWIND;
14332 }
14333 #endif
14334
14335 #ifdef TE_PE
14336 void
14337 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
14338 {
14339 expressionS exp;
14340
14341 exp.X_op = O_secrel;
14342 exp.X_add_symbol = symbol;
14343 exp.X_add_number = 0;
14344 emit_expr (&exp, size);
14345 }
14346 #endif
14347
14348 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14349 /* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
14350
14351 bfd_vma
14352 x86_64_section_letter (int letter, const char **ptr_msg)
14353 {
14354 if (flag_code == CODE_64BIT)
14355 {
14356 if (letter == 'l')
14357 return SHF_X86_64_LARGE;
14358
14359 *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
14360 }
14361 else
14362 *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
14363 return -1;
14364 }
14365
14366 bfd_vma
14367 x86_64_section_word (char *str, size_t len)
14368 {
14369 if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
14370 return SHF_X86_64_LARGE;
14371
14372 return -1;
14373 }
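/* Example: in 64-bit mode a directive such as

       .section .ldata,"awl",@progbits

   uses the 'l' flag letter accepted above to set SHF_X86_64_LARGE; in
   32-bit code the same letter draws the "bad .section directive"
   diagnostic.  */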
14374
14375 static void
14376 handle_large_common (int small ATTRIBUTE_UNUSED)
14377 {
14378 if (flag_code != CODE_64BIT)
14379 {
14380 s_comm_internal (0, elf_common_parse);
14381 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
14382 }
14383 else
14384 {
14385 static segT lbss_section;
14386 asection *saved_com_section_ptr = elf_com_section_ptr;
14387 asection *saved_bss_section = bss_section;
14388
14389 if (lbss_section == NULL)
14390 {
14391 flagword applicable;
14392 segT seg = now_seg;
14393 subsegT subseg = now_subseg;
14394
14395 /* The .lbss section is for local .largecomm symbols. */
14396 lbss_section = subseg_new (".lbss", 0);
14397 applicable = bfd_applicable_section_flags (stdoutput);
14398 bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
14399 seg_info (lbss_section)->bss = 1;
14400
14401 subseg_set (seg, subseg);
14402 }
14403
14404 elf_com_section_ptr = &_bfd_elf_large_com_section;
14405 bss_section = lbss_section;
14406
14407 s_comm_internal (0, elf_common_parse);
14408
14409 elf_com_section_ptr = saved_com_section_ptr;
14410 bss_section = saved_bss_section;
14411 }
14412 }
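/* Example: in 64-bit mode

       .largecomm sym, 16, 8

   allocates a 16-byte common symbol with 8-byte alignment against the
   large common section (or locally in the .lbss section set up above);
   in 32-bit mode the directive is handled as a plain .comm plus a
   warning.  */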
14413 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */